Comparison

util-src/encodings.c @ 3769:9338d0785277

util-src/Makefile, util-src/encodings.c{,pp}: Port ICU code to C, rename encodings.cpp back to .c and amend the Makefile accordingly
author Matthew Wild <mwild1@gmail.com>
date Fri, 17 Dec 2010 22:32:21 +0000
parent 3764:util-src/encodings.cpp@323169f229fa
child 3965:4ae4b2c0e99d
comparison
equal deleted inserted replaced
3768:01cc9cbcbd52 3769:9338d0785277
1 /* Prosody IM
2 -- Copyright (C) 2008-2010 Matthew Wild
3 -- Copyright (C) 2008-2010 Waqas Hussain
4 --
5 -- This project is MIT/X11 licensed. Please see the
6 -- COPYING file in the source package for more information.
7 --
8 */
9
10 /*
11 * encodings.c
12 * Lua library for base64, stringprep and idna encodings
13 */
14
15 // Newer MSVC compilers deprecate strcpy as unsafe, but we use it in a safe way
16 #define _CRT_SECURE_NO_DEPRECATE
17
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include "lua.h"
#include "lauxlib.h"
22
23 /***************** BASE64 *****************/
24
/* The base64 alphabet: the index of a symbol in this string is its 6-bit value. */
static const char code[] =
	"ABCDEFGHIJKLMNOPQRSTUVWXYZ"
	"abcdefghijklmnopqrstuvwxyz"
	"0123456789"
	"+/";
27
28 static void base64_encode(luaL_Buffer *b, unsigned int c1, unsigned int c2, unsigned int c3, int n)
29 {
30 unsigned long tuple=c3+256UL*(c2+256UL*c1);
31 int i;
32 char s[4];
33 for (i=0; i<4; i++) {
34 s[3-i] = code[tuple % 64];
35 tuple /= 64;
36 }
37 for (i=n+1; i<4; i++) s[i]='=';
38 luaL_addlstring(b,s,4);
39 }
40
41 static int Lbase64_encode(lua_State *L) /** encode(s) */
42 {
43 size_t l;
44 const unsigned char *s=(const unsigned char*)luaL_checklstring(L,1,&l);
45 luaL_Buffer b;
46 int n;
47 luaL_buffinit(L,&b);
48 for (n=l/3; n--; s+=3) base64_encode(&b,s[0],s[1],s[2],3);
49 switch (l%3)
50 {
51 case 1: base64_encode(&b,s[0],0,0,1); break;
52 case 2: base64_encode(&b,s[0],s[1],0,2); break;
53 }
54 luaL_pushresult(&b);
55 return 1;
56 }
57
58 static void base64_decode(luaL_Buffer *b, int c1, int c2, int c3, int c4, int n)
59 {
60 unsigned long tuple=c4+64L*(c3+64L*(c2+64L*c1));
61 char s[3];
62 switch (--n)
63 {
64 case 3: s[2]=(char) tuple;
65 case 2: s[1]=(char) (tuple >> 8);
66 case 1: s[0]=(char) (tuple >> 16);
67 }
68 luaL_addlstring(b,s,n);
69 }
70
71 static int Lbase64_decode(lua_State *L) /** decode(s) */
72 {
73 size_t l;
74 const char *s=luaL_checklstring(L,1,&l);
75 luaL_Buffer b;
76 int n=0;
77 char t[4];
78 luaL_buffinit(L,&b);
79 for (;;)
80 {
81 int c=*s++;
82 switch (c)
83 {
84 const char *p;
85 default:
86 p=strchr(code,c); if (p==NULL) return 0;
87 t[n++]= (char) (p-code);
88 if (n==4)
89 {
90 base64_decode(&b,t[0],t[1],t[2],t[3],4);
91 n=0;
92 }
93 break;
94 case '=':
95 switch (n)
96 {
97 case 1: base64_decode(&b,t[0],0,0,0,1); break;
98 case 2: base64_decode(&b,t[0],t[1],0,0,2); break;
99 case 3: base64_decode(&b,t[0],t[1],t[2],0,3); break;
100 }
101 n=0;
102 break;
103 case 0:
104 luaL_pushresult(&b);
105 return 1;
106 case '\n': case '\r': case '\t': case ' ': case '\f': case '\b':
107 break;
108 }
109 }
110 }
111
112 static const luaL_Reg Reg_base64[] =
113 {
114 { "encode", Lbase64_encode },
115 { "decode", Lbase64_decode },
116 { NULL, NULL }
117 };
118
119 /***************** STRINGPREP *****************/
120 #ifndef USE_STRINGPREP_ICU
121 /****************** libidn ********************/
122
123 #include <stringprep.h>
124
125 static int stringprep_prep(lua_State *L, const Stringprep_profile *profile)
126 {
127 size_t len;
128 const char *s;
129 char string[1024];
130 int ret;
131 if(!lua_isstring(L, 1)) {
132 lua_pushnil(L);
133 return 1;
134 }
135 s = lua_tolstring(L, 1, &len);
136 if (len >= 1024) {
137 lua_pushnil(L);
138 return 1; // TODO return error message
139 }
140 strcpy(string, s);
141 ret = stringprep(string, 1024, (Stringprep_profile_flags)0, profile);
142 if (ret == STRINGPREP_OK) {
143 lua_pushstring(L, string);
144 return 1;
145 } else {
146 lua_pushnil(L);
147 return 1; // TODO return error message
148 }
149 }
150
151 #define MAKE_PREP_FUNC(myFunc, prep) \
152 static int myFunc(lua_State *L) { return stringprep_prep(L, prep); }
153
154 MAKE_PREP_FUNC(Lstringprep_nameprep, stringprep_nameprep) /** stringprep.nameprep(s) */
155 MAKE_PREP_FUNC(Lstringprep_nodeprep, stringprep_xmpp_nodeprep) /** stringprep.nodeprep(s) */
156 MAKE_PREP_FUNC(Lstringprep_resourceprep, stringprep_xmpp_resourceprep) /** stringprep.resourceprep(s) */
157 MAKE_PREP_FUNC(Lstringprep_saslprep, stringprep_saslprep) /** stringprep.saslprep(s) */
158
159 static const luaL_Reg Reg_stringprep[] =
160 {
161 { "nameprep", Lstringprep_nameprep },
162 { "nodeprep", Lstringprep_nodeprep },
163 { "resourceprep", Lstringprep_resourceprep },
164 { "saslprep", Lstringprep_saslprep },
165 { NULL, NULL }
166 };
167
168 #else
169 #include <unicode/usprep.h>
170 #include <unicode/ustring.h>
171 #include <unicode/utrace.h>
172
173 static int icu_stringprep_prep(lua_State *L, const UStringPrepProfile *profile)
174 {
175 size_t input_len;
176 int32_t unprepped_len, prepped_len, output_len;
177 const char *input;
178 char output[1024];
179
180 UChar unprepped[1024]; /* Temporary unicode buffer (1024 characters) */
181 UChar prepped[1024];
182
183 UErrorCode err = U_ZERO_ERROR;
184
185 if(!lua_isstring(L, 1)) {
186 lua_pushnil(L);
187 return 1;
188 }
189 input = lua_tolstring(L, 1, &input_len);
190 if (input_len >= 1024) {
191 lua_pushnil(L);
192 return 1;
193 }
194 u_strFromUTF8(unprepped, 1024, &unprepped_len, input, input_len, &err);
195 prepped_len = usprep_prepare(profile, unprepped, unprepped_len, prepped, 1024, 0, NULL, &err);
196 if (U_FAILURE(err)) {
197 lua_pushnil(L);
198 return 1;
199 } else {
200 u_strToUTF8(output, 1024, &output_len, prepped, prepped_len, &err);
201 if(output_len < 1024)
202 lua_pushlstring(L, output, output_len);
203 else
204 lua_pushnil(L);
205 return 1;
206 }
207 }
208
209 UStringPrepProfile *icu_nameprep;
210 UStringPrepProfile *icu_nodeprep;
211 UStringPrepProfile *icu_resourceprep;
212 UStringPrepProfile *icu_saslprep;
213
214 /* initialize global ICU stringprep profiles */
215 void init_icu()
216 {
217 UErrorCode err = U_ZERO_ERROR;
218 utrace_setLevel(UTRACE_VERBOSE);
219 icu_nameprep = usprep_openByType(USPREP_RFC3491_NAMEPREP, &err);
220 icu_nodeprep = usprep_openByType(USPREP_RFC3920_NODEPREP, &err);
221 icu_resourceprep = usprep_openByType(USPREP_RFC3920_RESOURCEPREP, &err);
222 icu_saslprep = usprep_openByType(USPREP_RFC4013_SASLPREP, &err);
223 if (U_FAILURE(err)) fprintf(stderr, "[c] util.encodings: error: %s\n", u_errorName((UErrorCode)err));
224 }
225
226 #define MAKE_PREP_FUNC(myFunc, prep) \
227 static int myFunc(lua_State *L) { return icu_stringprep_prep(L, prep); }
228
229 MAKE_PREP_FUNC(Lstringprep_nameprep, icu_nameprep) /** stringprep.nameprep(s) */
230 MAKE_PREP_FUNC(Lstringprep_nodeprep, icu_nodeprep) /** stringprep.nodeprep(s) */
231 MAKE_PREP_FUNC(Lstringprep_resourceprep, icu_resourceprep) /** stringprep.resourceprep(s) */
232 MAKE_PREP_FUNC(Lstringprep_saslprep, icu_saslprep) /** stringprep.saslprep(s) */
233
234 static const luaL_Reg Reg_stringprep[] =
235 {
236 { "nameprep", Lstringprep_nameprep },
237 { "nodeprep", Lstringprep_nodeprep },
238 { "resourceprep", Lstringprep_resourceprep },
239 { "saslprep", Lstringprep_saslprep },
240 { NULL, NULL }
241 };
242 #endif
243
244 /***************** IDNA *****************/
245 #ifndef USE_STRINGPREP_ICU
246 /****************** libidn ********************/
247
248 #include <idna.h>
249 #include <idn-free.h>
250
251 static int Lidna_to_ascii(lua_State *L) /** idna.to_ascii(s) */
252 {
253 size_t len;
254 const char *s = luaL_checklstring(L, 1, &len);
255 char* output = NULL;
256 int ret = idna_to_ascii_8z(s, &output, IDNA_USE_STD3_ASCII_RULES);
257 if (ret == IDNA_SUCCESS) {
258 lua_pushstring(L, output);
259 idn_free(output);
260 return 1;
261 } else {
262 lua_pushnil(L);
263 idn_free(output);
264 return 1; // TODO return error message
265 }
266 }
267
268 static int Lidna_to_unicode(lua_State *L) /** idna.to_unicode(s) */
269 {
270 size_t len;
271 const char *s = luaL_checklstring(L, 1, &len);
272 char* output = NULL;
273 int ret = idna_to_unicode_8z8z(s, &output, 0);
274 if (ret == IDNA_SUCCESS) {
275 lua_pushstring(L, output);
276 idn_free(output);
277 return 1;
278 } else {
279 lua_pushnil(L);
280 idn_free(output);
281 return 1; // TODO return error message
282 }
283 }
284 #else
285 #include <unicode/ustdio.h>
286 #include <unicode/uidna.h>
287 /* IDNA2003 or IDNA2008 ? ? ? */
288 static int Lidna_to_ascii(lua_State *L) /** idna.to_ascii(s) */
289 {
290 size_t len;
291 int32_t ulen, dest_len, output_len;
292 const char *s = luaL_checklstring(L, 1, &len);
293 UChar ustr[1024];
294 UErrorCode err = U_ZERO_ERROR;
295 UChar dest[1024];
296 char output[1024];
297
298 u_strFromUTF8(ustr, 1024, &ulen, s, len, &err);
299 dest_len = uidna_IDNToASCII(ustr, ulen, dest, 1024, UIDNA_USE_STD3_RULES, NULL, &err);
300 if (U_FAILURE(err)) {
301 lua_pushnil(L);
302 return 1;
303 } else {
304 u_strToUTF8(output, 1024, &output_len, dest, dest_len, &err);
305 if(output_len < 1024)
306 lua_pushlstring(L, output, output_len);
307 else
308 lua_pushnil(L);
309 return 1;
310 }
311 }
312
313 static int Lidna_to_unicode(lua_State *L) /** idna.to_unicode(s) */
314 {
315 size_t len;
316 int32_t ulen, dest_len, output_len;
317 const char *s = luaL_checklstring(L, 1, &len);
318 UChar* ustr;
319 UErrorCode err = U_ZERO_ERROR;
320 UChar dest[1024];
321 char output[1024];
322
323 u_strFromUTF8(ustr, 1024, &ulen, s, len, &err);
324 dest_len = uidna_IDNToUnicode(ustr, ulen, dest, 1024, UIDNA_USE_STD3_RULES, NULL, &err);
325 if (U_FAILURE(err)) {
326 lua_pushnil(L);
327 return 1;
328 } else {
329 u_strToUTF8(output, 1024, &output_len, dest, dest_len, &err);
330 if(output_len < 1024)
331 lua_pushlstring(L, output, output_len);
332 else
333 lua_pushnil(L);
334 return 1;
335 }
336 }
337 #endif
338
339 static const luaL_Reg Reg_idna[] =
340 {
341 { "to_ascii", Lidna_to_ascii },
342 { "to_unicode", Lidna_to_unicode },
343 { NULL, NULL }
344 };
345
346 /***************** end *****************/
347
348 static const luaL_Reg Reg[] =
349 {
350 { NULL, NULL }
351 };
352
353 LUALIB_API int luaopen_util_encodings(lua_State *L)
354 {
355 #ifdef USE_STRINGPREP_ICU
356 init_icu();
357 #endif
358 luaL_register(L, "encodings", Reg);
359
360 lua_pushliteral(L, "base64");
361 lua_newtable(L);
362 luaL_register(L, NULL, Reg_base64);
363 lua_settable(L,-3);
364
365 lua_pushliteral(L, "stringprep");
366 lua_newtable(L);
367 luaL_register(L, NULL, Reg_stringprep);
368 lua_settable(L,-3);
369
370 lua_pushliteral(L, "idna");
371 lua_newtable(L);
372 luaL_register(L, NULL, Reg_idna);
373 lua_settable(L,-3);
374
375 lua_pushliteral(L, "version"); /** version */
376 lua_pushliteral(L, "-3.14");
377 lua_settable(L,-3);
378 return 1;
379 }