1*cf5a6c84SAndroid Build Coastguard Worker /* demo_utf8towc() against libc mbrtowc()
2*cf5a6c84SAndroid Build Coastguard Worker *
3*cf5a6c84SAndroid Build Coastguard Worker * Copyright 2017 Rob Landley <[email protected]>
4*cf5a6c84SAndroid Build Coastguard Worker
5*cf5a6c84SAndroid Build Coastguard Worker USE_DEMO_UTF8TOWC(NEWTOY(demo_utf8towc, 0, TOYFLAG_USR|TOYFLAG_BIN))
6*cf5a6c84SAndroid Build Coastguard Worker
7*cf5a6c84SAndroid Build Coastguard Worker config DEMO_UTF8TOWC
8*cf5a6c84SAndroid Build Coastguard Worker bool "demo_utf8towc"
9*cf5a6c84SAndroid Build Coastguard Worker default n
10*cf5a6c84SAndroid Build Coastguard Worker help
11*cf5a6c84SAndroid Build Coastguard Worker usage: demo_utf8towc
12*cf5a6c84SAndroid Build Coastguard Worker
13*cf5a6c84SAndroid Build Coastguard Worker Print differences between toybox's utf8 conversion routines vs libc du jour.
14*cf5a6c84SAndroid Build Coastguard Worker */
15*cf5a6c84SAndroid Build Coastguard Worker
16*cf5a6c84SAndroid Build Coastguard Worker #include "toys.h"
17*cf5a6c84SAndroid Build Coastguard Worker
demo_utf8towc_main(void)18*cf5a6c84SAndroid Build Coastguard Worker void demo_utf8towc_main(void)
19*cf5a6c84SAndroid Build Coastguard Worker {
20*cf5a6c84SAndroid Build Coastguard Worker mbstate_t mb;
21*cf5a6c84SAndroid Build Coastguard Worker int len1, len2, maxlen = 0;
22*cf5a6c84SAndroid Build Coastguard Worker unsigned h, u, wc2;
23*cf5a6c84SAndroid Build Coastguard Worker wchar_t wc1;
24*cf5a6c84SAndroid Build Coastguard Worker char *str = (void *)&h;
25*cf5a6c84SAndroid Build Coastguard Worker
26*cf5a6c84SAndroid Build Coastguard Worker memset(&mb, 0, sizeof(mb));
27*cf5a6c84SAndroid Build Coastguard Worker // Although there are 0x10ffff unicode points, test all 4 byte combinations.
28*cf5a6c84SAndroid Build Coastguard Worker for (u = 1; u;) {
29*cf5a6c84SAndroid Build Coastguard Worker wc1 = wc2 = 0;
30*cf5a6c84SAndroid Build Coastguard Worker len2 = 4;
31*cf5a6c84SAndroid Build Coastguard Worker
32*cf5a6c84SAndroid Build Coastguard Worker h = SWAP_BE32(u);
33*cf5a6c84SAndroid Build Coastguard Worker len1 = mbrtowc(&wc1, str, len2, &mb);
34*cf5a6c84SAndroid Build Coastguard Worker if (len1<0) memset(&mb, 0, sizeof(mb));
35*cf5a6c84SAndroid Build Coastguard Worker len2 = utf8towc(&wc2, str, len2);
36*cf5a6c84SAndroid Build Coastguard Worker
37*cf5a6c84SAndroid Build Coastguard Worker if (wcwidth(wc2)>maxlen) maxlen = wcwidth(wc2);
38*cf5a6c84SAndroid Build Coastguard Worker if (len1 != len2 || wc1 != wc2)
39*cf5a6c84SAndroid Build Coastguard Worker printf("%x %d %x %d %x\n", u++, len1, wc1, len2, wc2);
40*cf5a6c84SAndroid Build Coastguard Worker else if (len2<1) u++;
41*cf5a6c84SAndroid Build Coastguard Worker else {
42*cf5a6c84SAndroid Build Coastguard Worker h = 1<<(8*(4-len2));
43*cf5a6c84SAndroid Build Coastguard Worker u &= ~(h-1);
44*cf5a6c84SAndroid Build Coastguard Worker u += h;
45*cf5a6c84SAndroid Build Coastguard Worker }
46*cf5a6c84SAndroid Build Coastguard Worker
47*cf5a6c84SAndroid Build Coastguard Worker }
48*cf5a6c84SAndroid Build Coastguard Worker dprintf(2, "maxlen=%d\n", maxlen);
49*cf5a6c84SAndroid Build Coastguard Worker }
50