toybox/toys/example/demo_utf8towc.c
<<
>>
Prefs
   1/* demo_utf8towc() against libc mbrtowc()
   2 *
   3 * Copyright 2017 Rob Landley <rob@landley.net>
   4
   5USE_DEMO_UTF8TOWC(NEWTOY(demo_utf8towc, 0, TOYFLAG_USR|TOYFLAG_BIN))
   6
   7config DEMO_UTF8TOWC
   8  bool "demo_utf8towc"
   9  default n
  10  help
  11    usage: demo_utf8towc
  12
  13    Print differences between toybox's utf8 conversion routines vs libc du jour.
  14*/
  15
  16#include "toys.h"
  17
  18void demo_utf8towc_main(void)
  19{
  20  mbstate_t mb;
  21  int len1, len2;
  22  unsigned u, h, wc2;
  23  wchar_t wc1;
  24
  25  memset(&mb, 0, sizeof(mb));
  26  for (u = 1; u<=0x10ffff; u++) {
  27    char *str = (void *)&h;
  28
  29    wc1 = wc2 = 0;
  30    len2 = 4;
  31    h = htonl(u);
  32    while (!*str) str++, len2--;
  33
  34    len1 = mbrtowc(&wc1, str, len2, &mb);
  35    if (len1<0) memset(&mb, 0, sizeof(mb));
  36    len2 = utf8towc(&wc2, str, len2);
  37    if (len1 != len2 || wc1 != wc2)
  38      printf("%x %d %x %d %x\n", u, len1, wc1, len2, wc2);
  39  }
  40}
  41