mbrtowc.c 833 B

1234567891011121314151617181920212223242526272829
  1. #include <stdio.h>
  2. #include <string.h>
  3. #include <wchar.h>
  4. int main(void) {
  5. mbstate_t state;
  6. memset(&state, 0, sizeof state);
  7. char in[] = u8"z\u00df\u6c34\U0001F34C"; // or u8"zß水🍌"
  8. size_t in_sz = sizeof in / sizeof *in;
  9. printf("Processing %zu UTF-8 code units: [ ", in_sz); //Should be 11 regular chars
  10. for(size_t n = 0; n < in_sz; ++n) printf("%#x ", (unsigned char)in[n]);
  11. puts("]");
  12. wchar_t out[in_sz];
  13. char *p_in = in, *end = in + in_sz;
  14. wchar_t *p_out = out;
  15. int rc;
  16. while((rc = mbrtowc(p_out, p_in, end - p_in, &state)) > 0)
  17. {
  18. p_in += rc;
  19. p_out += 1;
  20. }
  21. size_t out_sz = p_out - out + 1;
  22. printf("into %zu wchar_t units: [ ", out_sz); //Should be 5 wchars
  23. for(size_t x = 0; x < out_sz; ++x) printf("%#x ", out[x]);
  24. puts("]");
  25. }