mbsinit.c 2.3 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970
  1. /* Test for initial conversion state.
  2. Copyright (C) 2008-2023 Free Software Foundation, Inc.
  3. Written by Bruno Haible <bruno@clisp.org>, 2008.
  4. This file is free software: you can redistribute it and/or modify
  5. it under the terms of the GNU Lesser General Public License as
  6. published by the Free Software Foundation; either version 2.1 of the
  7. License, or (at your option) any later version.
  8. This file is distributed in the hope that it will be useful,
  9. but WITHOUT ANY WARRANTY; without even the implied warranty of
  10. MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  11. GNU Lesser General Public License for more details.
  12. You should have received a copy of the GNU Lesser General Public License
  13. along with this program. If not, see <https://www.gnu.org/licenses/>. */
  14. #include <config.h>
  15. /* Specification. */
  16. #include <wchar.h>
  17. #if GNULIB_defined_mbstate_t
  18. /* Platforms that lack mbsinit() also lack mbrlen(), mbrtowc(), mbsrtowcs()
  19. and wcrtomb(), wcsrtombs().
  20. We assume that
  21. - sizeof (mbstate_t) >= 4,
  22. - only stateless encodings are supported (such as UTF-8 and EUC-JP, but
  23. not ISO-2022 variants),
  24. - for each encoding, the number of bytes for a wide character is <= 4.
  25. (This maximum is attained for UTF-8, GB18030, EUC-TW.)
  26. We define the meaning of mbstate_t as follows:
  27. - In mb -> wc direction, mbstate_t's first byte contains the number of
  28. buffered bytes (in the range 0..3), followed by up to 3 buffered bytes.
  29. See mbrtowc.c.
  30. - In wc -> mb direction, mbstate_t contains no information. In other
  31. words, it is always in the initial state. */
  32. static_assert (sizeof (mbstate_t) >= 4);
  33. int
  34. mbsinit (const mbstate_t *ps)
  35. {
  36. const char *pstate = (const char *)ps;
  37. return pstate == NULL || pstate[0] == 0;
  38. }
  39. #else
  40. int
  41. mbsinit (const mbstate_t *ps)
  42. {
  43. # if defined _WIN32 && !defined __CYGWIN__
  44. /* Native Windows. */
  45. /* MSVC defines 'mbstate_t' as an 8-byte struct; the first 4 bytes matter.
  46. On mingw, 'mbstate_t' is sometimes defined as 'int', sometimes defined as
  47. an 8-byte struct, of which the first 4 bytes matter. */
  48. return ps == NULL || *(const unsigned int *)ps == 0;
  49. # else
  50. /* Minix, HP-UX 11.00, Solaris 2.6, Interix, ... */
  51. /* Maybe this definition works, maybe not... */
  52. return ps == NULL || *(const char *)ps == 0;
  53. # endif
  54. }
  55. #endif