mbsinit.c 2.3 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970
  1. /* Test for initial conversion state.
  2. Copyright (C) 2008-2021 Free Software Foundation, Inc.
  3. Written by Bruno Haible <bruno@clisp.org>, 2008.
  4. This program is free software: you can redistribute it and/or modify
  5. it under the terms of the GNU General Public License as published by
  6. the Free Software Foundation; either version 3 of the License, or
  7. (at your option) any later version.
  8. This program is distributed in the hope that it will be useful,
  9. but WITHOUT ANY WARRANTY; without even the implied warranty of
  10. MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  11. GNU General Public License for more details.
  12. You should have received a copy of the GNU General Public License
  13. along with this program. If not, see <https://www.gnu.org/licenses/>. */
  14. #include <config.h>
  15. /* Specification. */
  16. #include <wchar.h>
  17. #include "verify.h"
  18. #if GNULIB_defined_mbstate_t
  19. /* Platforms that lack mbsinit() also lack mbrlen(), mbrtowc(), mbsrtowcs()
  20. and wcrtomb(), wcsrtombs().
  21. We assume that
  22. - sizeof (mbstate_t) >= 4,
  23. - only stateless encodings are supported (such as UTF-8 and EUC-JP, but
  24. not ISO-2022 variants),
  25. - for each encoding, the number of bytes for a wide character is <= 4.
  26. (This maximum is attained for UTF-8, GB18030, EUC-TW.)
  27. We define the meaning of mbstate_t as follows:
  28. - In mb -> wc direction, mbstate_t's first byte contains the number of
  29. buffered bytes (in the range 0..3), followed by up to 3 buffered bytes.
  30. See mbrtowc.c.
  31. - In wc -> mb direction, mbstate_t contains no information. In other
  32. words, it is always in the initial state. */
  33. verify (sizeof (mbstate_t) >= 4);
  34. int
  35. mbsinit (const mbstate_t *ps)
  36. {
  37. const char *pstate = (const char *)ps;
  38. return pstate == NULL || pstate[0] == 0;
  39. }
  40. #else
  41. int
  42. mbsinit (const mbstate_t *ps)
  43. {
  44. # if defined _WIN32 && !defined __CYGWIN__
  45. /* Native Windows. */
  46. /* MSVC defines 'mbstate_t' as an 8-byte struct; the first 4 bytes matter.
  47. On mingw, 'mbstate_t' is sometimes defined as 'int', sometimes defined as
  48. an 8-byte struct, of which the first 4 bytes matter. */
  49. return ps == NULL || *(const unsigned int *)ps == 0;
  50. # else
  51. /* Minix, HP-UX 11.00, Solaris 2.6, Interix, ... */
  52. /* Maybe this definition works, maybe not... */
  53. return ps == NULL || *(const char *)ps == 0;
  54. # endif
  55. }
  56. #endif