mbsinit.c 2.4 KB

1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768697071
  1. /* Test for initial conversion state.
  2. Copyright (C) 2008-2021 Free Software Foundation, Inc.
  3. Written by Bruno Haible <bruno@clisp.org>, 2008.
  4. This file is free software: you can redistribute it and/or modify
  5. it under the terms of the GNU Lesser General Public License as
  6. published by the Free Software Foundation; either version 2.1 of the
  7. License, or (at your option) any later version.
  8. This file is distributed in the hope that it will be useful,
  9. but WITHOUT ANY WARRANTY; without even the implied warranty of
  10. MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  11. GNU Lesser General Public License for more details.
  12. You should have received a copy of the GNU Lesser General Public License
  13. along with this program. If not, see <https://www.gnu.org/licenses/>. */
  14. #include <config.h>
  15. /* Specification. */
  16. #include <wchar.h>
  17. #include "verify.h"
  18. #if GNULIB_defined_mbstate_t
  19. /* Platforms that lack mbsinit() also lack mbrlen(), mbrtowc(), mbsrtowcs()
  20. and wcrtomb(), wcsrtombs().
  21. We assume that
  22. - sizeof (mbstate_t) >= 4,
  23. - only stateless encodings are supported (such as UTF-8 and EUC-JP, but
  24. not ISO-2022 variants),
  25. - for each encoding, the number of bytes for a wide character is <= 4.
  26. (This maximum is attained for UTF-8, GB18030, EUC-TW.)
  27. We define the meaning of mbstate_t as follows:
  28. - In mb -> wc direction, mbstate_t's first byte contains the number of
  29. buffered bytes (in the range 0..3), followed by up to 3 buffered bytes.
  30. See mbrtowc.c.
  31. - In wc -> mb direction, mbstate_t contains no information. In other
  32. words, it is always in the initial state. */
  33. verify (sizeof (mbstate_t) >= 4);
  34. int
  35. mbsinit (const mbstate_t *ps)
  36. {
  37. const char *pstate = (const char *)ps;
  38. return pstate == NULL || pstate[0] == 0;
  39. }
  40. #else
  41. int
  42. mbsinit (const mbstate_t *ps)
  43. {
  44. # if defined _WIN32 && !defined __CYGWIN__
  45. /* Native Windows. */
  46. /* MSVC defines 'mbstate_t' as an 8-byte struct; the first 4 bytes matter.
  47. On mingw, 'mbstate_t' is sometimes defined as 'int', sometimes defined as
  48. an 8-byte struct, of which the first 4 bytes matter. */
  49. return ps == NULL || *(const unsigned int *)ps == 0;
  50. # else
  51. /* Minix, HP-UX 11.00, Solaris 2.6, Interix, ... */
  52. /* Maybe this definition works, maybe not... */
  53. return ps == NULL || *(const char *)ps == 0;
  54. # endif
  55. }
  56. #endif