gbku.h 2.5 KB

1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556
  1. /* This Source Code Form is subject to the terms of the Mozilla Public
  2. * License, v. 2.0. If a copy of the MPL was not distributed with this
  3. * file, You can obtain one at http://mozilla.org/MPL/2.0/. */
  4. // =======================================================================
  5. // Original Author: Yueheng Xu
  6. // email: yueheng.xu@intel.com
  7. // phone: (503)264-2248
  8. // Intel Corporation, Oregon, USA
  9. // Last Update: September 7, 1999
  10. // Revision History:
  11. // 09/07/1999 - initial version.
  12. // 09/28/1999 - changed leftbyte and rightbyte from char to unsigned char
  13. // in struct DByte
  14. // 04/10/1999 - changed leftbyte. rightbyte to uint8_t in struct DByte;
  15. // added table UnicodeToGBKTable[0x5200]
  16. //
  17. // 05/16/2000 - added gUnicodeToGBKTableInitialized flag for optimization
  18. // ======================================================================================
  19. // Table GBKToUnicode[] maps the GBK code to its unicode.
  20. // The mapping data of this GBK table is obtained from
  21. // ftp://ftp.unicode.org/Public/MAPPINGS/VENDORS/MICSFT/WINDOWS/CP936.TXT
  22. // Frank Tang of Netscape wrote the original perl tool to re-align the
  23. // mapping data into an 8-item per line format ( i.e. file cp936map.txt ).
  24. //
  25. // The valid GBK charset range: left byte is [0x81, 0xfe], right byte are
  26. // [0x40, 0x7e] and [0x80, 0xfe]. But for the convenience of index
  27. // calculation, the table here has a single consecutive range of
  28. // [0x40, 0xfe] for the right byte. Those invalid chars whose right byte
  29. // is 0x7f will be mapped to undefined unicode 0xFFFF.
  30. //
  31. //
  32. // Table UnicodeToGBK[] maps the unicode to GBK code. To reduce memory usage, we
  33. // only do Unicode to GBK table mapping for unicode between 0x4E00 and 0xA000;
  34. // Others let converter to do search from table GBKToUnicode[]. If we want further
  35. // trade memory for performance, we can let more unicode to do table mapping to get
  36. // its GBK instead of searching table GBKToUnicode[].
  37. #ifndef _GBKU_H__
  38. #define _GBKU_H__
  39. #define UCS2_NO_MAPPING ((char16_t) 0xfffd)
  40. #define UINT8_IN_RANGE(a, b, c) \
  41. (((uint8_t)(a) <= (uint8_t)(b))&&((uint8_t)(b) <= (uint8_t)(c)))
  42. #define UNICHAR_IN_RANGE(a, b, c) \
  43. (((char16_t)(a) <= (char16_t)(b))&&((char16_t)(b) <= (char16_t)(c)))
  44. #define CAST_CHAR_TO_UNICHAR(a) ((char16_t)((unsigned char)(a)))
  45. #define CAST_UNICHAR_TO_CHAR(a) ((char)a)
  46. #define IS_ASCII(a) (0==(0xff80 & (a)))
  47. #define IS_GBK_EURO(c) ((char)0x80 == (c))
  48. #define UCS2_EURO ((char16_t) 0x20ac)
  49. #include "nsGBKConvUtil.h"
  50. #endif /* _GBKU_H__ */