  /* ucp.h */
  /*************************************************
  *        Unicode Property Table handler          *
  *************************************************/
  4. #ifndef _UCP_H
  5. #define _UCP_H
  /* This file contains definitions of the property values that are returned by
  the function _pcre_ucp_findprop(). New values that are added for new releases
  of Unicode should always be at the end of each enum, for backwards
  compatibility. */
  /* These are the general character categories.

  No enumerator has an explicit value, so they are numbered consecutively from
  ucp_C == 0 in the order listed. The numeric values therefore depend on this
  order: keep it as it is, and add any new category at the end. */

  enum {
    ucp_C,     /* Other */
    ucp_L,     /* Letter */
    ucp_M,     /* Mark */
    ucp_N,     /* Number */
    ucp_P,     /* Punctuation */
    ucp_S,     /* Symbol */
    ucp_Z      /* Separator */
  };
  /* These are the particular character types. Each name is a two-letter code
  whose first letter matches one of the general categories (C, L, M, N, P, S,
  Z).

  No enumerator has an explicit value, so they are numbered consecutively from
  ucp_Cc == 0 in the order listed. The numeric values therefore depend on this
  order: keep it as it is, and add any new type at the end. */

  enum {
    ucp_Cc,    /* Control */
    ucp_Cf,    /* Format */
    ucp_Cn,    /* Unassigned */
    ucp_Co,    /* Private use */
    ucp_Cs,    /* Surrogate */
    ucp_Ll,    /* Lower case letter */
    ucp_Lm,    /* Modifier letter */
    ucp_Lo,    /* Other letter */
    ucp_Lt,    /* Title case letter */
    ucp_Lu,    /* Upper case letter */
    ucp_Mc,    /* Spacing mark */
    ucp_Me,    /* Enclosing mark */
    ucp_Mn,    /* Non-spacing mark */
    ucp_Nd,    /* Decimal number */
    ucp_Nl,    /* Letter number */
    ucp_No,    /* Other number */
    ucp_Pc,    /* Connector punctuation */
    ucp_Pd,    /* Dash punctuation */
    ucp_Pe,    /* Close punctuation */
    ucp_Pf,    /* Final punctuation */
    ucp_Pi,    /* Initial punctuation */
    ucp_Po,    /* Other punctuation */
    ucp_Ps,    /* Open punctuation */
    ucp_Sc,    /* Currency symbol */
    ucp_Sk,    /* Modifier symbol */
    ucp_Sm,    /* Mathematical symbol */
    ucp_So,    /* Other symbol */
    ucp_Zl,    /* Line separator */
    ucp_Zp,    /* Paragraph separator */
    ucp_Zs     /* Space separator */
  };
  /* These are the script identifications.

  No enumerator has an explicit value, so they are numbered consecutively from
  ucp_Arabic == 0 in the order listed. The first group (ucp_Arabic to ucp_Yi)
  is in alphabetical order; scripts introduced later are appended after it
  rather than merged in, so that existing values never change. Add further
  scripts at the end in the same way. */

  enum {
    ucp_Arabic,
    ucp_Armenian,
    ucp_Bengali,
    ucp_Bopomofo,
    ucp_Braille,
    ucp_Buginese,
    ucp_Buhid,
    ucp_Canadian_Aboriginal,
    ucp_Cherokee,
    ucp_Common,
    ucp_Coptic,
    ucp_Cypriot,
    ucp_Cyrillic,
    ucp_Deseret,
    ucp_Devanagari,
    ucp_Ethiopic,
    ucp_Georgian,
    ucp_Glagolitic,
    ucp_Gothic,
    ucp_Greek,
    ucp_Gujarati,
    ucp_Gurmukhi,
    ucp_Han,
    ucp_Hangul,
    ucp_Hanunoo,
    ucp_Hebrew,
    ucp_Hiragana,
    ucp_Inherited,
    ucp_Kannada,
    ucp_Katakana,
    ucp_Kharoshthi,
    ucp_Khmer,
    ucp_Lao,
    ucp_Latin,
    ucp_Limbu,
    ucp_Linear_B,
    ucp_Malayalam,
    ucp_Mongolian,
    ucp_Myanmar,
    ucp_New_Tai_Lue,
    ucp_Ogham,
    ucp_Old_Italic,
    ucp_Old_Persian,
    ucp_Oriya,
    ucp_Osmanya,
    ucp_Runic,
    ucp_Shavian,
    ucp_Sinhala,
    ucp_Syloti_Nagri,
    ucp_Syriac,
    ucp_Tagalog,
    ucp_Tagbanwa,
    ucp_Tai_Le,
    ucp_Tamil,
    ucp_Telugu,
    ucp_Thaana,
    ucp_Thai,
    ucp_Tibetan,
    ucp_Tifinagh,
    ucp_Ugaritic,
    ucp_Yi,
    ucp_Balinese,      /* New for Unicode 5.0.0 */
    ucp_Cuneiform,     /* New for Unicode 5.0.0 */
    ucp_Nko,           /* New for Unicode 5.0.0 */
    ucp_Phags_Pa,      /* New for Unicode 5.0.0 */
    ucp_Phoenician     /* New for Unicode 5.0.0 */
  };
  122. #endif
  /* End of ucp.h */