Commit version string files.
[disorder] / lib / unidata.h
1 /** @file lib/unidata.h
2 * @brief Unicode tables
3 *
4 * Automatically generated file, see scripts/make-unidata
5 *
6 * DO NOT EDIT.
7 */
8 #ifndef UNIDATA_H
9 #define UNIDATA_H
10 enum unicode_General_Category {
11 unicode_General_Category_Cc,
12 unicode_General_Category_Cf,
13 unicode_General_Category_Cn,
14 unicode_General_Category_Co,
15 unicode_General_Category_Cs,
16 unicode_General_Category_Ll,
17 unicode_General_Category_Lm,
18 unicode_General_Category_Lo,
19 unicode_General_Category_Lt,
20 unicode_General_Category_Lu,
21 unicode_General_Category_Mc,
22 unicode_General_Category_Me,
23 unicode_General_Category_Mn,
24 unicode_General_Category_Nd,
25 unicode_General_Category_Nl,
26 unicode_General_Category_No,
27 unicode_General_Category_Pc,
28 unicode_General_Category_Pd,
29 unicode_General_Category_Pe,
30 unicode_General_Category_Pf,
31 unicode_General_Category_Pi,
32 unicode_General_Category_Po,
33 unicode_General_Category_Ps,
34 unicode_General_Category_Sc,
35 unicode_General_Category_Sk,
36 unicode_General_Category_Sm,
37 unicode_General_Category_So,
38 unicode_General_Category_Zl,
39 unicode_General_Category_Zp,
40 unicode_General_Category_Zs
41 };
42 enum unicode_Grapheme_Break {
43 unicode_Grapheme_Break_CR,
44 unicode_Grapheme_Break_Control,
45 unicode_Grapheme_Break_Extend,
46 unicode_Grapheme_Break_L,
47 unicode_Grapheme_Break_LF,
48 unicode_Grapheme_Break_LV,
49 unicode_Grapheme_Break_LVT,
50 unicode_Grapheme_Break_Other,
51 unicode_Grapheme_Break_Prepend,
52 unicode_Grapheme_Break_SpacingMark,
53 unicode_Grapheme_Break_T,
54 unicode_Grapheme_Break_V
55 };
56 extern const char *const unicode_Grapheme_Break_names[];
57 enum unicode_Word_Break {
58 unicode_Word_Break_ALetter,
59 unicode_Word_Break_CR,
60 unicode_Word_Break_Extend,
61 unicode_Word_Break_ExtendNumLet,
62 unicode_Word_Break_Format,
63 unicode_Word_Break_Katakana,
64 unicode_Word_Break_LF,
65 unicode_Word_Break_MidLetter,
66 unicode_Word_Break_MidNum,
67 unicode_Word_Break_MidNumLet,
68 unicode_Word_Break_Newline,
69 unicode_Word_Break_Numeric,
70 unicode_Word_Break_Other
71 };
72 extern const char *const unicode_Word_Break_names[];
73 enum unicode_Sentence_Break {
74 unicode_Sentence_Break_ATerm,
75 unicode_Sentence_Break_CR,
76 unicode_Sentence_Break_Close,
77 unicode_Sentence_Break_Extend,
78 unicode_Sentence_Break_Format,
79 unicode_Sentence_Break_LF,
80 unicode_Sentence_Break_Lower,
81 unicode_Sentence_Break_Numeric,
82 unicode_Sentence_Break_OLetter,
83 unicode_Sentence_Break_Other,
84 unicode_Sentence_Break_SContinue,
85 unicode_Sentence_Break_STerm,
86 unicode_Sentence_Break_Sep,
87 unicode_Sentence_Break_Sp,
88 unicode_Sentence_Break_Upper
89 };
90 extern const char *const unicode_Sentence_Break_names[];
91 enum unicode_flags {
92 unicode_normalize_before_casefold = 1,
93 unicode_compatibility_decomposition = 2
94 };
95
96 struct unidata {
97 const uint32_t *decomp;
98 const uint32_t *casefold;
99 const uint32_t *composed;
100 unsigned char ccc;
101 char general_category;
102 uint8_t flags;
103 char grapheme_break;
104 char word_break;
105 char sentence_break;
106 };
107 extern const struct unidata *const unidata[];
108 extern const struct unicode_utf8_row {
109 uint8_t count;
110 uint8_t min2, max2;
111 } unicode_utf8_valid[];
112 #define UNICODE_NCHARS 1114112
113 #define UNICODE_MODULUS 16
114 #define UNICODE_BREAK_START 196608
115 #define UNICODE_BREAK_END 917504
116 #define UNICODE_BREAK_TOP 918016
117 #endif