@@ -16,6 +16,22 @@ use errors::DiagnosticBuilder;
16
16
use super :: StringReader ;
17
17
18
18
const UNICODE_ARRAY : & ' static [ ( char , & ' static str , char ) ] = & [
19
+ ( '\u{00A0}' , "No-Break Space" , ' ' ) ,
20
+ ( '\u{1680}' , "Ogham Space Mark" , ' ' ) ,
21
+ ( '\u{2000}' , "En Quad" , ' ' ) ,
22
+ ( '\u{2001}' , "Em Quad" , ' ' ) ,
23
+ ( '\u{2002}' , "En Space" , ' ' ) ,
24
+ ( '\u{2003}' , "Em Space" , ' ' ) ,
25
+ ( '\u{2004}' , "Three-Per-Em Space" , ' ' ) ,
26
+ ( '\u{2005}' , "Four-Per-Em Space" , ' ' ) ,
27
+ ( '\u{2006}' , "Six-Per-Em Space" , ' ' ) ,
28
+ ( '\u{2007}' , "Figure Space" , ' ' ) ,
29
+ ( '\u{2008}' , "Punctuation Space" , ' ' ) ,
30
+ ( '\u{2009}' , "Thin Space" , ' ' ) ,
31
+ ( '\u{200A}' , "Hair Space" , ' ' ) ,
32
+ ( '\u{202F}' , "Narrow No-Break Space" , ' ' ) ,
33
+ ( '\u{205F}' , "Medium Mathematical Space" , ' ' ) ,
34
+ ( '\u{3000}' , "Ideographic Space" , ' ' ) ,
19
35
( 'ߺ' , "Nko Lajanyalan" , '_' ) ,
20
36
( '﹍' , "Dashed Low Line" , '_' ) ,
21
37
( '﹎' , "Centreline Low Line" , '_' ) ,
@@ -24,14 +40,18 @@ const UNICODE_ARRAY: &'static [(char, &'static str, char)] = &[
24
40
( '‑' , "Non-Breaking Hyphen" , '-' ) ,
25
41
( '‒' , "Figure Dash" , '-' ) ,
26
42
( '–' , "En Dash" , '-' ) ,
43
+ ( '—' , "Em Dash" , '-' ) ,
27
44
( '﹘' , "Small Em Dash" , '-' ) ,
28
45
( '⁃' , "Hyphen Bullet" , '-' ) ,
29
46
( '˗' , "Modifier Letter Minus Sign" , '-' ) ,
30
47
( '−' , "Minus Sign" , '-' ) ,
48
+ ( 'ー' , "Katakana-Hiragana Prolonged Sound Mark" , '-' ) ,
31
49
( '٫' , "Arabic Decimal Separator" , ',' ) ,
32
50
( '‚' , "Single Low-9 Quotation Mark" , ',' ) ,
33
51
( 'ꓹ' , "Lisu Letter Tone Na Po" , ',' ) ,
52
+ ( '，' , "Fullwidth Comma" , ',' ) ,
34
53
( '\u{037E}' , "Greek Question Mark" , ';' ) ,
54
+ ( '；' , "Fullwidth Semicolon" , ';' ) ,
35
55
( 'ः' , "Devanagari Sign Visarga" , ':' ) ,
36
56
( 'ઃ' , "Gujarati Sign Visarga" , ':' ) ,
37
57
( '：' , "Fullwidth Colon" , ':' ) ,
@@ -53,16 +73,20 @@ const UNICODE_ARRAY: &'static [(char, &'static str, char)] = &[
53
73
( 'ʔ' , "Latin Letter Glottal Stop" , '?' ) ,
54
74
( 'ॽ' , "Devanagari Letter Glottal Stop" , '?' ) ,
55
75
( 'Ꭾ' , "Cherokee Letter He" , '?' ) ,
76
+ ( '？' , "Fullwidth Question Mark" , '?' ) ,
56
77
( '𝅭' , "Musical Symbol Combining Augmentation Dot" , '.' ) ,
57
78
( '․' , "One Dot Leader" , '.' ) ,
58
79
( '۔' , "Arabic Full Stop" , '.' ) ,
59
80
( '܁' , "Syriac Supralinear Full Stop" , '.' ) ,
60
81
( '܂' , "Syriac Sublinear Full Stop" , '.' ) ,
61
82
( '꘎' , "Vai Full Stop" , '.' ) ,
62
83
( '𐩐' , "Kharoshthi Punctuation Dot" , '.' ) ,
84
+ ( '·' , "Middle Dot" , '.' ) ,
63
85
( '٠' , "Arabic-Indic Digit Zero" , '.' ) ,
64
86
( '۰' , "Extended Arabic-Indic Digit Zero" , '.' ) ,
65
87
( 'ꓸ' , "Lisu Letter Tone Mya Ti" , '.' ) ,
88
+ ( '。' , "Ideographic Full Stop" , '.' ) ,
89
+ ( '・' , "Katakana Middle Dot" , '.' ) ,
66
90
( '՝' , "Armenian Comma" , '\'' ) ,
67
91
( '＇' , "Fullwidth Apostrophe" , '\'' ) ,
68
92
( '‘' , "Left Single Quotation Mark" , '\'' ) ,
@@ -108,16 +132,30 @@ const UNICODE_ARRAY: &'static [(char, &'static str, char)] = &[
108
132
( 'ײ' , "Hebrew Ligature Yiddish Double Yod" , '"' ) ,
109
133
( '❞' , "Heavy Double Comma Quotation Mark Ornament" , '"' ) ,
110
134
( '❝' , "Heavy Double Turned Comma Quotation Mark Ornament" , '"' ) ,
111
- ( '［' , "Fullwidth Left Square Bracket" , '(' ) ,
112
135
( '❨' , "Medium Left Parenthesis Ornament" , '(' ) ,
113
- ( '❲' , "Light Left Tortoise Shell Bracket Ornament" , '(' ) ,
114
- ( '〔' , "Left Tortoise Shell Bracket" , '(' ) ,
115
136
( '﴾' , "Ornate Left Parenthesis" , '(' ) ,
116
- ( '］' , "Fullwidth Right Square Bracket" , ')' ) ,
137
+ ( '（' , "Fullwidth Left Parenthesis" , '(' ) ,
117
138
( '❩' , "Medium Right Parenthesis Ornament" , ')' ) ,
118
- ( '❳' , "Light Right Tortoise Shell Bracket Ornament" , ')' ) ,
119
- ( '〕' , "Right Tortoise Shell Bracket" , ')' ) ,
120
139
( '﴿' , "Ornate Right Parenthesis" , ')' ) ,
140
+ ( '）' , "Fullwidth Right Parenthesis" , ')' ) ,
141
+ ( '［' , "Fullwidth Left Square Bracket" , '[' ) ,
142
+ ( '❲' , "Light Left Tortoise Shell Bracket Ornament" , '[' ) ,
143
+ ( '「' , "Left Corner Bracket" , '[' ) ,
144
+ ( '『' , "Left White Corner Bracket" , '[' ) ,
145
+ ( '【' , "Left Black Lenticular Bracket" , '[' ) ,
146
+ ( '〔' , "Left Tortoise Shell Bracket" , '[' ) ,
147
+ ( '〖' , "Left White Lenticular Bracket" , '[' ) ,
148
+ ( '〘' , "Left White Tortoise Shell Bracket" , '[' ) ,
149
+ ( '〚' , "Left White Square Bracket" , '[' ) ,
150
+ ( '］' , "Fullwidth Right Square Bracket" , ']' ) ,
151
+ ( '❳' , "Light Right Tortoise Shell Bracket Ornament" , ']' ) ,
152
+ ( '」' , "Right Corner Bracket" , ']' ) ,
153
+ ( '』' , "Right White Corner Bracket" , ']' ) ,
154
+ ( '】' , "Right Black Lenticular Bracket" , ']' ) ,
155
+ ( '〕' , "Right Tortoise Shell Bracket" , ']' ) ,
156
+ ( '〗' , "Right White Lenticular Bracket" , ']' ) ,
157
+ ( '〙' , "Right White Tortoise Shell Bracket" , ']' ) ,
158
+ ( '〛' , "Right White Square Bracket" , ']' ) ,
121
159
( '❴' , "Medium Left Curly Bracket Ornament" , '{' ) ,
122
160
( '❵' , "Medium Right Curly Bracket Ornament" , '}' ) ,
123
161
( '⁎' , "Low Asterisk" , '*' ) ,
@@ -140,6 +178,8 @@ const UNICODE_ARRAY: &'static [(char, &'static str, char)] = &[
140
178
( '⟍' , "Mathematical Falling Diagonal" , '\\' ) ,
141
179
( '⧵' , "Reverse Solidus Operator" , '\\' ) ,
142
180
( '⧹' , "Big Reverse Solidus" , '\\' ) ,
181
+ ( '、' , "Ideographic Comma" , '\\' ) ,
182
+ ( 'ヽ' , "Katakana Iteration Mark" , '\\' ) ,
143
183
( '㇔' , "Cjk Stroke D" , '\\' ) ,
144
184
( '丶' , "Cjk Unified Ideograph-4E36" , '\\' ) ,
145
185
( '⼂' , "Kangxi Radical Dot" , '\\' ) ,
@@ -148,15 +188,20 @@ const UNICODE_ARRAY: &'static [(char, &'static str, char)] = &[
148
188
( '‹' , "Single Left-Pointing Angle Quotation Mark" , '<' ) ,
149
189
( '❮' , "Heavy Left-Pointing Angle Quotation Mark Ornament" , '<' ) ,
150
190
( '˂' , "Modifier Letter Left Arrowhead" , '<' ) ,
191
+ ( '〈' , "Left Angle Bracket" , '<' ) ,
192
+ ( '《' , "Left Double Angle Bracket" , '<' ) ,
151
193
( '꓿' , "Lisu Punctuation Full Stop" , '=' ) ,
152
194
( '›' , "Single Right-Pointing Angle Quotation Mark" , '>' ) ,
153
195
( '❯' , "Heavy Right-Pointing Angle Quotation Mark Ornament" , '>' ) ,
154
196
( '˃' , "Modifier Letter Right Arrowhead" , '>' ) ,
197
+ ( '〉' , "Right Angle Bracket" , '>' ) ,
198
+ ( '》' , "Right Double Angle Bracket" , '>' ) ,
155
199
( 'Ⲻ' , "Coptic Capital Letter Dialect-P Ni" , '-' ) ,
156
200
( 'Ɂ' , "Latin Capital Letter Glottal Stop" , '?' ) ,
157
201
( 'Ⳇ' , "Coptic Capital Letter Old Coptic Esh" , '/' ) , ] ;
158
202
159
203
const ASCII_ARRAY : & ' static [ ( char , & ' static str ) ] = & [
204
+ ( ' ' , "Space" ) ,
160
205
( '_' , "Underscore" ) ,
161
206
( '-' , "Minus/Hyphen" ) ,
162
207
( ',' , "Comma" ) ,
@@ -169,6 +214,8 @@ const ASCII_ARRAY: &'static [(char, &'static str)] = &[
169
214
( '"' , "Quotation Mark" ) ,
170
215
( '(' , "Left Parenthesis" ) ,
171
216
( ')' , "Right Parenthesis" ) ,
217
+ ( '[' , "Left Square Bracket" ) ,
218
+ ( ']' , "Right Square Bracket" ) ,
172
219
( '{' , "Left Curly Brace" ) ,
173
220
( '}' , "Right Curly Brace" ) ,
174
221
( '*' , "Asterisk" ) ,
0 commit comments