@@ -16,6 +16,22 @@ use errors::DiagnosticBuilder;
1616use super :: StringReader ;
1717
1818const UNICODE_ARRAY : & ' static [ ( char , & ' static str , char ) ] = & [
19+ ( '\u{00A0}' , "No-Break Space" , ' ' ) ,
20+ ( '\u{1680}' , "Ogham Space Mark" , ' ' ) ,
21+ ( '\u{2000}' , "En Quad" , ' ' ) ,
22+ ( '\u{2001}' , "Em Quad" , ' ' ) ,
23+ ( '\u{2002}' , "En Space" , ' ' ) ,
24+ ( '\u{2003}' , "Em Space" , ' ' ) ,
25+ ( '\u{2004}' , "Three-Per-Em Space" , ' ' ) ,
26+ ( '\u{2005}' , "Four-Per-Em Space" , ' ' ) ,
27+ ( '\u{2006}' , "Six-Per-Em Space" , ' ' ) ,
28+ ( '\u{2007}' , "Figure Space" , ' ' ) ,
29+ ( '\u{2008}' , "Punctuation Space" , ' ' ) ,
30+ ( '\u{2009}' , "Thin Space" , ' ' ) ,
31+ ( '\u{200A}' , "Hair Space" , ' ' ) ,
32+ ( '\u{202F}' , "Narrow No-Break Space" , ' ' ) ,
33+ ( '\u{205F}' , "Medium Mathematical Space" , ' ' ) ,
34+ ( '\u{3000}' , "Ideographic Space" , ' ' ) ,
1935 ( 'ߺ' , "Nko Lajanyalan" , '_' ) ,
2036 ( '﹍' , "Dashed Low Line" , '_' ) ,
2137 ( '﹎' , "Centreline Low Line" , '_' ) ,
@@ -24,14 +40,18 @@ const UNICODE_ARRAY: &'static [(char, &'static str, char)] = &[
2440 ( '‑' , "Non-Breaking Hyphen" , '-' ) ,
2541 ( '‒' , "Figure Dash" , '-' ) ,
2642 ( '–' , "En Dash" , '-' ) ,
43+ ( '—' , "Em Dash" , '-' ) ,
2744 ( '﹘' , "Small Em Dash" , '-' ) ,
2845 ( '⁃' , "Hyphen Bullet" , '-' ) ,
2946 ( '˗' , "Modifier Letter Minus Sign" , '-' ) ,
3047 ( '−' , "Minus Sign" , '-' ) ,
48+ ( 'ー' , "Katakana-Hiragana Prolonged Sound Mark" , '-' ) ,
3149 ( '٫' , "Arabic Decimal Separator" , ',' ) ,
3250 ( '‚' , "Single Low-9 Quotation Mark" , ',' ) ,
3351 ( 'ꓹ' , "Lisu Letter Tone Na Po" , ',' ) ,
52+ ( ',' , "Fullwidth Comma" , ',' ) ,
3453 ( '\u{37e}' , "Greek Question Mark" , ';' ) ,
54+ ( ';' , "Fullwidth Semicolon" , ';' ) ,
3555 ( 'ः' , "Devanagari Sign Visarga" , ':' ) ,
3656 ( 'ઃ' , "Gujarati Sign Visarga" , ':' ) ,
3757 ( ':' , "Fullwidth Colon" , ':' ) ,
@@ -53,16 +73,20 @@ const UNICODE_ARRAY: &'static [(char, &'static str, char)] = &[
5373 ( 'ʔ' , "Latin Letter Glottal Stop" , '?' ) ,
5474 ( 'ॽ' , "Devanagari Letter Glottal Stop" , '?' ) ,
5575 ( 'Ꭾ' , "Cherokee Letter He" , '?' ) ,
76+ ( '?' , "Fullwidth Question Mark" , '?' ) ,
5677 ( '𝅭' , "Musical Symbol Combining Augmentation Dot" , '.' ) ,
5778 ( '․' , "One Dot Leader" , '.' ) ,
5879 ( '۔' , "Arabic Full Stop" , '.' ) ,
5980 ( '܁' , "Syriac Supralinear Full Stop" , '.' ) ,
6081 ( '܂' , "Syriac Sublinear Full Stop" , '.' ) ,
6182 ( '꘎' , "Vai Full Stop" , '.' ) ,
6283 ( '𐩐' , "Kharoshthi Punctuation Dot" , '.' ) ,
84+ ( '·' , "Middle Dot" , '.' ) ,
6385 ( '٠' , "Arabic-Indic Digit Zero" , '.' ) ,
6486 ( '۰' , "Extended Arabic-Indic Digit Zero" , '.' ) ,
6587 ( 'ꓸ' , "Lisu Letter Tone Mya Ti" , '.' ) ,
88+ ( '。' , "Ideographic Full Stop" , '.' ) ,
89+ ( '・' , "Katakana Middle Dot" , '.' ) ,
6690 ( '՝' , "Armenian Comma" , '\'' ) ,
6791 ( ''' , "Fullwidth Apostrophe" , '\'' ) ,
6892 ( '‘' , "Left Single Quotation Mark" , '\'' ) ,
@@ -108,16 +132,30 @@ const UNICODE_ARRAY: &'static [(char, &'static str, char)] = &[
108132 ( 'ײ' , "Hebrew Ligature Yiddish Double Yod" , '"' ) ,
109133 ( '❞' , "Heavy Double Comma Quotation Mark Ornament" , '"' ) ,
110134 ( '❝' , "Heavy Double Turned Comma Quotation Mark Ornament" , '"' ) ,
111- ( '[' , "Fullwidth Left Square Bracket" , '(' ) ,
112135 ( '❨' , "Medium Left Parenthesis Ornament" , '(' ) ,
113- ( '❲' , "Light Left Tortoise Shell Bracket Ornament" , '(' ) ,
114- ( '〔' , "Left Tortoise Shell Bracket" , '(' ) ,
115136 ( '﴾' , "Ornate Left Parenthesis" , '(' ) ,
116- ( ']' , "Fullwidth Right Square Bracket" , ')' ) ,
137+ ( '(' , "Fullwidth Left Parenthesis" , '(' ) ,
117138 ( '❩' , "Medium Right Parenthesis Ornament" , ')' ) ,
118- ( '❳' , "Light Right Tortoise Shell Bracket Ornament" , ')' ) ,
119- ( '〕' , "Right Tortoise Shell Bracket" , ')' ) ,
120139 ( '﴿' , "Ornate Right Parenthesis" , ')' ) ,
140+ ( ')' , "Fullwidth Right Parenthesis" , ')' ) ,
141+ ( '[' , "Fullwidth Left Square Bracket" , '[' ) ,
142+ ( '❲' , "Light Left Tortoise Shell Bracket Ornament" , '[' ) ,
143+ ( '「' , "Left Corner Bracket" , '[' ) ,
144+ ( '『' , "Left White Corner Bracket" , '[' ) ,
145+ ( '【' , "Left Black Lenticular Bracket" , '[' ) ,
146+ ( '〔' , "Left Tortoise Shell Bracket" , '[' ) ,
147+ ( '〖' , "Left White Lenticular Bracket" , '[' ) ,
148+ ( '〘' , "Left White Tortoise Shell Bracket" , '[' ) ,
149+ ( '〚' , "Left White Square Bracket" , '[' ) ,
150+ ( ']' , "Fullwidth Right Square Bracket" , ']' ) ,
151+ ( '❳' , "Light Right Tortoise Shell Bracket Ornament" , ']' ) ,
152+ ( '」' , "Right Corner Bracket" , ']' ) ,
153+ ( '』' , "Right White Corner Bracket" , ']' ) ,
154+ ( '】' , "Right Black Lenticular Bracket" , ']' ) ,
155+ ( '〕' , "Right Tortoise Shell Bracket" , ']' ) ,
156+ ( '〗' , "Right White Lenticular Bracket" , ']' ) ,
157+ ( '〙' , "Right White Tortoise Shell Bracket" , ']' ) ,
158+ ( '〛' , "Right White Square Bracket" , ']' ) ,
121159 ( '❴' , "Medium Left Curly Bracket Ornament" , '{' ) ,
122160 ( '❵' , "Medium Right Curly Bracket Ornament" , '}' ) ,
123161 ( '⁎' , "Low Asterisk" , '*' ) ,
@@ -140,6 +178,8 @@ const UNICODE_ARRAY: &'static [(char, &'static str, char)] = &[
140178 ( '⟍' , "Mathematical Falling Diagonal" , '\\' ) ,
141179 ( '⧵' , "Reverse Solidus Operator" , '\\' ) ,
142180 ( '⧹' , "Big Reverse Solidus" , '\\' ) ,
181+ ( '、' , "Ideographic Comma" , '\\' ) ,
182+ ( 'ヽ' , "Katakana Iteration Mark" , '\\' ) ,
143183 ( '㇔' , "Cjk Stroke D" , '\\' ) ,
144184 ( '丶' , "Cjk Unified Ideograph-4E36" , '\\' ) ,
145185 ( '⼂' , "Kangxi Radical Dot" , '\\' ) ,
@@ -148,15 +188,20 @@ const UNICODE_ARRAY: &'static [(char, &'static str, char)] = &[
148188 ( '‹' , "Single Left-Pointing Angle Quotation Mark" , '<' ) ,
149189 ( '❮' , "Heavy Left-Pointing Angle Quotation Mark Ornament" , '<' ) ,
150190 ( '˂' , "Modifier Letter Left Arrowhead" , '<' ) ,
191+ ( '〈' , "Left Angle Bracket" , '<' ) ,
192+ ( '《' , "Left Double Angle Bracket" , '<' ) ,
151193 ( '꓿' , "Lisu Punctuation Full Stop" , '=' ) ,
152194 ( '›' , "Single Right-Pointing Angle Quotation Mark" , '>' ) ,
153195 ( '❯' , "Heavy Right-Pointing Angle Quotation Mark Ornament" , '>' ) ,
154196 ( '˃' , "Modifier Letter Right Arrowhead" , '>' ) ,
197+ ( '〉' , "Right Angle Bracket" , '>' ) ,
198+ ( '》' , "Right Double Angle Bracket" , '>' ) ,
155199 ( 'Ⲻ' , "Coptic Capital Letter Dialect-P Ni" , '-' ) ,
156200 ( 'Ɂ' , "Latin Capital Letter Glottal Stop" , '?' ) ,
157201 ( 'Ⳇ' , "Coptic Capital Letter Old Coptic Esh" , '/' ) , ] ;
158202
159203const ASCII_ARRAY : & ' static [ ( char , & ' static str ) ] = & [
204+ ( ' ' , "Space" ) ,
160205 ( '_' , "Underscore" ) ,
161206 ( '-' , "Minus/Hyphen" ) ,
162207 ( ',' , "Comma" ) ,
@@ -169,6 +214,8 @@ const ASCII_ARRAY: &'static [(char, &'static str)] = &[
169214 ( '"' , "Quotation Mark" ) ,
170215 ( '(' , "Left Parenthesis" ) ,
171216 ( ')' , "Right Parenthesis" ) ,
217+ ( '[' , "Left Square Bracket" ) ,
218+ ( ']' , "Right Square Bracket" ) ,
172219 ( '{' , "Left Curly Brace" ) ,
173220 ( '}' , "Right Curly Brace" ) ,
174221 ( '*' , "Asterisk" ) ,
0 commit comments