@@ -24,14 +24,18 @@ const UNICODE_ARRAY: &'static [(char, &'static str, char)] = &[
2424 ( '‑' , "Non-Breaking Hyphen" , '-' ) ,
2525 ( '‒' , "Figure Dash" , '-' ) ,
2626 ( '–' , "En Dash" , '-' ) ,
27+ ( '—' , "Em Dash" , '-' ) ,
2728 ( '﹘' , "Small Em Dash" , '-' ) ,
2829 ( '⁃' , "Hyphen Bullet" , '-' ) ,
2930 ( '˗' , "Modifier Letter Minus Sign" , '-' ) ,
3031 ( '−' , "Minus Sign" , '-' ) ,
32+ ( 'ー' , "Katakana-Hiragana Prolonged Sound Mark" , '-' ) ,
3133 ( '٫' , "Arabic Decimal Separator" , ',' ) ,
3234 ( '‚' , "Single Low-9 Quotation Mark" , ',' ) ,
3335 ( 'ꓹ' , "Lisu Letter Tone Na Po" , ',' ) ,
36+ ( '，' , "Fullwidth Comma" , ',' ) ,
3437 ( '\u{37E}' , "Greek Question Mark" , ';' ) ,
38+ ( '；' , "Fullwidth Semicolon" , ';' ) ,
3539 ( 'ः' , "Devanagari Sign Visarga" , ':' ) ,
3640 ( 'ઃ' , "Gujarati Sign Visarga" , ':' ) ,
3741 ( '：' , "Fullwidth Colon" , ':' ) ,
@@ -53,16 +57,20 @@ const UNICODE_ARRAY: &'static [(char, &'static str, char)] = &[
5357 ( 'ʔ' , "Latin Letter Glottal Stop" , '?' ) ,
5458 ( 'ॽ' , "Devanagari Letter Glottal Stop" , '?' ) ,
5559 ( 'Ꭾ' , "Cherokee Letter He" , '?' ) ,
60+ ( '？' , "Fullwidth Question Mark" , '?' ) ,
5661 ( '𝅭' , "Musical Symbol Combining Augmentation Dot" , '.' ) ,
5762 ( '․' , "One Dot Leader" , '.' ) ,
5863 ( '۔' , "Arabic Full Stop" , '.' ) ,
5964 ( '܁' , "Syriac Supralinear Full Stop" , '.' ) ,
6065 ( '܂' , "Syriac Sublinear Full Stop" , '.' ) ,
6166 ( '꘎' , "Vai Full Stop" , '.' ) ,
6267 ( '𐩐' , "Kharoshthi Punctuation Dot" , '.' ) ,
68+ ( '·' , "Middle Dot" , '.' ) ,
6369 ( '٠' , "Arabic-Indic Digit Zero" , '.' ) ,
6470 ( '۰' , "Extended Arabic-Indic Digit Zero" , '.' ) ,
6571 ( 'ꓸ' , "Lisu Letter Tone Mya Ti" , '.' ) ,
72+ ( '。' , "Ideographic Full Stop" , '.' ) ,
73+ ( '・' , "Katakana Middle Dot" , '.' ) ,
6674 ( '՝' , "Armenian Comma" , '\'' ) ,
6775 ( '＇' , "Fullwidth Apostrophe" , '\'' ) ,
6876 ( '‘' , "Left Single Quotation Mark" , '\'' ) ,
@@ -113,11 +121,13 @@ const UNICODE_ARRAY: &'static [(char, &'static str, char)] = &[
113121 ( '❲' , "Light Left Tortoise Shell Bracket Ornament" , '(' ) ,
114122 ( '〔' , "Left Tortoise Shell Bracket" , '(' ) ,
115123 ( '﴾' , "Ornate Left Parenthesis" , '(' ) ,
124+ ( '（' , "Fullwidth Left Parenthesis" , '(' ) ,
116125 ( '］' , "Fullwidth Right Square Bracket" , ')' ) ,
117126 ( '❩' , "Medium Right Parenthesis Ornament" , ')' ) ,
118127 ( '❳' , "Light Right Tortoise Shell Bracket Ornament" , ')' ) ,
119128 ( '〕' , "Right Tortoise Shell Bracket" , ')' ) ,
120129 ( '﴿' , "Ornate Right Parenthesis" , ')' ) ,
130+ ( '）' , "Fullwidth Right Parenthesis" , ')' ) ,
121131 ( '❴' , "Medium Left Curly Bracket Ornament" , '{' ) ,
122132 ( '❵' , "Medium Right Curly Bracket Ornament" , '}' ) ,
123133 ( '⁎' , "Low Asterisk" , '*' ) ,
@@ -140,6 +150,8 @@ const UNICODE_ARRAY: &'static [(char, &'static str, char)] = &[
140150 ( '⟍' , "Mathematical Falling Diagonal" , '\\' ) ,
141151 ( '⧵' , "Reverse Solidus Operator" , '\\' ) ,
142152 ( '⧹' , "Big Reverse Solidus" , '\\' ) ,
153+ ( '、' , "Ideographic Comma" , '\\' ) ,
154+ ( 'ヽ' , "Katakana Iteration Mark" , '\\' ) ,
143155 ( '㇔' , "Cjk Stroke D" , '\\' ) ,
144156 ( '丶' , "Cjk Unified Ideograph-4E36" , '\\' ) ,
145157 ( '⼂' , "Kangxi Radical Dot" , '\\' ) ,
@@ -148,10 +160,14 @@ const UNICODE_ARRAY: &'static [(char, &'static str, char)] = &[
148160 ( '‹' , "Single Left-Pointing Angle Quotation Mark" , '<' ) ,
149161 ( '❮' , "Heavy Left-Pointing Angle Quotation Mark Ornament" , '<' ) ,
150162 ( '˂' , "Modifier Letter Left Arrowhead" , '<' ) ,
163+ ( '〈' , "Left Angle Bracket" , '<' ) ,
164+ ( '《' , "Left Double Angle Bracket" , '<' ) ,
151165 ( '꓿' , "Lisu Punctuation Full Stop" , '=' ) ,
152166 ( '›' , "Single Right-Pointing Angle Quotation Mark" , '>' ) ,
153167 ( '❯' , "Heavy Right-Pointing Angle Quotation Mark Ornament" , '>' ) ,
154168 ( '˃' , "Modifier Letter Right Arrowhead" , '>' ) ,
169+ ( '〉' , "Right Angle Bracket" , '>' ) ,
170+ ( '》' , "Right Double Angle Bracket" , '>' ) ,
155171 ( 'Ⲻ' , "Coptic Capital Letter Dialect-P Ni" , '-' ) ,
156172 ( 'Ɂ' , "Latin Capital Letter Glottal Stop" , '?' ) ,
157173 ( 'Ⳇ' , "Coptic Capital Letter Old Coptic Esh" , '/' ) , ] ;
0 commit comments