@@ -24,14 +24,18 @@ const UNICODE_ARRAY: &'static [(char, &'static str, char)] = &[
24
24
( '‑' , "Non-Breaking Hyphen" , '-' ) ,
25
25
( '‒' , "Figure Dash" , '-' ) ,
26
26
( '–' , "En Dash" , '-' ) ,
27
+ ( '—' , "Em Dash" , '-' ) ,
27
28
( '﹘' , "Small Em Dash" , '-' ) ,
28
29
( '⁃' , "Hyphen Bullet" , '-' ) ,
29
30
( '˗' , "Modifier Letter Minus Sign" , '-' ) ,
30
31
( '−' , "Minus Sign" , '-' ) ,
32
+ ( 'ー' , "Katakana-Hiragana Prolonged Sound Mark" , '-' ) ,
31
33
( '٫' , "Arabic Decimal Separator" , ',' ) ,
32
34
( '‚' , "Single Low-9 Quotation Mark" , ',' ) ,
33
35
( 'ꓹ' , "Lisu Letter Tone Na Po" , ',' ) ,
36
+ ( '，' , "Fullwidth Comma" , ',' ) ,
34
37
( ';' , "Greek Question Mark" , ';' ) ,
38
+ ( '；' , "Fullwidth Semicolon" , ';' ) ,
35
39
( 'ः' , "Devanagari Sign Visarga" , ':' ) ,
36
40
( 'ઃ' , "Gujarati Sign Visarga" , ':' ) ,
37
41
( '：' , "Fullwidth Colon" , ':' ) ,
@@ -53,16 +57,20 @@ const UNICODE_ARRAY: &'static [(char, &'static str, char)] = &[
53
57
( 'ʔ' , "Latin Letter Glottal Stop" , '?' ) ,
54
58
( 'ॽ' , "Devanagari Letter Glottal Stop" , '?' ) ,
55
59
( 'Ꭾ' , "Cherokee Letter He" , '?' ) ,
60
+ ( '？' , "Fullwidth Question Mark" , '?' ) ,
56
61
( '𝅭' , "Musical Symbol Combining Augmentation Dot" , '.' ) ,
57
62
( '․' , "One Dot Leader" , '.' ) ,
58
63
( '۔' , "Arabic Full Stop" , '.' ) ,
59
64
( '܁' , "Syriac Supralinear Full Stop" , '.' ) ,
60
65
( '܂' , "Syriac Sublinear Full Stop" , '.' ) ,
61
66
( '꘎' , "Vai Full Stop" , '.' ) ,
62
67
( '𐩐' , "Kharoshthi Punctuation Dot" , '.' ) ,
68
+ ( '·' , "Middle Dot" , '.' ) ,
63
69
( '٠' , "Arabic-Indic Digit Zero" , '.' ) ,
64
70
( '۰' , "Extended Arabic-Indic Digit Zero" , '.' ) ,
65
71
( 'ꓸ' , "Lisu Letter Tone Mya Ti" , '.' ) ,
72
+ ( '。' , "Ideographic Full Stop" , '.' ) ,
73
+ ( '・' , "Katakana Middle Dot" , '.' ) ,
66
74
( '՝' , "Armenian Comma" , '\'' ) ,
67
75
( '＇' , "Fullwidth Apostrophe" , '\'' ) ,
68
76
( '‘' , "Left Single Quotation Mark" , '\'' ) ,
@@ -113,11 +121,13 @@ const UNICODE_ARRAY: &'static [(char, &'static str, char)] = &[
113
121
( '❲' , "Light Left Tortoise Shell Bracket Ornament" , '(' ) ,
114
122
( '〔' , "Left Tortoise Shell Bracket" , '(' ) ,
115
123
( '﴾' , "Ornate Left Parenthesis" , '(' ) ,
124
+ ( '（' , "Fullwidth Left Parenthesis" , '(' ) ,
116
125
( '］' , "Fullwidth Right Square Bracket" , ')' ) ,
117
126
( '❩' , "Medium Right Parenthesis Ornament" , ')' ) ,
118
127
( '❳' , "Light Right Tortoise Shell Bracket Ornament" , ')' ) ,
119
128
( '〕' , "Right Tortoise Shell Bracket" , ')' ) ,
120
129
( '﴿' , "Ornate Right Parenthesis" , ')' ) ,
130
+ ( '）' , "Fullwidth Right Parenthesis" , ')' ) ,
121
131
( '❴' , "Medium Left Curly Bracket Ornament" , '{' ) ,
122
132
( '❵' , "Medium Right Curly Bracket Ornament" , '}' ) ,
123
133
( '⁎' , "Low Asterisk" , '*' ) ,
@@ -140,6 +150,8 @@ const UNICODE_ARRAY: &'static [(char, &'static str, char)] = &[
140
150
( '⟍' , "Mathematical Falling Diagonal" , '\\' ) ,
141
151
( '⧵' , "Reverse Solidus Operator" , '\\' ) ,
142
152
( '⧹' , "Big Reverse Solidus" , '\\' ) ,
153
+ ( '、' , "Ideographic Comma" , '\\' ) ,
154
+ ( 'ヽ' , "Katakana Iteration Mark" , '\\' ) ,
143
155
( '㇔' , "Cjk Stroke D" , '\\' ) ,
144
156
( '丶' , "Cjk Unified Ideograph-4E36" , '\\' ) ,
145
157
( '⼂' , "Kangxi Radical Dot" , '\\' ) ,
@@ -148,10 +160,14 @@ const UNICODE_ARRAY: &'static [(char, &'static str, char)] = &[
148
160
( '‹' , "Single Left-Pointing Angle Quotation Mark" , '<' ) ,
149
161
( '❮' , "Heavy Left-Pointing Angle Quotation Mark Ornament" , '<' ) ,
150
162
( '˂' , "Modifier Letter Left Arrowhead" , '<' ) ,
163
+ ( '〈' , "Left Angle Bracket" , '<' ) ,
164
+ ( '《' , "Left Double Angle Bracket" , '<' ) ,
151
165
( '꓿' , "Lisu Punctuation Full Stop" , '=' ) ,
152
166
( '›' , "Single Right-Pointing Angle Quotation Mark" , '>' ) ,
153
167
( '❯' , "Heavy Right-Pointing Angle Quotation Mark Ornament" , '>' ) ,
154
168
( '˃' , "Modifier Letter Right Arrowhead" , '>' ) ,
169
+ ( '〉' , "Right Angle Bracket" , '>' ) ,
170
+ ( '》' , "Right Double Angle Bracket" , '>' ) ,
155
171
( 'Ⲻ' , "Coptic Capital Letter Dialect-P Ni" , '-' ) ,
156
172
( 'Ɂ' , "Latin Capital Letter Glottal Stop" , '?' ) ,
157
173
( 'Ⳇ' , "Coptic Capital Letter Old Coptic Esh" , '/' ) , ] ;
0 commit comments