Skip to content

Commit dbe700e

Browse files
committed
add more characters easily inputtable with CJK IMEs
1 parent 95545e7 commit dbe700e

File tree

1 file changed

+16
-0
lines changed

1 file changed

+16
-0
lines changed

src/libsyntax/parse/lexer/unicode_chars.rs

+16
Original file line numberDiff line numberDiff line change
@@ -24,14 +24,18 @@ const UNICODE_ARRAY: &'static [(char, &'static str, char)] = &[
2424
('‑', "Non-Breaking Hyphen", '-'),
2525
('‒', "Figure Dash", '-'),
2626
('–', "En Dash", '-'),
27+
('—', "Em Dash", '-'),
2728
('﹘', "Small Em Dash", '-'),
2829
('⁃', "Hyphen Bullet", '-'),
2930
('˗', "Modifier Letter Minus Sign", '-'),
3031
('−', "Minus Sign", '-'),
32+
('ー', "Katakana-Hiragana Prolonged Sound Mark", '-'),
3133
('٫', "Arabic Decimal Separator", ','),
3234
('‚', "Single Low-9 Quotation Mark", ','),
3335
('ꓹ', "Lisu Letter Tone Na Po", ','),
36+
('，', "Fullwidth Comma", ','),
3437
(';', "Greek Question Mark", ';'),
38+
('；', "Fullwidth Semicolon", ';'),
3539
('ः', "Devanagari Sign Visarga", ':'),
3640
('ઃ', "Gujarati Sign Visarga", ':'),
3741
('：', "Fullwidth Colon", ':'),
@@ -53,16 +57,20 @@ const UNICODE_ARRAY: &'static [(char, &'static str, char)] = &[
5357
('ʔ', "Latin Letter Glottal Stop", '?'),
5458
('ॽ', "Devanagari Letter Glottal Stop", '?'),
5559
('Ꭾ', "Cherokee Letter He", '?'),
60+
('？', "Fullwidth Question Mark", '?'),
5661
('𝅭', "Musical Symbol Combining Augmentation Dot", '.'),
5762
('․', "One Dot Leader", '.'),
5863
('۔', "Arabic Full Stop", '.'),
5964
('܁', "Syriac Supralinear Full Stop", '.'),
6065
('܂', "Syriac Sublinear Full Stop", '.'),
6166
('꘎', "Vai Full Stop", '.'),
6267
('𐩐', "Kharoshthi Punctuation Dot", '.'),
68+
('·', "Middle Dot", '.'),
6369
('٠', "Arabic-Indic Digit Zero", '.'),
6470
('۰', "Extended Arabic-Indic Digit Zero", '.'),
6571
('ꓸ', "Lisu Letter Tone Mya Ti", '.'),
72+
('。', "Ideographic Full Stop", '.'),
73+
('・', "Katakana Middle Dot", '.'),
6674
('՝', "Armenian Comma", '\''),
6775
('＇', "Fullwidth Apostrophe", '\''),
6876
('‘', "Left Single Quotation Mark", '\''),
@@ -113,11 +121,13 @@ const UNICODE_ARRAY: &'static [(char, &'static str, char)] = &[
113121
('❲', "Light Left Tortoise Shell Bracket Ornament", '('),
114122
('〔', "Left Tortoise Shell Bracket", '('),
115123
('﴾', "Ornate Left Parenthesis", '('),
124+
('（', "Fullwidth Left Parenthesis", '('),
116125
('］', "Fullwidth Right Square Bracket", ')'),
117126
('❩', "Medium Right Parenthesis Ornament", ')'),
118127
('❳', "Light Right Tortoise Shell Bracket Ornament", ')'),
119128
('〕', "Right Tortoise Shell Bracket", ')'),
120129
('﴿', "Ornate Right Parenthesis", ')'),
130+
('）', "Fullwidth Right Parenthesis", ')'),
121131
('❴', "Medium Left Curly Bracket Ornament", '{'),
122132
('❵', "Medium Right Curly Bracket Ornament", '}'),
123133
('⁎', "Low Asterisk", '*'),
@@ -140,6 +150,8 @@ const UNICODE_ARRAY: &'static [(char, &'static str, char)] = &[
140150
('⟍', "Mathematical Falling Diagonal", '\\'),
141151
('⧵', "Reverse Solidus Operator", '\\'),
142152
('⧹', "Big Reverse Solidus", '\\'),
153+
('、', "Ideographic Comma", '\\'),
154+
('ヽ', "Katakana Iteration Mark", '\\'),
143155
('㇔', "Cjk Stroke D", '\\'),
144156
('丶', "Cjk Unified Ideograph-4E36", '\\'),
145157
('⼂', "Kangxi Radical Dot", '\\'),
@@ -148,10 +160,14 @@ const UNICODE_ARRAY: &'static [(char, &'static str, char)] = &[
148160
('‹', "Single Left-Pointing Angle Quotation Mark", '<'),
149161
('❮', "Heavy Left-Pointing Angle Quotation Mark Ornament", '<'),
150162
('˂', "Modifier Letter Left Arrowhead", '<'),
163+
('〈', "Left Angle Bracket", '<'),
164+
('《', "Left Double Angle Bracket", '<'),
151165
('꓿', "Lisu Punctuation Full Stop", '='),
152166
('›', "Single Right-Pointing Angle Quotation Mark", '>'),
153167
('❯', "Heavy Right-Pointing Angle Quotation Mark Ornament", '>'),
154168
('˃', "Modifier Letter Right Arrowhead", '>'),
169+
('〉', "Right Angle Bracket", '>'),
170+
('》', "Right Double Angle Bracket", '>'),
155171
('Ⲻ', "Coptic Capital Letter Dialect-P Ni", '-'),
156172
('Ɂ', "Latin Capital Letter Glottal Stop", '?'),
157173
('Ⳇ', "Coptic Capital Letter Old Coptic Esh", '/'), ];

0 commit comments

Comments
 (0)