diff options
| author | Eli Zaretskii | 2012-02-18 13:36:54 +0200 |
|---|---|---|
| committer | Eli Zaretskii | 2012-02-18 13:36:54 +0200 |
| commit | 57939ff41e57b4e24c00aa875046d103b46e066c (patch) | |
| tree | 89e8c93de342fde230e04edf40a67a342eed07b0 | |
| parent | 0c23686e58f426f1a94831b0453ddcaa46746f77 (diff) | |
| download | emacs-57939ff41e57b4e24c00aa875046d103b46e066c.tar.gz emacs-57939ff41e57b4e24c00aa875046d103b46e066c.zip | |
Update char-script-table from the latest Unicode Database.
lisp/international/characters.el (script-list): Sync with the latest
Unicode Character Database.
| -rw-r--r-- | lisp/ChangeLog | 5 | ||||
| -rw-r--r-- | lisp/international/characters.el | 109 |
2 files changed, 100 insertions, 14 deletions
diff --git a/lisp/ChangeLog b/lisp/ChangeLog index 14e2596e43d..1980d18d3b4 100644 --- a/lisp/ChangeLog +++ b/lisp/ChangeLog | |||
| @@ -1,3 +1,8 @@ | |||
| 1 | 2012-02-18 Eli Zaretskii <eliz@gnu.org> | ||
| 2 | |||
| 3 | * international/characters.el (script-list): Sync with the latest | ||
| 4 | Unicode Character Database. | ||
| 5 | |||
| 1 | 2012-02-18 Andreas Schwab <schwab@linux-m68k.org> | 6 | 2012-02-18 Andreas Schwab <schwab@linux-m68k.org> |
| 2 | 7 | ||
| 3 | * international/titdic-cnv.el: Remove duplicate coding tag. | 8 | * international/titdic-cnv.el: Remove duplicate coding tag. |
diff --git a/lisp/international/characters.el b/lisp/international/characters.el index 4b8ed3e21e2..ba8b8955fba 100644 --- a/lisp/international/characters.el +++ b/lisp/international/characters.el | |||
| @@ -1114,6 +1114,12 @@ Setup char-width-table appropriate for non-CJK language environment." | |||
| 1114 | 1114 | ||
| 1115 | ;; Setting char-script-table. | 1115 | ;; Setting char-script-table. |
| 1116 | 1116 | ||
| 1117 | ;; The data is compiled from Blocks.txt and Scripts.txt in the | ||
| 1118 | ;; "Unicode Character Database", simplified to lump together all the | ||
| 1119 | ;; blocks belonging to the same script. E.g., "Basic Latin", | ||
| 1120 | ;; "Latin-1 Supplement", "Latin Extended-A", etc. are all lumped | ||
| 1121 | ;; together under "latin". | ||
| 1122 | ;; | ||
| 1117 | ;; The Unicode blocks actually extend past some of these ranges with | 1123 | ;; The Unicode blocks actually extend past some of these ranges with |
| 1118 | ;; undefined codepoints. | 1124 | ;; undefined codepoints. |
| 1119 | (let ((script-list nil)) | 1125 | (let ((script-list nil)) |
| @@ -1126,13 +1132,17 @@ Setup char-width-table appropriate for non-CJK language environment." | |||
| 1126 | (#x0370 #x03E1 greek) | 1132 | (#x0370 #x03E1 greek) |
| 1127 | (#x03E2 #x03EF coptic) | 1133 | (#x03E2 #x03EF coptic) |
| 1128 | (#x03F0 #x03F3 greek) | 1134 | (#x03F0 #x03F3 greek) |
| 1129 | (#x0400 #x04FF cyrillic) | 1135 | (#x0400 #x052F cyrillic) |
| 1130 | (#x0530 #x058F armenian) | 1136 | (#x0530 #x058F armenian) |
| 1131 | (#x0590 #x05FF hebrew) | 1137 | (#x0590 #x05FF hebrew) |
| 1132 | (#x0600 #x06FF arabic) | 1138 | (#x0600 #x06FF arabic) |
| 1133 | (#x0700 #x074F syriac) | 1139 | (#x0700 #x074F syriac) |
| 1134 | (#x07C0 #x07FA nko) | 1140 | (#x0750 #x077F arabic) |
| 1135 | (#x0780 #x07BF thaana) | 1141 | (#x0780 #x07BF thaana) |
| 1142 | (#x07C0 #x07FF nko) | ||
| 1143 | (#x0800 #x083F samaritan) | ||
| 1144 | (#x0840 #x085F mandaic) | ||
| 1145 | (#x08A0 #x08FF arabic) | ||
| 1136 | (#x0900 #x097F devanagari) | 1146 | (#x0900 #x097F devanagari) |
| 1137 | (#x0980 #x09FF bengali) | 1147 | (#x0980 #x09FF bengali) |
| 1138 | (#x0A00 #x0A7F gurmukhi) | 1148 | (#x0A00 #x0A7F gurmukhi) |
| @@ -1143,10 +1153,10 @@ Setup char-width-table appropriate for non-CJK language environment." | |||
| 1143 | (#x0C80 #x0CFF kannada) | 1153 | (#x0C80 #x0CFF kannada) |
| 1144 | (#x0D00 #x0D7F malayalam) | 1154 | (#x0D00 #x0D7F malayalam) |
| 1145 | (#x0D80 #x0DFF sinhala) | 1155 | (#x0D80 #x0DFF sinhala) |
| 1146 | (#x0E00 #x0E5F thai) | 1156 | (#x0E00 #x0E7F thai) |
| 1147 | (#x0E80 #x0EDF lao) | 1157 | (#x0E80 #x0EFF lao) |
| 1148 | (#x0F00 #x0FFF tibetan) | 1158 | (#x0F00 #x0FFF tibetan) |
| 1149 | (#x1000 #x109F burmese) | 1159 | (#x1000 #x109F burmese) ; according to Unicode 6.1, should be "myanmar" |
| 1150 | (#x10A0 #x10FF georgian) | 1160 | (#x10A0 #x10FF georgian) |
| 1151 | (#x1100 #x11FF hangul) | 1161 | (#x1100 #x11FF hangul) |
| 1152 | (#x1200 #x139F ethiopic) | 1162 | (#x1200 #x139F ethiopic) |
| @@ -1154,14 +1164,40 @@ Setup char-width-table appropriate for non-CJK language environment." | |||
| 1154 | (#x1400 #x167F canadian-aboriginal) | 1164 | (#x1400 #x167F canadian-aboriginal) |
| 1155 | (#x1680 #x169F ogham) | 1165 | (#x1680 #x169F ogham) |
| 1156 | (#x16A0 #x16FF runic) | 1166 | (#x16A0 #x16FF runic) |
| 1167 | (#x1700 #x171F tagalog) | ||
| 1168 | (#x1720 #x173F hanunoo) | ||
| 1169 | (#x1740 #x175F buhid) | ||
| 1170 | (#x1760 #x177F tagbanwa) | ||
| 1157 | (#x1780 #x17FF khmer) | 1171 | (#x1780 #x17FF khmer) |
| 1158 | (#x1800 #x18AF mongolian) | 1172 | (#x1800 #x18AF mongolian) |
| 1159 | (#x1D00 #x1DFF phonetic) | 1173 | (#x18B0 #x18FF canadian-aboriginal) |
| 1160 | (#x1E00 #x1EFF latin) | 1174 | (#x1900 #x194F limbu) |
| 1175 | (#x1950 #x197F tai-le) | ||
| 1176 | (#x1980 #x19DF tai-lue) | ||
| 1177 | (#x19E0 #x19FF khmer) | ||
| 1178 | (#x1A00 #x1A00 buginese) | ||
| 1179 | (#x1A20 #x1AAF tai-tham) | ||
| 1180 | (#x1B00 #x1B7F balinese) | ||
| 1181 | (#x1B80 #x1BBF sundanese) | ||
| 1182 | (#x1BC0 #x1BFF batak) | ||
| 1183 | (#x1C00 #x1C4F lepcha) | ||
| 1184 | (#x1C50 #x1C7F ol-chiki) | ||
| 1185 | (#x1CC0 #x1CCF sundanese) | ||
| 1186 | (#x1CD0 #x1CFF vedic) | ||
| 1187 | (#x1D00 #x1DBF phonetic) | ||
| 1188 | (#x1DC0 #x1EFF latin) | ||
| 1161 | (#x1F00 #x1FFF greek) | 1189 | (#x1F00 #x1FFF greek) |
| 1162 | (#x2000 #x27FF symbol) | 1190 | (#x2000 #x27FF symbol) |
| 1163 | (#x2800 #x28FF braille) | 1191 | (#x2800 #x28FF braille) |
| 1192 | (#x2900 #x2BFF symbol) | ||
| 1193 | (#x2C00 #x2C5F glagolitic) | ||
| 1194 | (#x2C60 #x2C7F latin) | ||
| 1195 | (#x2C80 #x2CFF coptic) | ||
| 1196 | (#x2D00 #x2D2F georgian) | ||
| 1197 | (#x2D30 #x2D7F tifinagh) | ||
| 1164 | (#x2D80 #x2DDF ethiopic) | 1198 | (#x2D80 #x2DDF ethiopic) |
| 1199 | (#x2DE0 #x2DFF cyrillic) | ||
| 1200 | (#x2E00 #x2E7F symbol) | ||
| 1165 | (#x2E80 #x2FDF han) | 1201 | (#x2E80 #x2FDF han) |
| 1166 | (#x2FF0 #x2FFF ideographic-description) | 1202 | (#x2FF0 #x2FFF ideographic-description) |
| 1167 | (#x3000 #x303F cjk-misc) | 1203 | (#x3000 #x303F cjk-misc) |
| @@ -1170,47 +1206,92 @@ Setup char-width-table appropriate for non-CJK language environment." | |||
| 1170 | (#x3130 #x318F hangul) | 1206 | (#x3130 #x318F hangul) |
| 1171 | (#x3190 #x319F kanbun) | 1207 | (#x3190 #x319F kanbun) |
| 1172 | (#x31A0 #x31BF bopomofo) | 1208 | (#x31A0 #x31BF bopomofo) |
| 1173 | (#x3400 #x9FAF han) | 1209 | (#x31C0 #x31EF cjk-misc) |
| 1210 | (#x31F0 #x31FF kana) | ||
| 1211 | (#x3200 #x9FAF han) | ||
| 1174 | (#xA000 #xA4CF yi) | 1212 | (#xA000 #xA4CF yi) |
| 1213 | (#xA4D0 #xA4FF lisu) | ||
| 1214 | (#xA500 #xA63F vai) | ||
| 1215 | (#xA640 #xA69F cyrillic) | ||
| 1216 | (#xA6A0 #xA6FF bamum) | ||
| 1217 | (#xA700 #xA7FF latin) | ||
| 1218 | (#xA800 #xA82F syloti-nagri) | ||
| 1219 | (#xA830 #xA83F north-indic-number) | ||
| 1220 | (#xA840 #xA87F phags-pa) | ||
| 1221 | (#xA880 #xA8DF saurashtra) | ||
| 1222 | (#xA8E0 #xA8FF devanagari) | ||
| 1223 | (#xA900 #xA92F kayah-li) | ||
| 1224 | (#xA930 #xA95F rejang) | ||
| 1225 | (#xA960 #xA97F hangul) | ||
| 1226 | (#xA980 #xA9DF javanese) | ||
| 1175 | (#xAA00 #xAA5F cham) | 1227 | (#xAA00 #xAA5F cham) |
| 1176 | (#xAA60 #xAA7B burmese) | 1228 | (#xAA60 #xAA7B burmese) ; Unicode 6.1: "myanmar" |
| 1177 | (#xAA80 #xAADF tai-viet) | 1229 | (#xAA80 #xAADF tai-viet) |
| 1178 | (#xAC00 #xD7AF hangul) | 1230 | (#xAAE0 #xAAFF meetei-mayek) |
| 1231 | (#xAB00 #xAB2F ethiopic) | ||
| 1232 | (#xABC0 #xABFF meetei-mayek) | ||
| 1233 | (#xAC00 #xD7FF hangul) | ||
| 1179 | (#xF900 #xFAFF han) | 1234 | (#xF900 #xFAFF han) |
| 1180 | (#xFB1D #xFB4F hebrew) | 1235 | (#xFB1D #xFB4F hebrew) |
| 1181 | (#xFB50 #xFDFF arabic) | 1236 | (#xFB50 #xFDFF arabic) |
| 1182 | (#xFE70 #xFEFC arabic) | 1237 | (#xFE30 #xFE4F han) |
| 1238 | (#xFE70 #xFEFF arabic) | ||
| 1183 | (#xFF00 #xFF5F cjk-misc) | 1239 | (#xFF00 #xFF5F cjk-misc) |
| 1184 | (#xFF61 #xFF9F kana) | 1240 | (#xFF61 #xFF9F kana) |
| 1185 | (#xFFE0 #xFFE6 cjk-misc) | 1241 | (#xFFE0 #xFFE6 cjk-misc) |
| 1186 | (#x10000 #x100FF linear-b) | 1242 | (#x10000 #x100FF linear-b) |
| 1187 | (#x10100 #x1013F aegean-number) | 1243 | (#x10100 #x1013F aegean-number) |
| 1188 | (#x10140 #x1018A ancient-greek-number) | 1244 | (#x10140 #x1018F ancient-greek-number) |
| 1189 | (#x10190 #x1019B ancient-symbol) | 1245 | (#x10190 #x101CF ancient-symbol) |
| 1190 | (#x101D0 #x101FF phaistos-disc) | 1246 | (#x101D0 #x101FF phaistos-disc) |
| 1191 | (#x10280 #x1029F lycian) | 1247 | (#x10280 #x1029F lycian) |
| 1192 | (#x102A0 #x102DF carian) | 1248 | (#x102A0 #x102DF carian) |
| 1193 | (#x10300 #x1032F olt-italic) | 1249 | (#x10300 #x1032F olt-italic) |
| 1250 | (#x10330 #x1034F gothic) | ||
| 1194 | (#x10380 #x1039F ugaritic) | 1251 | (#x10380 #x1039F ugaritic) |
| 1195 | (#x103A0 #x103DF old-persian) | 1252 | (#x103A0 #x103DF old-persian) |
| 1196 | (#x10400 #x1044F deseret) | 1253 | (#x10400 #x1044F deseret) |
| 1197 | (#x10450 #x1047F shavian) | 1254 | (#x10450 #x1047F shavian) |
| 1198 | (#x10480 #x104AF osmanya) | 1255 | (#x10480 #x104AF osmanya) |
| 1199 | (#x10800 #x1083F cypriot-syllabary) | 1256 | (#x10800 #x1083F cypriot-syllabary) |
| 1257 | (#x10840 #x1085F aramaic) | ||
| 1200 | (#x10900 #x1091F phoenician) | 1258 | (#x10900 #x1091F phoenician) |
| 1201 | (#x10920 #x1093F lydian) | 1259 | (#x10920 #x1093F lydian) |
| 1260 | (#x10980 #x109FF meroitic) | ||
| 1202 | (#x10A00 #x10A5F kharoshthi) | 1261 | (#x10A00 #x10A5F kharoshthi) |
| 1262 | (#x10A60 #x10A7F old-south-arabian) | ||
| 1263 | (#x10B00 #x10B3F avestan) | ||
| 1264 | (#x10B40 #x10B5F inscriptional-parthian) | ||
| 1265 | (#x10B60 #x10B7F inscriptional-pahlavi) | ||
| 1266 | (#x10C00 #x10C4F old-turkic) | ||
| 1267 | (#x10E60 #x10E7F rumi-number) | ||
| 1268 | (#x11000 #x1107F brahmi) | ||
| 1269 | (#x11080 #x110CF kaithi) | ||
| 1270 | (#x110D0 #x110FF sora-sompeng) | ||
| 1271 | (#x11100 #x1114F chakma) | ||
| 1272 | (#x11180 #x111DF sharada) | ||
| 1273 | (#x11680 #x116CF takri) | ||
| 1203 | (#x12000 #x123FF cuneiform) | 1274 | (#x12000 #x123FF cuneiform) |
| 1204 | (#x12400 #x1247F cuneiform-numbers-and-punctuation) | 1275 | (#x12400 #x1247F cuneiform-numbers-and-punctuation) |
| 1276 | (#x13000 #x1342F egyptian) | ||
| 1277 | (#x16800 #x16A3F bamum) | ||
| 1278 | (#x16F00 #x16F9F miao) | ||
| 1279 | (#x1B000 #x1B0FF kana) | ||
| 1205 | (#x1D000 #x1D0FF byzantine-musical-symbol) | 1280 | (#x1D000 #x1D0FF byzantine-musical-symbol) |
| 1206 | (#x1D100 #x1D1FF musical-symbol) | 1281 | (#x1D100 #x1D1FF musical-symbol) |
| 1207 | (#x1D200 #x1D24F ancient-greek-musical-notation) | 1282 | (#x1D200 #x1D24F ancient-greek-musical-notation) |
| 1208 | (#x1D300 #x1D35F tai-xuan-jing-symbol) | 1283 | (#x1D300 #x1D35F tai-xuan-jing-symbol) |
| 1209 | (#x1D360 #x1D37F counting-rod-numeral) | 1284 | (#x1D360 #x1D37F counting-rod-numeral) |
| 1210 | (#x1D400 #x1D7FF mathematical) | 1285 | (#x1D400 #x1D7FF mathematical) |
| 1286 | (#x1EE00 #x1EEFF arabic) | ||
| 1211 | (#x1F000 #x1F02F mahjong-tile) | 1287 | (#x1F000 #x1F02F mahjong-tile) |
| 1212 | (#x1F030 #x1F09F domino-tile) | 1288 | (#x1F030 #x1F09F domino-tile) |
| 1213 | (#x20000 #x2AFFF han) | 1289 | (#x1F0A0 #x1F0FF playing-cards) |
| 1290 | (#x1F100 #x1F1FF symbol) | ||
| 1291 | (#x1F200 #x1F2FF han) | ||
| 1292 | (#x1F300 #x1F64F symbol) | ||
| 1293 | (#x1F680 #x1F77F symbol) | ||
| 1294 | (#x20000 #x2B81F han) | ||
| 1214 | (#x2F800 #x2FFFF han))) | 1295 | (#x2F800 #x2FFFF han))) |
| 1215 | (set-char-table-range char-script-table | 1296 | (set-char-table-range char-script-table |
| 1216 | (cons (car elt) (nth 1 elt)) (nth 2 elt)) | 1297 | (cons (car elt) (nth 1 elt)) (nth 2 elt)) |