aboutsummaryrefslogtreecommitdiffstats
diff options
context:
space:
mode:
author: Eli Zaretskii, 2012-02-18 13:36:54 +0200
committer: Eli Zaretskii, 2012-02-18 13:36:54 +0200
commit: 57939ff41e57b4e24c00aa875046d103b46e066c (patch)
tree: 89e8c93de342fde230e04edf40a67a342eed07b0
parent: 0c23686e58f426f1a94831b0453ddcaa46746f77 (diff)
download: emacs-57939ff41e57b4e24c00aa875046d103b46e066c.tar.gz
emacs-57939ff41e57b4e24c00aa875046d103b46e066c.zip
Update char-script-table from the latest Unicode Database.
lisp/international/characters.el (script-list): Sync with the latest Unicode Character Database.
-rw-r--r-- lisp/ChangeLog 5
-rw-r--r-- lisp/international/characters.el 109
2 files changed, 100 insertions, 14 deletions
diff --git a/lisp/ChangeLog b/lisp/ChangeLog
index 14e2596e43d..1980d18d3b4 100644
--- a/lisp/ChangeLog
+++ b/lisp/ChangeLog
@@ -1,3 +1,8 @@
1 2012-02-18 Eli Zaretskii <eliz@gnu.org>
2
3 * international/characters.el (script-list): Sync with the latest
4 Unicode Character Database.
5
1 2012-02-18 Andreas Schwab <schwab@linux-m68k.org> 6 2012-02-18 Andreas Schwab <schwab@linux-m68k.org>
2 7
3 * international/titdic-cnv.el: Remove duplicate coding tag. 8 * international/titdic-cnv.el: Remove duplicate coding tag.
diff --git a/lisp/international/characters.el b/lisp/international/characters.el
index 4b8ed3e21e2..ba8b8955fba 100644
--- a/lisp/international/characters.el
+++ b/lisp/international/characters.el
@@ -1114,6 +1114,12 @@ Setup char-width-table appropriate for non-CJK language environment."
1114 1114
1115;; Setting char-script-table. 1115;; Setting char-script-table.
1116 1116
1117;; The data is compiled from Blocks.txt and Scripts.txt in the
1118;; "Unicode Character Database", simplified to lump together all the
1119;; blocks belonging to the same language. E.g., "Basic Latin",
1120;; "Latin-1 Supplement", "Latin Extended-A", etc. are all lumped
1121;; together under "latin".
1122;;
1117;; The Unicode blocks actually extend past some of these ranges with 1123;; The Unicode blocks actually extend past some of these ranges with
1118;; undefined codepoints. 1124;; undefined codepoints.
1119(let ((script-list nil)) 1125(let ((script-list nil))
@@ -1126,13 +1132,17 @@ Setup char-width-table appropriate for non-CJK language environment."
1126 (#x0370 #x03E1 greek) 1132 (#x0370 #x03E1 greek)
1127 (#x03E2 #x03EF coptic) 1133 (#x03E2 #x03EF coptic)
1128 (#x03F0 #x03F3 greek) 1134 (#x03F0 #x03F3 greek)
1129 (#x0400 #x04FF cyrillic) 1135 (#x0400 #x052F cyrillic)
1130 (#x0530 #x058F armenian) 1136 (#x0530 #x058F armenian)
1131 (#x0590 #x05FF hebrew) 1137 (#x0590 #x05FF hebrew)
1132 (#x0600 #x06FF arabic) 1138 (#x0600 #x06FF arabic)
1133 (#x0700 #x074F syriac) 1139 (#x0700 #x074F syriac)
1134 (#x07C0 #x07FA nko) 1140 (#x0750 #x077F arabic)
1135 (#x0780 #x07BF thaana) 1141 (#x0780 #x07BF thaana)
1142 (#x07C0 #x07FF nko)
1143 (#x0800 #x083F samaritan)
1144 (#x0840 #x085F mandaic)
1145 (#x08A0 #x08FF arabic)
1136 (#x0900 #x097F devanagari) 1146 (#x0900 #x097F devanagari)
1137 (#x0980 #x09FF bengali) 1147 (#x0980 #x09FF bengali)
1138 (#x0A00 #x0A7F gurmukhi) 1148 (#x0A00 #x0A7F gurmukhi)
@@ -1143,10 +1153,10 @@ Setup char-width-table appropriate for non-CJK language environment."
1143 (#x0C80 #x0CFF kannada) 1153 (#x0C80 #x0CFF kannada)
1144 (#x0D00 #x0D7F malayalam) 1154 (#x0D00 #x0D7F malayalam)
1145 (#x0D80 #x0DFF sinhala) 1155 (#x0D80 #x0DFF sinhala)
1146 (#x0E00 #x0E5F thai) 1156 (#x0E00 #x0E7F thai)
1147 (#x0E80 #x0EDF lao) 1157 (#x0E80 #x0EFF lao)
1148 (#x0F00 #x0FFF tibetan) 1158 (#x0F00 #x0FFF tibetan)
1149 (#x1000 #x109F burmese) 1159 (#x1000 #x109F burmese) ; according to Unicode 6.1, should be "myanmar"
1150 (#x10A0 #x10FF georgian) 1160 (#x10A0 #x10FF georgian)
1151 (#x1100 #x11FF hangul) 1161 (#x1100 #x11FF hangul)
1152 (#x1200 #x139F ethiopic) 1162 (#x1200 #x139F ethiopic)
@@ -1154,14 +1164,40 @@ Setup char-width-table appropriate for non-CJK language environment."
1154 (#x1400 #x167F canadian-aboriginal) 1164 (#x1400 #x167F canadian-aboriginal)
1155 (#x1680 #x169F ogham) 1165 (#x1680 #x169F ogham)
1156 (#x16A0 #x16FF runic) 1166 (#x16A0 #x16FF runic)
1167 (#x1700 #x171F tagalog)
1168 (#x1720 #x173F hanunoo)
1169 (#x1740 #x175F buhid)
1170 (#x1760 #x177F tagbanwa)
1157 (#x1780 #x17FF khmer) 1171 (#x1780 #x17FF khmer)
1158 (#x1800 #x18AF mongolian) 1172 (#x1800 #x18AF mongolian)
1159 (#x1D00 #x1DFF phonetic) 1173 (#x18B0 #x18FF canadian-aboriginal)
1160 (#x1E00 #x1EFF latin) 1174 (#x1900 #x194F limbu)
1175 (#x1950 #x197F tai-le)
1176 (#x1980 #x19DF tai-lue)
1177 (#x19E0 #x19FF khmer)
1178 (#x1A00 #x1A1F buginese)
1179 (#x1A20 #x1AAF tai-tham)
1180 (#x1B00 #x1B7F balinese)
1181 (#x1B80 #x1BBF sundanese)
1182 (#x1BC0 #x1BFF batak)
1183 (#x1C00 #x1C4F lepcha)
1184 (#x1C50 #x1C7F ol-chiki)
1185 (#x1CC0 #x1CCF sundanese)
1186 (#x1CD0 #x1CFF vedic)
1187 (#x1D00 #x1DBF phonetic)
1188 (#x1DC0 #x1EFF latin)
1161 (#x1F00 #x1FFF greek) 1189 (#x1F00 #x1FFF greek)
1162 (#x2000 #x27FF symbol) 1190 (#x2000 #x27FF symbol)
1163 (#x2800 #x28FF braille) 1191 (#x2800 #x28FF braille)
1192 (#x2900 #x2BFF symbol)
1193 (#x2C00 #x2C5F glagolitic)
1194 (#x2C60 #x2C7F latin)
1195 (#x2C80 #x2CFF coptic)
1196 (#x2D00 #x2D2F georgian)
1197 (#x2D30 #x2D7F tifinagh)
1164 (#x2D80 #x2DDF ethiopic) 1198 (#x2D80 #x2DDF ethiopic)
1199 (#x2DE0 #x2DFF cyrillic)
1200 (#x2E00 #x2E7F symbol)
1165 (#x2E80 #x2FDF han) 1201 (#x2E80 #x2FDF han)
1166 (#x2FF0 #x2FFF ideographic-description) 1202 (#x2FF0 #x2FFF ideographic-description)
1167 (#x3000 #x303F cjk-misc) 1203 (#x3000 #x303F cjk-misc)
@@ -1170,47 +1206,92 @@ Setup char-width-table appropriate for non-CJK language environment."
1170 (#x3130 #x318F hangul) 1206 (#x3130 #x318F hangul)
1171 (#x3190 #x319F kanbun) 1207 (#x3190 #x319F kanbun)
1172 (#x31A0 #x31BF bopomofo) 1208 (#x31A0 #x31BF bopomofo)
1173 (#x3400 #x9FAF han) 1209 (#x31C0 #x31EF cjk-misc)
1210 (#x31F0 #x31FF kana)
1211 (#x3200 #x9FAF han)
1174 (#xA000 #xA4CF yi) 1212 (#xA000 #xA4CF yi)
1213 (#xA4D0 #xA4FF lisu)
1214 (#xA500 #xA63F vai)
1215 (#xA640 #xA69F cyrillic)
1216 (#xA6A0 #xA6FF bamum)
1217 (#xA700 #xA7FF latin)
1218 (#xA800 #xA82F syloti-nagri)
1219 (#xA830 #xA83F north-indic-number)
1220 (#xA840 #xA87F phags-pa)
1221 (#xA880 #xA8DF saurashtra)
1222 (#xA8E0 #xA8FF devanagari)
1223 (#xA900 #xA92F kayah-li)
1224 (#xA930 #xA95F rejang)
1225 (#xA960 #xA97F hangul)
1226 (#xA980 #xA9DF javanese)
1175 (#xAA00 #xAA5F cham) 1227 (#xAA00 #xAA5F cham)
1176 (#xAA60 #xAA7B burmese) 1228 (#xAA60 #xAA7B burmese) ; Unicode 6.1: "myanmar"
1177 (#xAA80 #xAADF tai-viet) 1229 (#xAA80 #xAADF tai-viet)
1178 (#xAC00 #xD7AF hangul) 1230 (#xAAE0 #xAAFF meetei-mayek)
1231 (#xAB00 #xAB2F ethiopic)
1232 (#xABC0 #xABFF meetei-mayek)
1233 (#xAC00 #xD7FF hangul)
1179 (#xF900 #xFAFF han) 1234 (#xF900 #xFAFF han)
1180 (#xFB1D #xFB4F hebrew) 1235 (#xFB1D #xFB4F hebrew)
1181 (#xFB50 #xFDFF arabic) 1236 (#xFB50 #xFDFF arabic)
1182 (#xFE70 #xFEFC arabic) 1237 (#xFE30 #xFE4F han)
1238 (#xFE70 #xFEFF arabic)
1183 (#xFF00 #xFF5F cjk-misc) 1239 (#xFF00 #xFF5F cjk-misc)
1184 (#xFF61 #xFF9F kana) 1240 (#xFF61 #xFF9F kana)
1185 (#xFFE0 #xFFE6 cjk-misc) 1241 (#xFFE0 #xFFE6 cjk-misc)
1186 (#x10000 #x100FF linear-b) 1242 (#x10000 #x100FF linear-b)
1187 (#x10100 #x1013F aegean-number) 1243 (#x10100 #x1013F aegean-number)
1188 (#x10140 #x1018A ancient-greek-number) 1244 (#x10140 #x1018F ancient-greek-number)
1189 (#x10190 #x1019B ancient-symbol) 1245 (#x10190 #x101CF ancient-symbol)
1190 (#x101D0 #x101FF phaistos-disc) 1246 (#x101D0 #x101FF phaistos-disc)
1191 (#x10280 #x1029F lycian) 1247 (#x10280 #x1029F lycian)
1192 (#x102A0 #x102DF carian) 1248 (#x102A0 #x102DF carian)
1193 (#x10300 #x1032F olt-italic) 1249 (#x10300 #x1032F olt-italic)
1250 (#x10330 #x1034F gothic)
1194 (#x10380 #x1039F ugaritic) 1251 (#x10380 #x1039F ugaritic)
1195 (#x103A0 #x103DF old-persian) 1252 (#x103A0 #x103DF old-persian)
1196 (#x10400 #x1044F deseret) 1253 (#x10400 #x1044F deseret)
1197 (#x10450 #x1047F shavian) 1254 (#x10450 #x1047F shavian)
1198 (#x10480 #x104AF osmanya) 1255 (#x10480 #x104AF osmanya)
1199 (#x10800 #x1083F cypriot-syllabary) 1256 (#x10800 #x1083F cypriot-syllabary)
1257 (#x10840 #x1085F aramaic)
1200 (#x10900 #x1091F phoenician) 1258 (#x10900 #x1091F phoenician)
1201 (#x10920 #x1093F lydian) 1259 (#x10920 #x1093F lydian)
1260 (#x10980 #x109FF meroitic)
1202 (#x10A00 #x10A5F kharoshthi) 1261 (#x10A00 #x10A5F kharoshthi)
1262 (#x10A60 #x10A7F old-south-arabian)
1263 (#x10B00 #x10B3F avestan)
1264 (#x10B40 #x10B5F inscriptional-parthian)
1265 (#x10B60 #x10B7F inscriptional-pahlavi)
1266 (#x10C00 #x10C4F old-turkic)
1267 (#x10E60 #x10E7F rumi-number)
1268 (#x11000 #x1107F brahmi)
1269 (#x11080 #x110CF kaithi)
1270 (#x110D0 #x110FF sora-sompeng)
1271 (#x11100 #x1114F chakma)
1272 (#x11180 #x111DF sharada)
1273 (#x11680 #x116CF takri)
1203 (#x12000 #x123FF cuneiform) 1274 (#x12000 #x123FF cuneiform)
1204 (#x12400 #x1247F cuneiform-numbers-and-punctuation) 1275 (#x12400 #x1247F cuneiform-numbers-and-punctuation)
1276 (#x13000 #x1342F egyptian)
1277 (#x16800 #x16A3F bamum)
1278 (#x16F00 #x16F9F miao)
1279 (#x1B000 #x1B0FF kana)
1205 (#x1D000 #x1D0FF byzantine-musical-symbol) 1280 (#x1D000 #x1D0FF byzantine-musical-symbol)
1206 (#x1D100 #x1D1FF musical-symbol) 1281 (#x1D100 #x1D1FF musical-symbol)
1207 (#x1D200 #x1D24F ancient-greek-musical-notation) 1282 (#x1D200 #x1D24F ancient-greek-musical-notation)
1208 (#x1D300 #x1D35F tai-xuan-jing-symbol) 1283 (#x1D300 #x1D35F tai-xuan-jing-symbol)
1209 (#x1D360 #x1D37F counting-rod-numeral) 1284 (#x1D360 #x1D37F counting-rod-numeral)
1210 (#x1D400 #x1D7FF mathematical) 1285 (#x1D400 #x1D7FF mathematical)
1286 (#x1EE00 #x1EEFF arabic)
1211 (#x1F000 #x1F02F mahjong-tile) 1287 (#x1F000 #x1F02F mahjong-tile)
1212 (#x1F030 #x1F09F domino-tile) 1288 (#x1F030 #x1F09F domino-tile)
1213 (#x20000 #x2AFFF han) 1289 (#x1F0A0 #x1F0FF playing-cards)
1290 (#x1F100 #x1F1FF symbol)
1291 (#x1F200 #x1F2FF han)
1292 (#x1F300 #x1F64F symbol)
1293 (#x1F680 #x1F77F symbol)
1294 (#x20000 #x2B81F han)
1214 (#x2F800 #x2FFFF han))) 1295 (#x2F800 #x2FFFF han)))
1215 (set-char-table-range char-script-table 1296 (set-char-table-range char-script-table
1216 (cons (car elt) (nth 1 elt)) (nth 2 elt)) 1297 (cons (car elt) (nth 1 elt)) (nth 2 elt))