about | summary | refs | log | tree | commit | diff | stats
path: root/lisp
diff options
context:
space:
mode:
author: Eli Zaretskii, 2018-06-09 15:41:21 +0300
committer: Eli Zaretskii, 2018-06-09 15:41:21 +0300
commit: 36bbdfc017a6c37873cc0cb54bb966e3e3185012 (patch)
tree: 20d5d888bb81f70f838de1646561790a66865365 /lisp
parent: b7b7a5f4f3b7e5e7cf830b2531ee48d0c58536ba (diff)
download: emacs-36bbdfc017a6c37873cc0cb54bb966e3e3185012.tar.gz
          emacs-36bbdfc017a6c37873cc0cb54bb966e3e3185012.zip
Update Unicode data files to version 11.0.0 of Unicode
* admin/unidata/UnicodeData.txt:
* admin/unidata/SpecialCasing.txt:
* admin/unidata/NormalizationTest.txt:
* admin/unidata/copyright.html:
* admin/unidata/BidiMirroring.txt:
* admin/unidata/BidiBrackets.txt: Import from Unicode 11.0.
* admin/notes/unicode: Update the URL for OTF script tags.
* lisp/international/mule-cmds.el (ucs-names): Update unused ranges.
* lisp/international/fontset.el (script-representative-chars): Add
hanifi-rohingya, old-sogdian, sogdian, dogra, gunjala-gondi, makasar,
and medefaidrin.
(otf-script-alist): Add old-hungarian.
* lisp/international/characters.el (tbl): Add syntax entries for
Supplemental Mathematical Operators, Miscellaneous Symbols and Arrows,
and Supplemental Punctuation.  Update the list of wide characters.
* test/lisp/international/ucs-normalize-tests.el
(ucs-normalize-tests--failing-lines-part2): Update to match
admin/unidata/NormalizationTest.txt.
* doc/lispref/nonascii.texi (Character Properties): Update the
reference to the Unicode Standard.
* doc/misc/efaq.texi (New in Emacs 26):
* etc/NEWS: Mention compatibility with Unicode 11.0.
Diffstat (limited to 'lisp')
-rw-r--r--  lisp/international/characters.el  39
-rw-r--r--  lisp/international/fontset.el     10
-rw-r--r--  lisp/international/mule-cmds.el    2
3 files changed, 40 insertions, 11 deletions
diff --git a/lisp/international/characters.el b/lisp/international/characters.el
index 160de16eb57..23d9df686a5 100644
--- a/lisp/international/characters.el
+++ b/lisp/international/characters.el
@@ -643,12 +643,24 @@ with L, LRE, or LRO Unicode bidi character type.")
643 (setq c (1+ c))) 643 (setq c (1+ c)))
644 644
645 ;; Circled Latin 645 ;; Circled Latin
646 (setq c #x24b6) 646 (setq c #x24B6)
647 (while (<= c #x24cf) 647 (while (<= c #x24CF)
648 (modify-category-entry c ?l) 648 (modify-category-entry c ?l)
649 (modify-category-entry (+ c 26) ?l) 649 (modify-category-entry (+ c 26) ?l)
650 (setq c (1+ c))) 650 (setq c (1+ c)))
651 651
652 ;; Supplemental Mathematical Operators
653 (setq c #x2A00)
654 (while (<= c #x2AFF)
655 (set-case-syntax c "." tbl)
656 (setq c (1+ c)))
657
658 ;; Miscellaneous Symbols and Arrows
659 (setq c #x2B00)
660 (while (<= c #x2BFF)
661 (set-case-syntax c "." tbl)
662 (setq c (1+ c)))
663
652 ;; Coptic 664 ;; Coptic
653 ;; There's no Coptic category. However, Coptic letters that are 665 ;; There's no Coptic category. However, Coptic letters that are
654 ;; part of the Greek block above get the Greek category, and those 666 ;; part of the Greek block above get the Greek category, and those
@@ -656,6 +668,12 @@ with L, LRE, or LRO Unicode bidi character type.")
656 ;; consistent about their category. 668 ;; consistent about their category.
657 (modify-category-entry '(#x2C80 . #x2CFF) ?g) 669 (modify-category-entry '(#x2C80 . #x2CFF) ?g)
658 670
671 ;; Supplemental Punctuation
672 (setq c #x2E00)
673 (while (<= c #x2E7F)
674 (set-case-syntax c "." tbl)
675 (setq c (1+ c)))
676
659 ;; Fullwidth Latin 677 ;; Fullwidth Latin
660 (setq c #xff21) 678 (setq c #xff21)
661 (while (<= c #xff3a) 679 (while (<= c #xff3a)
@@ -1200,7 +1218,7 @@ with L, LRE, or LRO Unicode bidi character type.")
1200 (#xFF01 . #xFF60) 1218 (#xFF01 . #xFF60)
1201 (#xFFE0 . #xFFE6) 1219 (#xFFE0 . #xFFE6)
1202 (#x16FE0 . #x16FE1) 1220 (#x16FE0 . #x16FE1)
1203 (#x17000 . #x187EC) 1221 (#x17000 . #x187F1)
1204 (#x18800 . #x18AF2) 1222 (#x18800 . #x18AF2)
1205 (#x1B000 . #x1B11E) 1223 (#x1B000 . #x1B11E)
1206 (#x1B170 . #x1B2FB) 1224 (#x1B170 . #x1B2FB)
@@ -1233,13 +1251,16 @@ with L, LRE, or LRO Unicode bidi character type.")
1233 (#x1F6CC . #x1F6CC) 1251 (#x1F6CC . #x1F6CC)
1234 (#x1F6D0 . #x1F6D2) 1252 (#x1F6D0 . #x1F6D2)
1235 (#x1F6EB . #x1F6EC) 1253 (#x1F6EB . #x1F6EC)
1236 (#x1F6F4 . #x1F6F8) 1254 (#x1F6F4 . #x1F6F9)
1237 (#x1F910 . #x1F93E) 1255 (#x1F910 . #x1F93E)
1238 (#x1F940 . #x1F94C) 1256 (#x1F940 . #x1F970)
1239 (#x1F950 . #x1F96B) 1257 (#x1F973 . #x1F976)
1240 (#x1F980 . #x1F997) 1258 (#x1F97A . #x1F97A)
1241 (#x1F9C0 . #x1F9C0) 1259 (#x1F97C . #x1F9A2)
1242 (#x1F9D0 . #x1F9E6) 1260 (#x1F9B0 . #x1F9B9)
1261 (#x1F9C0 . #x1F9C2)
1262 (#x1F9D0 . #x1F9FF)
1263 (#x1FA60 . #x1FA6D)
1243 (#x20000 . #x2FFFF) 1264 (#x20000 . #x2FFFF)
1244 (#x30000 . #x3FFFF)))) 1265 (#x30000 . #x3FFFF))))
1245 (dolist (elt l) 1266 (dolist (elt l)
diff --git a/lisp/international/fontset.el b/lisp/international/fontset.el
index 5c0189b0155..23db54a4a3b 100644
--- a/lisp/international/fontset.el
+++ b/lisp/international/fontset.el
@@ -219,6 +219,9 @@
219 (lydian #x10920) 219 (lydian #x10920)
220 (kharoshthi #x10A00) 220 (kharoshthi #x10A00)
221 (manichaean #x10AC0) 221 (manichaean #x10AC0)
222 (hanifi-rohingya #x10D00)
223 (old-sogdian #x10F00)
224 (sogdian #x10F30)
222 (mahajani #x11150) 225 (mahajani #x11150)
223 (sinhala-archaic-number #x111E1) 226 (sinhala-archaic-number #x111E1)
224 (khojki #x11200) 227 (khojki #x11200)
@@ -229,6 +232,7 @@
229 (siddham #x11580) 232 (siddham #x11580)
230 (modi #x11600) 233 (modi #x11600)
231 (takri #x11680) 234 (takri #x11680)
235 (dogra #x11800)
232 (warang-citi #x118A1) 236 (warang-citi #x118A1)
233 (zanabazar-square #x11A00) 237 (zanabazar-square #x11A00)
234 (soyombo #x11A50) 238 (soyombo #x11A50)
@@ -236,11 +240,14 @@
236 (bhaiksuki #x11C00) 240 (bhaiksuki #x11C00)
237 (marchen #x11C72) 241 (marchen #x11C72)
238 (masaram-gondi #x11D00) 242 (masaram-gondi #x11D00)
243 (gunjala-gondi #x11D60)
244 (makasar #x11EE0)
239 (cuneiform #x12000) 245 (cuneiform #x12000)
240 (cuneiform-numbers-and-punctuation #x12400) 246 (cuneiform-numbers-and-punctuation #x12400)
241 (mro #x16A40) 247 (mro #x16A40)
242 (bassa-vah #x16AD0) 248 (bassa-vah #x16AD0)
243 (pahawh-hmong #x16B11) 249 (pahawh-hmong #x16B11)
250 (medefaidrin #x16E40)
244 (tangut #x17000) 251 (tangut #x17000)
245 (tangut-components #x18800) 252 (tangut-components #x18800)
246 (nushu #x1B170) 253 (nushu #x1B170)
@@ -257,7 +264,7 @@
257 264
258(defvar otf-script-alist) 265(defvar otf-script-alist)
259 266
260;; The below was synchronized with the latest Feb 25, 2016 version of 267;; The below was synchronized with the latest Jul 23, 2017 version of
261;; https://www.microsoft.com/typography/otspec/scripttags.htm. 268;; https://www.microsoft.com/typography/otspec/scripttags.htm.
262(setq otf-script-alist 269(setq otf-script-alist
263 '((adlm . adlam) 270 '((adlm . adlam)
@@ -312,6 +319,7 @@
312 (hano . hanunoo) 319 (hano . hanunoo)
313 (hatr . hatran) 320 (hatr . hatran)
314 (hebr . hebrew) 321 (hebr . hebrew)
322 (hung . old-hungarian)
315 (phli . inscriptional-pahlavi) 323 (phli . inscriptional-pahlavi)
316 (prti . inscriptional-parthian) 324 (prti . inscriptional-parthian)
317 (java . javanese) 325 (java . javanese)
diff --git a/lisp/international/mule-cmds.el b/lisp/international/mule-cmds.el
index aeba954a3b2..333fe2aa917 100644
--- a/lisp/international/mule-cmds.el
+++ b/lisp/international/mule-cmds.el
@@ -2934,7 +2934,7 @@ on encoding."
2934 (#x4DC0 . #x4DFF) 2934 (#x4DC0 . #x4DFF)
2935 ;; (#x4E00 . #x9FFF) CJK Unified Ideographs 2935 ;; (#x4E00 . #x9FFF) CJK Unified Ideographs
2936 (#xA000 . #xD7FF) 2936 (#xA000 . #xD7FF)
2937 ;; (#xD800 . #xFAFF) Surrogate/Private 2937 ;; (#xD800 . #xF8FF) Surrogate/Private
2938 (#xFB00 . #x134FF) 2938 (#xFB00 . #x134FF)
2939 ;; (#x13500 . #x143FF) unused 2939 ;; (#x13500 . #x143FF) unused
2940 (#x14400 . #x14646) 2940 (#x14400 . #x14646)