Update Unicode data files to version 11.0.0 of Unicode

* admin/unidata/UnicodeData.txt:
* admin/unidata/SpecialCasing.txt:
* admin/unidata/NormalizationTest.txt:
* admin/unidata/copyright.html:
* admin/unidata/BidiMirroring.txt:
* admin/unidata/BidiBrackets.txt: Import from Unicode 11.0.
* admin/notes/unicode: Update the URL for OTF script tags.
* lisp/international/mule-cmds.el (ucs-names): Update unused ranges.
* lisp/international/fontset.el (script-representative-chars): Add
hanifi-rohingya, old-sogdian, sogdian, dogra, gunjala-gondi, makasar,
and medefaidrin.
(otf-script-alist): Add old-hungarian.
* lisp/international/characters.el (tbl): Add syntax entries for
Supplemental Mathematical Operators, Miscellaneous Symbols and Arrows,
and Supplemental Punctuation. Update the list of wide characters.
* test/lisp/international/ucs-normalize-tests.el
(ucs-normalize-tests--failing-lines-part2): Update to match
admin/unidata/NormalizationTest.txt.
* doc/lispref/nonascii.texi (Character Properties): Update the
reference to the Unicode Standard.
* doc/misc/efaq.texi (New in Emacs 26):
* etc/NEWS: Mention compatibility with Unicode 11.0.
author: Eli Zaretskii 2018-06-09 15:41:21 +0300
committer: Eli Zaretskii 2018-06-09 15:41:21 +0300
commit: 36bbdfc017a6c37873cc0cb54bb966e3e3185012 (patch)
tree: 20d5d888bb81f70f838de1646561790a66865365 /lisp
parent: b7b7a5f4f3b7e5e7cf830b2531ee48d0c58536ba (diff)
download: emacs-36bbdfc017a6c37873cc0cb54bb966e3e3185012.tar.gz emacs-36bbdfc017a6c37873cc0cb54bb966e3e3185012.zip
3 files changed, 40 insertions, 11 deletions
diff --git a/lisp/international/characters.el b/lisp/international/characters.el
index 160de16eb57..23d9df686a5 100644
--- a/lisp/international/characters.el
+++ b/lisp/international/characters.el
@@ -643,12 +643,24 @@ with L, LRE, or LRO Unicode bidi character type.")
    (setq c (1+ c)))
  ;; Circled Latin
-  (setq c #x24b6)
+  (setq c #x24B6)
-  (while (<= c #x24cf)
+  (while (<= c #x24CF)
    (modify-category-entry c ?l)
    (modify-category-entry (+ c 26) ?l)
    (setq c (1+ c)))
+  ;; Supplemental Mathematical Operators
+  (setq c #x2A00)
+  (while (<= c #x2AFF)
+    (set-case-syntax c "." tbl)
+    (setq c (1+ c)))
+  ;; Miscellaneous Symbols and Arrows
+  (setq c #x2B00)
+  (while (<= c #x2BFF)
+    (set-case-syntax c "." tbl)
+    (setq c (1+ c)))
  ;; Coptic
  ;; There's no Coptic category.  However, Coptic letters that are
  ;; part of the Greek block above get the Greek category, and those
@@ -656,6 +668,12 @@ with L, LRE, or LRO Unicode bidi character type.")
  ;; consistent about their category.
  (modify-category-entry '(#x2C80 . #x2CFF) ?g)
+  ;; Supplemental Punctuation
+  (setq c #x2E00)
+  (while (<= c #x2E7F)
+    (set-case-syntax c "." tbl)
+    (setq c (1+ c)))
  ;; Fullwidth Latin
  (setq c #xff21)
  (while (<= c #xff3a)
@@ -1200,7 +1218,7 @@ with L, LRE, or LRO Unicode bidi character type.")
           (#xFF01 . #xFF60)
           (#xFFE0 . #xFFE6)
           (#x16FE0 . #x16FE1)
-           (#x17000 . #x187EC)
+           (#x17000 . #x187F1)
           (#x18800 . #x18AF2)
           (#x1B000 . #x1B11E)
           (#x1B170 . #x1B2FB)
@@ -1233,13 +1251,16 @@ with L, LRE, or LRO Unicode bidi character type.")
           (#x1F6CC . #x1F6CC)
           (#x1F6D0 . #x1F6D2)
           (#x1F6EB . #x1F6EC)
-           (#x1F6F4 . #x1F6F8)
+           (#x1F6F4 . #x1F6F9)
           (#x1F910 . #x1F93E)
-           (#x1F940 . #x1F94C)
+           (#x1F940 . #x1F970)
-           (#x1F950 . #x1F96B)
+           (#x1F973 . #x1F976)
-           (#x1F980 . #x1F997)
+           (#x1F97A . #x1F97A)
-           (#x1F9C0 . #x1F9C0)
+           (#x1F97C . #x1F9A2)
-           (#x1F9D0 . #x1F9E6)
+           (#x1F9B0 . #x1F9B9)
+           (#x1F9C0 . #x1F9C2)
+           (#x1F9D0 . #x1F9FF)
+           (#x1FA60 . #x1FA6D)
           (#x20000 . #x2FFFF)
           (#x30000 . #x3FFFF))))
  (dolist (elt l)
diff --git a/lisp/international/fontset.el b/lisp/international/fontset.el
index 5c0189b0155..23db54a4a3b 100644
--- a/lisp/international/fontset.el
+++ b/lisp/international/fontset.el
@@ -219,6 +219,9 @@
        (lydian #x10920)
        (kharoshthi #x10A00)
        (manichaean #x10AC0)
+        (hanifi-rohingya #x10D00)
+        (old-sogdian #x10F00)
+        (sogdian #x10F30)
        (mahajani #x11150)
        (sinhala-archaic-number #x111E1)
        (khojki #x11200)
@@ -229,6 +232,7 @@
        (siddham #x11580)
        (modi #x11600)
        (takri #x11680)
+        (dogra #x11800)
        (warang-citi #x118A1)
        (zanabazar-square #x11A00)
        (soyombo #x11A50)
@@ -236,11 +240,14 @@
        (bhaiksuki #x11C00)
        (marchen #x11C72)
        (masaram-gondi #x11D00)
+        (gunjala-gondi #x11D60)
+        (makasar #x11EE0)
        (cuneiform #x12000)
        (cuneiform-numbers-and-punctuation #x12400)
        (mro #x16A40)
        (bassa-vah #x16AD0)
        (pahawh-hmong #x16B11)
+        (medefaidrin #x16E40)
        (tangut #x17000)
        (tangut-components #x18800)
        (nushu #x1B170)
@@ -257,7 +264,7 @@
 (defvar otf-script-alist)
-;; The below was synchronized with the latest Feb 25, 2016 version of
+;; The below was synchronized with the latest Jul 23, 2017 version of
 ;; https://www.microsoft.com/typography/otspec/scripttags.htm.
 (setq otf-script-alist
      '((adlm . adlam)
@@ -312,6 +319,7 @@
        (hano . hanunoo)
        (hatr . hatran)
        (hebr . hebrew)
+        (hung . old-hungarian)
        (phli . inscriptional-pahlavi)
        (prti . inscriptional-parthian)
        (java . javanese)
diff --git a/lisp/international/mule-cmds.el b/lisp/international/mule-cmds.el
index aeba954a3b2..333fe2aa917 100644
--- a/lisp/international/mule-cmds.el
+++ b/lisp/international/mule-cmds.el
@@ -2934,7 +2934,7 @@ on encoding."
               (#x4DC0 . #x4DFF)
               ;; (#x4E00 . #x9FFF) CJK Unified Ideographs
               (#xA000 . #xD7FF)
-               ;; (#xD800 . #xFAFF) Surrogate/Private
+               ;; (#xD800 . #xF8FF) Surrogate/Private
               (#xFB00 . #x134FF)
               ;; (#x13500 . #x143FF) unused
               (#x14400 . #x14646)
author	Eli Zaretskii	2018-06-09 15:41:21 +0300
committer	Eli Zaretskii	2018-06-09 15:41:21 +0300
commit	36bbdfc017a6c37873cc0cb54bb966e3e3185012 (patch)
tree	20d5d888bb81f70f838de1646561790a66865365 /lisp
parent	b7b7a5f4f3b7e5e7cf830b2531ee48d0c58536ba (diff)
download	emacs-36bbdfc017a6c37873cc0cb54bb966e3e3185012.tar.gz emacs-36bbdfc017a6c37873cc0cb54bb966e3e3185012.zip