New directory

author: Kenichi Handa 2003-09-08 11:56:09 +0000
committer: Kenichi Handa 2003-09-08 11:56:09 +0000
commit: 463f5630a5e7cbe7f042bc1175d1fa1c4e98860f (patch)
tree: 3287d0c628fea2249abf4635b3a4f45bedd6f8c4 /admin/charsets/compact.awk
parent: 4256310de631bd57c78b88b5131caa073315b3d7 (diff)
download: emacs-463f5630a5e7cbe7f042bc1175d1fa1c4e98860f.tar.gz
emacs-463f5630a5e7cbe7f042bc1175d1fa1c4e98860f.zip
1 files changed, 123 insertions, 0 deletions
diff --git a/admin/charsets/compact.awk b/admin/charsets/compact.awk
new file mode 100644
index 00000000000..281e51ebc3b
--- /dev/null
+++ b/admin/charsets/compact.awk
@@ -0,0 +1,123 @@
+# compact.awk -- Make charset map compact.
+# Copyright (C) 2003
+#   National Institute of Advanced Industrial Science and Technology (AIST)
+#   Registration Number H13PRO009
+#
+# This file is part of GNU Emacs.
+#
+# GNU Emacs is free software; you can redistribute it and/or modify
+# it under the terms of the GNU General Public License as published by
+# the Free Software Foundation; either version 2, or (at your option)
+# any later version.
+#
+# GNU Emacs is distributed in the hope that it will be useful,
+# but WITHOUT ANY WARRANTY; without even the implied warranty of
+# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+# GNU General Public License for more details.
+#
+# You should have received a copy of the GNU General Public License
+# along with GNU Emacs; see the file COPYING.  If not, write to the
+# Free Software Foundation, Inc., 59 Temple Place - Suite 330,
+# Boston, MA 02111-1307, USA.
+# Comment:
+# Make a charset map compact by changing this kind of line sequence:
+#   0x00 0x0000
+#   0x01 0x0001
+#   ...
+#   0x7F 0x007F
+# to one line of this format:
+#   0x00-0x7F 0x0000
+BEGIN {
+  # tohex maps one hex digit character (either case for A-F) to its
+  # digit value plus one; decode_hex subtracts the one again.
+  tohex["0"] = 1;
+  tohex["1"] = 2;
+  tohex["2"] = 3;
+  tohex["3"] = 4;
+  tohex["4"] = 5;
+  tohex["5"] = 6;
+  tohex["6"] = 7;
+  tohex["7"] = 8;
+  tohex["8"] = 9;
+  tohex["9"] = 10;
+  tohex["A"] = tohex["a"] = 11;
+  tohex["B"] = tohex["b"] = 12;
+  tohex["C"] = tohex["c"] = 13;
+  tohex["D"] = tohex["d"] = 14;
+  tohex["E"] = tohex["e"] = 15;
+  tohex["F"] = tohex["f"] = 16;
+  # Pending run: codes from_code..to_code map to Unicode starting at
+  # from_unicode.  Both upper ends start at -1, so the run is empty and
+  # only a first entry of exactly 0x00 -> 0x0000 can extend it; starting
+  # to_unicode at 0 would absorb "0x00 0x0001" and print it as 0x0000.
+  from_code = 0;
+  to_code = -1;
+  from_unicode = 0;
+  to_unicode = -1;
+}
+# Return the value of the hex digits in STR starting at 1-based index IDX.
+function decode_hex(str, idx,    value, len, pos, ch) {  # names after idx are locals
+  value = 0;
+  len = length(str);
+  for (pos = idx; pos <= len; pos++)
+    {
+      ch = substr(str, pos, 1);
+      if (!(ch in tohex)) break;  # stop at the first non-hex character
+      value = value * 16 + tohex[ch] - 1;  # tohex holds digit value + 1
+    }
+  return value;
+}
+/^#/ {   # lines starting with "#" are copied through unchanged
+  print;
+  next;  # keep them away from the mapping rule below
+}
+{
+  code = decode_hex($1, 3);      # index 3 skips the "0x" prefix
+  unicode = decode_hex($2, 3);
+  if ((code != to_code + 1) || (unicode != to_unicode + 1))
+    {
+      # This entry does not continue the pending run: print the run,
+      # then start a new one at this entry.  Nothing is printed while
+      # from_code > to_code (the initial state set in BEGIN).
+      if (from_code == to_code)
+        {
+          if (to_code < 256)
+            printf "0x%02X 0x%04X\n", from_code, from_unicode;
+          else
+            printf "0x%04X 0x%04X\n", from_code, from_unicode;
+        }
+      else if (from_code < to_code)
+        {
+          if (to_code < 256)
+            printf "0x%02X-0x%02X 0x%04X\n", from_code, to_code, from_unicode;
+          else
+            printf "0x%04X-0x%04X 0x%04X\n", from_code, to_code, from_unicode;
+        }
+      from_code = to_code = code;
+      from_unicode = to_unicode = unicode;
+    }
+  else
+    { to_code++; to_unicode++; }   # entry extends the pending run by one
+}
+END {
+  # Print the run still pending after the last line.  With no data lines
+  # from_code (0) > to_code (-1), so nothing is printed.
+  if (from_code == to_code)
+    {
+      if (to_code < 256) printf "0x%02X 0x%04X\n", from_code, from_unicode;
+      else printf "0x%04X 0x%04X\n", from_code, from_unicode;
+    }
+  else if (from_code < to_code)
+    {
+      if (to_code < 256)
+        printf "0x%02X-0x%02X 0x%04X\n", from_code, to_code, from_unicode;
+      else
+        printf "0x%04X-0x%04X 0x%04X\n", from_code, to_code, from_unicode;
+    }
+}
author	Kenichi Handa	2003-09-08 11:56:09 +0000
committer	Kenichi Handa	2003-09-08 11:56:09 +0000
commit	463f5630a5e7cbe7f042bc1175d1fa1c4e98860f (patch)
tree	3287d0c628fea2249abf4635b3a4f45bedd6f8c4 /admin/charsets/compact.awk
parent	4256310de631bd57c78b88b5131caa073315b3d7 (diff)
download	emacs-463f5630a5e7cbe7f042bc1175d1fa1c4e98860f.tar.gz emacs-463f5630a5e7cbe7f042bc1175d1fa1c4e98860f.zip

diff --git a/admin/charsets/compact.awk b/admin/charsets/compact.awk new file mode 100644 index 00000000000..281e51ebc3b --- /dev/null +++ b/admin/charsets/compact.awk
@@ -0,0 +1,123 @@
	1	# compact.awk -- Make charset map compact.
	2	# Copyright (C) 2003
	3	# National Institute of Advanced Industrial Science and Technology (AIST)
	4	# Registration Number H13PRO009
	5	#
	6	# This file is part of GNU Emacs.
	7	#
	8	# GNU Emacs is free software; you can redistribute it and/or modify
	9	# it under the terms of the GNU General Public License as published by
	10	# the Free Software Foundation; either version 2, or (at your option)
	11	# any later version.
	12	#
	13	# GNU Emacs is distributed in the hope that it will be useful,
	14	# but WITHOUT ANY WARRANTY; without even the implied warranty of
	15	# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
	16	# GNU General Public License for more details.
	17	#
	18	# You should have received a copy of the GNU General Public License
	19	# along with GNU Emacs; see the file COPYING. If not, write to the
	20	# Free Software Foundation, Inc., 59 Temple Place - Suite 330,
	21	# Boston, MA 02111-1307, USA.
	22
	23	# Comment:
	24	# Make a charset map compact by changing this kind of line sequence:
	25	# 0x00 0x0000
	26	# 0x01 0x0001
	27	# ...
	28	# 0x7F 0x007F
	29	# to one line of this format:
	30	# 0x00-0x7F 0x0000
	31
	32	BEGIN {
	33	  # tohex maps one hex digit character (either case for A-F) to its
	34	  # digit value plus one; decode_hex subtracts the one again.
	35	  tohex["0"] = 1;
	36	  tohex["1"] = 2;
	37	  tohex["2"] = 3;
	38	  tohex["3"] = 4;
	39	  tohex["4"] = 5;
	40	  tohex["5"] = 6;
	41	  tohex["6"] = 7;
	42	  tohex["7"] = 8;
	43	  tohex["8"] = 9;
	44	  tohex["9"] = 10;
	45	  tohex["A"] = tohex["a"] = 11;
	46	  tohex["B"] = tohex["b"] = 12;
	47	  tohex["C"] = tohex["c"] = 13;
	48	  tohex["D"] = tohex["d"] = 14;
	49	  tohex["E"] = tohex["e"] = 15;
	50	  tohex["F"] = tohex["f"] = 16;
	51	  # Pending run: codes from_code..to_code map to Unicode starting at
	52	  # from_unicode.  Both upper ends start at -1, so the run is empty and
	53	  # only a first entry of exactly 0x00 -> 0x0000 can extend it; starting
	54	  # to_unicode at 0 would absorb "0x00 0x0001" and print it as 0x0000.
	55	  from_code = 0;
	56	  to_code = -1;
	57	  from_unicode = 0;
	58	  to_unicode = -1;
	59	}
	60
	61	# Return the value of the hex digits in STR starting at 1-based index IDX.
	62	function decode_hex(str, idx,    value, len, pos, ch) {  # names after idx are locals
	63	  value = 0;
	64	  len = length(str);
	65	  for (pos = idx; pos <= len; pos++)
	66	    {
	67	      ch = substr(str, pos, 1);
	68	      if (!(ch in tohex)) break;  # stop at the first non-hex character
	69	      value = value * 16 + tohex[ch] - 1;  # tohex holds digit value + 1
	70	    }
	71	  return value;
	72	}
	73
	74	/^#/ {   # lines starting with "#" are copied through unchanged
	75	  print;
	76	  next;  # keep them away from the mapping rule below
	77	}
	78
	79	{
	80	  code = decode_hex($1, 3);      # index 3 skips the "0x" prefix
	81	  unicode = decode_hex($2, 3);
	82	  if ((code != to_code + 1) || (unicode != to_unicode + 1))
	83	    {
	84	      # This entry does not continue the pending run: print the run,
	85	      # then start a new one at this entry.  Nothing is printed while
	86	      # from_code > to_code (the initial state set in BEGIN).
	87	      if (from_code == to_code)
	88	        {
	89	          if (to_code < 256)
	90	            printf "0x%02X 0x%04X\n", from_code, from_unicode;
	91	          else
	92	            printf "0x%04X 0x%04X\n", from_code, from_unicode;
	93	        }
	94	      else if (from_code < to_code)
	95	        {
	96	          if (to_code < 256)
	97	            printf "0x%02X-0x%02X 0x%04X\n", from_code, to_code, from_unicode;
	98	          else
	99	            printf "0x%04X-0x%04X 0x%04X\n", from_code, to_code, from_unicode;
	100	        }
	101	      from_code = to_code = code;
	102	      from_unicode = to_unicode = unicode;
	103	    }
	104	  else
	105	    { to_code++; to_unicode++; }   # entry extends the pending run by one
	106	}
	107
	108	END {
	109	  # Print the run still pending after the last line.  With no data lines
	110	  # from_code (0) > to_code (-1), so nothing is printed.
	111	  if (from_code == to_code)
	112	    {
	113	      if (to_code < 256) printf "0x%02X 0x%04X\n", from_code, from_unicode;
	114	      else printf "0x%04X 0x%04X\n", from_code, from_unicode;
	115	    }
	116	  else if (from_code < to_code)
	117	    {
	118	      if (to_code < 256)
	119	        printf "0x%02X-0x%02X 0x%04X\n", from_code, to_code, from_unicode;
	120	      else
	121	        printf "0x%04X-0x%04X 0x%04X\n", from_code, to_code, from_unicode;
	122	    }
	123	}