Module Name: src Committed By: rin Date: Mon Oct 17 11:20:30 UTC 2022
Modified Files: src/share/locale/ctype: en_US.UTF-8.src Log Message: Add "Emoji & Pictographs" character definitions from Unicode 15.0.0 (previously 10.0.0): http://www.unicode.org/charts/ They are classified as PUNCT, which has been used for characters that are neither blank, alphabetic, nor digits. Glyph widths are taken from "East Asian Width": https://www.unicode.org/Public/15.0.0/ucd/EastAsianWidth.txt Characters with width "F" or "W" are classified as SWIDTH2, and all others as SWIDTH1, as usual. See also: https://www.unicode.org/reports/tr11/ XXX It would be really nice if someone could check and update characters in categories other than Emoji... To generate a diff of this commit: cvs rdiff -u -r1.6 -r1.7 src/share/locale/ctype/en_US.UTF-8.src Please note that diffs are not public domain; they are subject to the copyright notices on the relevant files.
Modified files: Index: src/share/locale/ctype/en_US.UTF-8.src diff -u src/share/locale/ctype/en_US.UTF-8.src:1.6 src/share/locale/ctype/en_US.UTF-8.src:1.7 --- src/share/locale/ctype/en_US.UTF-8.src:1.6 Sun Jun 3 07:54:51 2018 +++ src/share/locale/ctype/en_US.UTF-8.src Mon Oct 17 11:20:29 2022 @@ -1,4 +1,4 @@ -/* $NetBSD: en_US.UTF-8.src,v 1.6 2018/06/03 07:54:51 rin Exp $ */ +/* $NetBSD: en_US.UTF-8.src,v 1.7 2022/10/17 11:20:29 rin Exp $ */ /* $FreeBSD: /repoman/r/ncvs/src/share/mklocale/UTF-8.src,v 1.1 2004/03/27 08:14:14 tjr Exp $ */ /* @@ -1848,10 +1848,16 @@ SWIDTH1 0x25a0 - 0x25ff * U+2600 - U+26FF : Miscellaneous Symbols */ -GRAPH 0x2600 - 0x2613 0x2616 0x2617 0x2619 - 0x267d 0x2680 - 0x2689 -PUNCT 0x2600 - 0x2613 0x2616 0x2617 0x2619 - 0x267d 0x2680 - 0x2689 -PRINT 0x2600 - 0x2613 0x2616 0x2617 0x2619 - 0x267d 0x2680 - 0x2689 -SWIDTH1 0x2600 - 0x2613 0x2616 0x2617 0x2619 - 0x267d 0x2680 - 0x2689 +GRAPH 0x2600 - 0x26ff +PUNCT 0x2600 - 0x26ff +PRINT 0x2600 - 0x26ff +SWIDTH1 0x2600 - 0x2613 0x2616 - 0x2647 0x2654 - 0x267e 0x2680 - 0x2692 +SWIDTH1 0x2694 - 0x26a0 0x26a2 - 0x26a9 0x26ac - 0x26bc 0x26bf - 0x26c3 +SWIDTH1 0x26c6 - 0x26cd 0x26cf - 0x26d3 0x26d5 - 0x26e9 0x26eb - 0x26f1 +SWIDTH1 0x26f4 0x26f6 - 0x26f9 0x26fb - 0x26fc 0x26fe - 0x26ff +SWIDTH2 0x2614 - 0x2615 0x2648 - 0x2653 0x267f 0x2693 0x26a1 +SWIDTH2 0x26aa - 0x26ab 0x26bd - 0x26be 0x26c4 - 0x26c5 0x26ce +SWIDTH2 0x26d4 0x26ea 0x26f2 - 0x26f3 0x26f5 0x26fa 0x26fd /* @@ -2435,28 +2441,42 @@ SWIDTH1 0x1f650 - 0x1f67f * U+1F680 - U+1F6FF : Transport and Map Symbols */ -GRAPH 0x1f680 - 0x1f6d4 0x1f6e0 - 0x1f6ec 0x1f6f0 - 0x1f6f8 -PUNCT 0x1f680 - 0x1f6d4 0x1f6e0 - 0x1f6ec 0x1f6f0 - 0x1f6f8 -PRINT 0x1f680 - 0x1f6d4 0x1f6e0 - 0x1f6ec 0x1f6f0 - 0x1f6f8 +GRAPH 0x1f680 - 0x1f6d7 0x1f6dc - 0x1f6ec 0x1f6f0 - 0x1f6fc +PUNCT 0x1f680 - 0x1f6d7 0x1f6dc - 0x1f6ec 0x1f6f0 - 0x1f6fc +PRINT 0x1f680 - 0x1f6d7 0x1f6dc - 0x1f6ec 0x1f6f0 - 0x1f6fc SWIDTH1 0x1f6c6 - 0x1f6cb 0x1f6cd - 0x1f6cf 0x1f6d3 - 0x1f6d4 SWIDTH1 
0x1f6e0 - 0x1f6ea 0x1f6f0 - 0x1f6f3 -SWIDTH2 0x1f680 - 0x1f6c5 0x1f6cc 0x1f6d0 - 0x1f6d2 0x1f6eb - 0x1f6ec -SWIDTH2 0x1f6f4 - 0x1f6f8 +SWIDTH2 0x1f680 - 0x1f6c5 0x1f6cc 0x1f6d0 - 0x1f6d2 0x1f6d5 - 0x1f6d7 +SWIDTH2 0x1f6dc - 0x1f6df 0x1f6eb - 0x1f6ec 0x1f6f4 - 0x1f6fc /* * U+1F900 - U+1F9FF : Supplemental Symbols and Pictographs */ -GRAPH 0x1f900 - 0x1f90b 0x1f910 - 0x1f93e 0x1f940 - 0x1f94c -GRAPH 0x1f950 - 0x1f96b 0x1f980 - 0x1f997 0x1f9c0 0x1f9d0 - 0x1f9e6 -PUNCT 0x1f900 - 0x1f90b 0x1f910 - 0x1f93e 0x1f940 - 0x1f94c -PUNCT 0x1f950 - 0x1f96b 0x1f980 - 0x1f997 0x1f9c0 0x1f9d0 - 0x1f9e6 -PRINT 0x1f900 - 0x1f90b 0x1f910 - 0x1f93e 0x1f940 - 0x1f94c -PRINT 0x1f950 - 0x1f96b 0x1f980 - 0x1f997 0x1f9c0 0x1f9d0 - 0x1f9e6 -SWIDTH1 0x1f900 - 0x1f90b -SWIDTH2 0x1f910 - 0x1f93e 0x1f940 - 0x1f94c 0x1f950 - 0x1f96b -SWIDTH2 0x1f980 - 0x1f997 0x1f9c0 0x1f9d0 - 0x1f9e6 +GRAPH 0x1f900 - 0x1f9ff +PUNCT 0x1f900 - 0x1f9ff +PRINT 0x1f900 - 0x1f9ff +SWIDTH1 0x1f900 - 0x1f90b 0x1f93b 0x1f946 +SWIDTH2 0x1f90c - 0x1f93a 0x1f93c - 0x1f945 0x1f947 - 0x1f9ff + + +/* + * U+1FA70 - U+1FAFF : Symbols and Pictographs Extended-A + */ + +GRAPH 0x1fa70 - 0x1fa7c 0x1fa80 - 0x1fa88 0x1fa90 - 0x1fabd +GRAPH 0x1fabf - 0x1fac5 0x1face - 0x1fadb 0x1fae0 - 0x1fae8 +GRAPH 0x1faf0 - 0x1faf8 +PUNCT 0x1fa70 - 0x1fa7c 0x1fa80 - 0x1fa88 0x1fa90 - 0x1fabd +PUNCT 0x1fabf - 0x1fac5 0x1face - 0x1fadb 0x1fae0 - 0x1fae8 +PUNCT 0x1faf0 - 0x1faf8 +PRINT 0x1fa70 - 0x1fa7c 0x1fa80 - 0x1fa88 0x1fa90 - 0x1fabd +PRINT 0x1fabf - 0x1fac5 0x1face - 0x1fadb 0x1fae0 - 0x1fae8 +PRINT 0x1faf0 - 0x1faf8 +SWIDTH2 0x1fa70 - 0x1fa7c 0x1fa80 - 0x1fa88 0x1fa90 - 0x1fabd +SWIDTH2 0x1fabf - 0x1fac5 0x1face - 0x1fadb 0x1fae0 - 0x1fae8 +SWIDTH2 0x1faf0 - 0x1faf8 /*