Source-Changes-HG archive
[Date Prev][Date Next][Thread Prev][Thread Next][Date Index][Thread Index][Old Index]
[src/trunk]: src/share/locale/ctype: Update Unicode tables.
details: https://anonhg.NetBSD.org/src/rev/79ac991e5591
branches: trunk
changeset: 372694:79ac991e5591
user: wiz <wiz%NetBSD.org@localhost>
date: Tue Dec 20 23:06:08 2022 +0000
description:
Update Unicode tables.
This version of the file and the generator script both come from
OpenBSD. The script was written by Andrew Fresh.
The file covers Unicode 13.0.0 and is based on the data files
distributed with Perl 5.32.1.
diffstat:
share/locale/ctype/en_US.UTF-8.src | 5407 +++++++++++++++++++++++++++++----
share/locale/ctype/gen_ctype_utf8.pl | 447 ++
2 files changed, 5129 insertions(+), 725 deletions(-)
diffs (truncated from 6794 to 300 lines):
diff -r f700d5207534 -r 79ac991e5591 share/locale/ctype/en_US.UTF-8.src
--- a/share/locale/ctype/en_US.UTF-8.src Tue Dec 20 17:51:54 2022 +0000
+++ b/share/locale/ctype/en_US.UTF-8.src Tue Dec 20 23:06:08 2022 +0000
@@ -1,44 +1,47 @@
-/* $NetBSD: en_US.UTF-8.src,v 1.7 2022/10/17 11:20:29 rin Exp $ */
-/* $FreeBSD: /repoman/r/ncvs/src/share/mklocale/UTF-8.src,v 1.1 2004/03/27 08:14:14 tjr Exp $ */
-
-/*
- * UTF-8 locale table for Rune Locale
+/* $NetBSD: en_US.UTF-8.src,v 1.8 2022/12/20 23:06:08 wiz Exp $ */
+/* $OpenBSD: en_US.UTF-8.src,v 1.12 2021/05/16 22:48:05 afresh1 Exp $ */
+
+/*
+ * COPYRIGHT AND PERMISSION NOTICE
*
- * Generated by Hye-Shik Chang <perky%FreeBSD.org@localhost>
- */
-
-/*
- * UCD(Unicode Character Database) Terms of Use
- *
- * Disclaimer
+ * Copyright (c) 1991-2021 Unicode, Inc. All rights reserved.
+ * Distributed under the Terms of Use in
+ * https://www.unicode.org/copyright.html.
*
- * The Unicode Character Database is provided as is by Unicode, Inc. No claims
- * are made as to fitness for any particular purpose. No warranties of any kind
- * are expressed or implied. The recipient agrees to determine applicability of
- * information provided. If this file has been purchased on magnetic or optical
- * media from Unicode, Inc., the sole remedy for any claim will be exchange of
- * defective media within 90 days of receipt.
- *
- * This disclaimer is applicable for all other data files accompanying the
- * Unicode Character Database, some of which have been compiled by the Unicode
- * Consortium, and some of which have been supplied by other sources.
+ * Permission is hereby granted, free of charge, to any person obtaining
+ * a copy of the Unicode data files and any associated documentation
+ * (the "Data Files") or Unicode software and any associated documentation
+ * (the "Software") to deal in the Data Files or Software
+ * without restriction, including without limitation the rights to use,
+ * copy, modify, merge, publish, distribute, and/or sell copies of
+ * the Data Files or Software, and to permit persons to whom the Data Files
+ * or Software are furnished to do so, provided that either
+ * (a) this copyright and permission notice appear with all copies
+ * of the Data Files or Software, or
+ * (b) this copyright and permission notice appear in associated
+ * Documentation.
*
- * Limitations on Rights to Redistribute This Data
+ * THE DATA FILES AND SOFTWARE ARE PROVIDED "AS IS", WITHOUT WARRANTY OF
+ * ANY KIND, EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE
+ * WARRANTIES OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
+ * NONINFRINGEMENT OF THIRD PARTY RIGHTS.
+ * IN NO EVENT SHALL THE COPYRIGHT HOLDER OR HOLDERS INCLUDED IN THIS
+ * NOTICE BE LIABLE FOR ANY CLAIM, OR ANY SPECIAL INDIRECT OR CONSEQUENTIAL
+ * DAMAGES, OR ANY DAMAGES WHATSOEVER RESULTING FROM LOSS OF USE,
+ * DATA OR PROFITS, WHETHER IN AN ACTION OF CONTRACT, NEGLIGENCE OR OTHER
+ * TORTIOUS ACTION, ARISING OUT OF OR IN CONNECTION WITH THE USE OR
+ * PERFORMANCE OF THE DATA FILES OR SOFTWARE.
*
- * Recipient is granted the right to make copies in any form for internal
- * distribution and to freely use the information supplied in the creation of
- * products supporting the UnicodeTM Standard. The files in the Unicode
- * Character Database can be redistributed to third parties or other
- * organizations (whether for profit or not) as long as this notice and the
- * disclaimer notice are retained. Information can be extracted from these
- * files and used in documentation or programs, as long as there is an
- * accompanying notice indicating the source.
- *
+ * Except as contained in this notice, the name of a copyright holder
+ * shall not be used in advertising or otherwise to promote the sale,
+ * use or other dealings in these Data Files or Software without prior
+ * written authorization of the copyright holder.
*/
ENCODING "UTF8"
VARIABLE CODESET=UTF-8
+/* Unicode Version 13.0.0 */
/*
* U+0000 - U+007F : Basic Latin
@@ -53,15 +56,15 @@
SPACE 0x0009 - 0x000d 0x0020
UPPER 'A' - 'Z'
XDIGIT '0' - '9' 'A' - 'F' 'a' - 'f'
-BLANK 0x0009 0x000b 0x0020
+BLANK 0x0009 0x000b - 0x000c 0x0020
PRINT 0x0020 - 0x007e
SWIDTH1 0x0020 - 0x007e
MAPUPPER < 'a' - 'z' : 'A' >
MAPLOWER < 'A' - 'Z' : 'a' >
TODIGIT < '0' - '9' : 0x0000 >
-TODIGIT < 'A' - 'F' : 10 > < 'a' - 'f' : 10 >
-
+TODIGIT < 'A' - 'F' : 10 >
+TODIGIT < 'a' - 'f' : 10 >
/*
* U+0080 - U+00FF : Latin-1 Supplement
@@ -69,17 +72,18 @@
ALPHA 0x00aa 0x00b5 0x00ba 0x00c0 - 0x00d6 0x00d8 - 0x00f6
ALPHA 0x00f8 - 0x00ff
-CONTROL 0x0080 - 0x009f
+CONTROL 0x0080 - 0x009f 0x00ad
GRAPH 0x00a1 - 0x00ff
-LOWER 0x00aa 0x00b5 0x00ba 0x00df - 0x00f6 0x00f8 - 0x00ff
-PUNCT 0x00a1 - 0x00a9 0x00ab - 0x00b1 0x00b4 0x00b6 - 0x00b8
-PUNCT 0x00bb 0x00bf 0x00d7 0x00f7
+LOWER 0x00b5 0x00df - 0x00f6 0x00f8 - 0x00ff
+PUNCT 0x00a1 - 0x00a9 0x00ab - 0x00ac 0x00ae - 0x00b1 0x00b4
+PUNCT 0x00b6 - 0x00b8 0x00bb 0x00bf 0x00d7 0x00f7
SPACE 0x0085 0x00a0
UPPER 0x00c0 - 0x00d6 0x00d8 - 0x00de
BLANK 0x00a0
PRINT 0x00a0 - 0x00ff
-SPECIAL 0x00b2 0x00b3 0x00b9 0x00bc - 0x00be
-SWIDTH1 0x00a0 - 0x00ff
+SPECIAL 0x00b2 - 0x00b3 0x00b9 0x00bc - 0x00be
+SWIDTH0 0x00ad
+SWIDTH1 0x00a0 - 0x00ac 0x00ae - 0x00ff
MAPUPPER < 0x00b5 0x039c >
MAPUPPER < 0x00e0 - 0x00f6 : 0x00c0 >
@@ -87,9 +91,8 @@
MAPUPPER < 0x00ff 0x0178 >
MAPLOWER < 0x00c0 - 0x00d6 : 0x00e0 >
MAPLOWER < 0x00d8 - 0x00de : 0x00f8 >
-TODIGIT < 0x00b2 - 0x00b3 : 0x0002 >
-TODIGIT < 0x00b9 0x0001 >
-
+TODIGIT < 0x00b2 - 0x00b3 : 2 >
+TODIGIT < 0x00b9 1 >
/*
* U+0100 - U+017F : Latin Extended-A
@@ -97,24 +100,22 @@
ALPHA 0x0100 - 0x017f
GRAPH 0x0100 - 0x017f
-LOWER 0x0101 0x0103 0x0105 0x0107 0x0109 0x010b 0x010d
-LOWER 0x010f 0x0111 0x0113 0x0115 0x0117 0x0119 0x011b
-LOWER 0x011d 0x011f 0x0121 0x0123 0x0125 0x0127 0x0129
-LOWER 0x012b 0x012d 0x012f 0x0131 0x0133 0x0135 0x0137 0x0138
-LOWER 0x013a 0x013c 0x013e 0x0140 0x0142 0x0144 0x0146
-LOWER 0x0148 0x0149 0x014b 0x014d 0x014f 0x0151 0x0153
-LOWER 0x0155 0x0157 0x0159 0x015b 0x015d 0x015f 0x0161
-LOWER 0x0163 0x0165 0x0167 0x0169 0x016b 0x016d 0x016f
-LOWER 0x0171 0x0173 0x0175 0x0177 0x017a 0x017c 0x017e 0x017f
-UPPER 0x0100 0x0102 0x0104 0x0106 0x0108 0x010a 0x010c
-UPPER 0x010e 0x0110 0x0112 0x0114 0x0116 0x0118 0x011a
-UPPER 0x011c 0x011e 0x0120 0x0122 0x0124 0x0126 0x0128
-UPPER 0x012a 0x012c 0x012e 0x0130 0x0132 0x0134 0x0136
-UPPER 0x0139 0x013b 0x013d 0x013f 0x0141 0x0143 0x0145
-UPPER 0x0147 0x014a 0x014c 0x014e 0x0150 0x0152 0x0154
-UPPER 0x0156 0x0158 0x015a 0x015c 0x015e 0x0160 0x0162
-UPPER 0x0164 0x0166 0x0168 0x016a 0x016c 0x016e 0x0170
-UPPER 0x0172 0x0174 0x0176 0x0178 0x0179 0x017b 0x017d
+LOWER 0x0101 0x0103 0x0105 0x0107 0x0109 0x010b 0x010d 0x010f 0x0111
+LOWER 0x0113 0x0115 0x0117 0x0119 0x011b 0x011d 0x011f 0x0121 0x0123
+LOWER 0x0125 0x0127 0x0129 0x012b 0x012d 0x012f 0x0131 0x0133 0x0135
+LOWER 0x0137 - 0x0138 0x013a 0x013c 0x013e 0x0140 0x0142 0x0144
+LOWER 0x0146 0x0148 - 0x0149 0x014b 0x014d 0x014f 0x0151 0x0153
+LOWER 0x0155 0x0157 0x0159 0x015b 0x015d 0x015f 0x0161 0x0163 0x0165
+LOWER 0x0167 0x0169 0x016b 0x016d 0x016f 0x0171 0x0173 0x0175 0x0177
+LOWER 0x017a 0x017c 0x017e - 0x017f
+UPPER 0x0100 0x0102 0x0104 0x0106 0x0108 0x010a 0x010c 0x010e 0x0110
+UPPER 0x0112 0x0114 0x0116 0x0118 0x011a 0x011c 0x011e 0x0120 0x0122
+UPPER 0x0124 0x0126 0x0128 0x012a 0x012c 0x012e 0x0130 0x0132 0x0134
+UPPER 0x0136 0x0139 0x013b 0x013d 0x013f 0x0141 0x0143 0x0145 0x0147
+UPPER 0x014a 0x014c 0x014e 0x0150 0x0152 0x0154 0x0156 0x0158 0x015a
+UPPER 0x015c 0x015e 0x0160 0x0162 0x0164 0x0166 0x0168 0x016a 0x016c
+UPPER 0x016e 0x0170 0x0172 0x0174 0x0176 0x0178 - 0x0179 0x017b
+UPPER 0x017d
PRINT 0x0100 - 0x017f
SWIDTH1 0x0100 - 0x017f
@@ -245,40 +246,39 @@
MAPLOWER < 0x017b 0x017c >
MAPLOWER < 0x017d 0x017e >
-
/*
* U+0180 - U+024F : Latin Extended-B
*/
-ALPHA 0x0180 - 0x01ba 0x01bc - 0x01bf 0x01c4 - 0x0220 0x0222 - 0x0233
-GRAPH 0x0180 - 0x0220 0x0222 - 0x0233
-LOWER 0x0180 0x0183 0x0185 0x0188 0x018c 0x018d 0x0192
-LOWER 0x0195 0x0199 - 0x019b 0x019e 0x01a1 0x01a3 0x01a5
-LOWER 0x01a8 0x01aa 0x01ab 0x01ad 0x01b0 0x01b4 0x01b6
-LOWER 0x01b9 0x01ba 0x01bd - 0x01bf 0x01c6 0x01c9 0x01cc
-LOWER 0x01ce 0x01d0 0x01d2 0x01d4 0x01d6 0x01d8 0x01da
-LOWER 0x01dc 0x01dd 0x01df 0x01e1 0x01e3 0x01e5 0x01e7
-LOWER 0x01e9 0x01eb 0x01ed 0x01ef 0x01f0 0x01f3 0x01f5
-LOWER 0x01f9 0x01fb 0x01fd 0x01ff 0x0201 0x0203 0x0205
-LOWER 0x0207 0x0209 0x020b 0x020d 0x020f 0x0211 0x0213
-LOWER 0x0215 0x0217 0x0219 0x021b 0x021d 0x021f 0x0223
-LOWER 0x0225 0x0227 0x0229 0x022b 0x022d 0x022f 0x0231
-LOWER 0x0233
-UPPER 0x0181 0x0182 0x0184 0x0186 0x0187 0x0189 - 0x018b
-UPPER 0x018e - 0x0191 0x0193 0x0194 0x0196 - 0x0198 0x019c 0x019d
-UPPER 0x019f 0x01a0 0x01a2 0x01a4 0x01a6 0x01a7 0x01a9
-UPPER 0x01ac 0x01ae 0x01af 0x01b1 - 0x01b3 0x01b5 0x01b7 0x01b8
-UPPER 0x01bc 0x01c4 0x01c7 0x01ca 0x01cd 0x01cf 0x01d1
-UPPER 0x01d3 0x01d5 0x01d7 0x01d9 0x01db 0x01de 0x01e0
-UPPER 0x01e2 0x01e4 0x01e6 0x01e8 0x01ea 0x01ec 0x01ee
-UPPER 0x01f1 0x01f4 0x01f6 - 0x01f8 0x01fa 0x01fc 0x01fe
-UPPER 0x0200 0x0202 0x0204 0x0206 0x0208 0x020a 0x020c
-UPPER 0x020e 0x0210 0x0212 0x0214 0x0216 0x0218 0x021a
-UPPER 0x021c 0x021e 0x0220 0x0222 0x0224 0x0226 0x0228
-UPPER 0x022a 0x022c 0x022e 0x0230 0x0232
-PRINT 0x0180 - 0x0220 0x0222 - 0x0233
-SWIDTH1 0x0180 - 0x0220 0x0222 - 0x0233
-
+ALPHA 0x0180 - 0x024f
+GRAPH 0x0180 - 0x024f
+LOWER 0x0180 0x0183 0x0185 0x0188 0x018c - 0x018d 0x0192 0x0195
+LOWER 0x0199 - 0x019b 0x019e 0x01a1 0x01a3 0x01a5 0x01a8
+LOWER 0x01aa - 0x01ab 0x01ad 0x01b0 0x01b4 0x01b6 0x01b9 - 0x01ba
+LOWER 0x01bd - 0x01bf 0x01c6 0x01c9 0x01cc 0x01ce 0x01d0 0x01d2
+LOWER 0x01d4 0x01d6 0x01d8 0x01da 0x01dc - 0x01dd 0x01df 0x01e1
+LOWER 0x01e3 0x01e5 0x01e7 0x01e9 0x01eb 0x01ed 0x01ef - 0x01f0
+LOWER 0x01f3 0x01f5 0x01f9 0x01fb 0x01fd 0x01ff 0x0201 0x0203 0x0205
+LOWER 0x0207 0x0209 0x020b 0x020d 0x020f 0x0211 0x0213 0x0215 0x0217
+LOWER 0x0219 0x021b 0x021d 0x021f 0x0221 0x0223 0x0225 0x0227 0x0229
+LOWER 0x022b 0x022d 0x022f 0x0231 0x0233 - 0x0239 0x023c
+LOWER 0x023f - 0x0240 0x0242 0x0247 0x0249 0x024b 0x024d 0x024f
+UPPER 0x0181 - 0x0182 0x0184 0x0186 - 0x0187 0x0189 - 0x018b
+UPPER 0x018e - 0x0191 0x0193 - 0x0194 0x0196 - 0x0198 0x019c - 0x019d
+UPPER 0x019f - 0x01a0 0x01a2 0x01a4 0x01a6 - 0x01a7 0x01a9 0x01ac
+UPPER 0x01ae - 0x01af 0x01b1 - 0x01b3 0x01b5 0x01b7 - 0x01b8 0x01bc
+UPPER 0x01c4 0x01c7 0x01ca 0x01cd 0x01cf 0x01d1 0x01d3 0x01d5 0x01d7
+UPPER 0x01d9 0x01db 0x01de 0x01e0 0x01e2 0x01e4 0x01e6 0x01e8 0x01ea
+UPPER 0x01ec 0x01ee 0x01f1 0x01f4 0x01f6 - 0x01f8 0x01fa 0x01fc
+UPPER 0x01fe 0x0200 0x0202 0x0204 0x0206 0x0208 0x020a 0x020c 0x020e
+UPPER 0x0210 0x0212 0x0214 0x0216 0x0218 0x021a 0x021c 0x021e 0x0220
+UPPER 0x0222 0x0224 0x0226 0x0228 0x022a 0x022c 0x022e 0x0230 0x0232
+UPPER 0x023a - 0x023b 0x023d - 0x023e 0x0241 0x0243 - 0x0246 0x0248
+UPPER 0x024a 0x024c 0x024e
+PRINT 0x0180 - 0x024f
+SWIDTH1 0x0180 - 0x024f
+
+MAPUPPER < 0x0180 0x0243 >
MAPUPPER < 0x0183 0x0182 >
MAPUPPER < 0x0185 0x0184 >
MAPUPPER < 0x0188 0x0187 >
@@ -286,6 +286,7 @@
MAPUPPER < 0x0192 0x0191 >
MAPUPPER < 0x0195 0x01f6 >
MAPUPPER < 0x0199 0x0198 >
+MAPUPPER < 0x019a 0x023d >
MAPUPPER < 0x019e 0x0220 >
MAPUPPER < 0x01a1 0x01a0 >
MAPUPPER < 0x01a3 0x01a2 >
@@ -298,11 +299,8 @@
MAPUPPER < 0x01b9 0x01b8 >
MAPUPPER < 0x01bd 0x01bc >
MAPUPPER < 0x01bf 0x01f7 >
-MAPUPPER < 0x01c5 0x01c4 >
MAPUPPER < 0x01c6 0x01c4 >
-MAPUPPER < 0x01c8 0x01c7 >
MAPUPPER < 0x01c9 0x01c7 >
-MAPUPPER < 0x01cb 0x01ca >
MAPUPPER < 0x01cc 0x01ca >
MAPUPPER < 0x01ce 0x01cd >
MAPUPPER < 0x01d0 0x01cf >
@@ -322,7 +320,6 @@
MAPUPPER < 0x01eb 0x01ea >
MAPUPPER < 0x01ed 0x01ec >
MAPUPPER < 0x01ef 0x01ee >
-MAPUPPER < 0x01f2 0x01f1 >
MAPUPPER < 0x01f3 0x01f1 >
MAPUPPER < 0x01f5 0x01f4 >
MAPUPPER < 0x01f9 0x01f8 >
@@ -354,6 +351,14 @@
MAPUPPER < 0x022f 0x022e >
MAPUPPER < 0x0231 0x0230 >
MAPUPPER < 0x0233 0x0232 >
+MAPUPPER < 0x023c 0x023b >
+MAPUPPER < 0x023f - 0x0240 : 0x2c7e >
+MAPUPPER < 0x0242 0x0241 >
+MAPUPPER < 0x0247 0x0246 >
+MAPUPPER < 0x0249 0x0248 >
+MAPUPPER < 0x024b 0x024a >
+MAPUPPER < 0x024d 0x024c >
+MAPUPPER < 0x024f 0x024e >
MAPLOWER < 0x0181 0x0253 >
MAPLOWER < 0x0182 0x0183 >
MAPLOWER < 0x0184 0x0185 >
@@ -389,11 +394,8 @@
MAPLOWER < 0x01b8 0x01b9 >
MAPLOWER < 0x01bc 0x01bd >
MAPLOWER < 0x01c4 0x01c6 >
-MAPLOWER < 0x01c5 0x01c6 >
MAPLOWER < 0x01c7 0x01c9 >
-MAPLOWER < 0x01c8 0x01c9 >
Home |
Main Index |
Thread Index |
Old Index