You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
84 lines
1.8 KiB
84 lines
1.8 KiB
# Copyright (C) 2016 and later: Unicode, Inc. and others.
|
|
# License & terms of use: http://www.unicode.org/copyright.html
|
|
# Copyright (C) 2010, International Business Machines
|
|
# Corporation and others. All Rights Reserved.
|
|
#
|
|
# file name: testnorm.txt
|
|
# encoding: US-ASCII
|
|
# tab size: 8 (not used)
|
|
# indentation:4
|
|
#
|
|
# created on: 2010feb15
|
|
# created by: Markus W. Scherer
|
|
#
|
|
# Normalization test data, for improving code coverage.
|
|
|
|
# Selection of Canonical_Combining_Class (ccc) values
|
|
0300..0314:230
|
|
0315:232
|
|
0316..0319:220
|
|
031A:232
|
|
031B:216
|
|
031C..0320:220
|
|
0321..0322:202
|
|
0323..0326:220
|
|
0327..0328:202
|
|
0329..0333:220
|
|
0334..0338:1
|
|
0339..033C:220
|
|
033D..0344:230
|
|
0345:240
|
|
0346:230
|
|
0347..0349:220
|
|
034A..034C:230
|
|
034D..034E:220
|
|
0350..0352:230
|
|
0353..0356:220
|
|
0357:230
|
|
0358:232
|
|
0359..035A:220
|
|
035B:230
|
|
035C:233
|
|
035D..035E:234
|
|
035F:233
|
|
0360..0361:234
|
|
0362:233
|
|
0363..036F:230
|
|
# ICU 63 normalization with UCPTrie requires inert surrogate code points.
|
|
# D802:2 # surrogates with non-zero combining classes
|
|
# D803:3
|
|
# D804:4
|
|
110B9:9
|
|
110BA:7
|
|
|
|
# Some interesting mappings
|
|
00C0=0041 0300
|
|
00C1=0041 0301
|
|
00C2=0041 0302
|
|
00C3=0041 0303
|
|
00C4=0041 0308
|
|
00C5=0041 030A
|
|
00C7=0043 0327
|
|
# ICU 63 normalization with UCPTrie requires inert surrogate code points.
|
|
# D800>D7FF # surrogates with mappings, and mappings to empty strings
|
|
# D801>
|
|
# DFFE>
|
|
# DFFF>FFFF
|
|
E000>
|
|
E001=61 338 # composition with trail<=33FF and composite>7FFF
|
|
E002=E001 308 # recursive mapping needs reordering
|
|
E003>62 307 327 337 # mapping needs reordering
|
|
E011=E010 F0011 # composition of BMP+supplementary, and F0011 is maybe & combines-fwd
|
|
E111>1101 # mapping ends in Jamo L
|
|
E112>1102 62 # mapping starts with Jamo L
|
|
FFF3>FFF4
|
|
FFF4>FFF5
|
|
FFF5>FFF7
|
|
FFF7>10037
|
|
10036>FFF6
|
|
10077>10037
|
|
1109A=11099 110BA
|
|
1109C=1109B 110BA
|
|
110AB=110A5 110BA
|
|
F0010=F0011 E012 # composition of supplementary+BMP
|