scuffed-code/icu4c/source/test/testdata/testnorm.txt
2016-06-15 18:58:17 +00:00

82 lines
1.7 KiB
Plaintext

# Copyright (C) 2016 and later: Unicode, Inc. and others.
# License & terms of use: http://www.unicode.org/copyright.html
# Copyright (C) 2010, International Business Machines
# Corporation and others. All Rights Reserved.
#
# file name: testnorm.txt
# encoding: US-ASCII
# tab size: 8 (not used)
# indentation:4
#
# created on: 2010feb15
# created by: Markus W. Scherer
#
# Normalization test data, for improving code coverage.
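# Selection of Canonical_Combining_Class (ccc) values.
# Each entry is "code point:ccc" or "first..last:ccc", with hexadecimal
# code points and a decimal ccc value.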
0300..0314:230
0315:232
0316..0319:220
031A:232
031B:216
031C..0320:220
0321..0322:202
0323..0326:220
0327..0328:202
0329..0333:220
0334..0338:1
0339..033C:220
033D..0344:230
0345:240
0346:230
0347..0349:220
034A..034C:230
034D..034E:220
0350..0352:230
0353..0356:220
0357:230
0358:232
0359..035A:220
035B:230
035C:233
035D..035E:234
035F:233
0360..0361:234
0362:233
0363..036F:230
D802:2 # surrogates with non-zero combining classes
D803:3
D804:4
110B9:9
110BA:7
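# Some interesting mappings.
# "=" defines a two-way (round-trip) mapping, which is also used for composition;
# ">" defines a one-way mapping. An empty right-hand side maps to the empty string.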
00C0=0041 0300
00C1=0041 0301
00C2=0041 0302
00C3=0041 0303
00C4=0041 0308
00C5=0041 030A
00C7=0043 0327
D800>D7FF # surrogates with mappings, and mappings to empty strings
D801>
DFFE>
DFFF>FFFF
E000>
E001=61 338 # composition with trail<=33FF and composite>7FFF
E002=E001 308 # recursive mapping needs reordering
E003>62 307 327 337 # mapping needs reordering
E011=E010 F0011 # composition of BMP+supplementary; F0011 both combines backward here ("maybe") and combines forward (see F0010)
E111>1101 # mapping ends in Jamo L
E112>1102 62 # mapping starts with Jamo L
FFF3>FFF4
FFF4>FFF5
FFF5>FFF7
FFF7>10037
10036>FFF6
10077>10037
1109A=11099 110BA
1109C=1109B 110BA
110AB=110A5 110BA
F0010=F0011 E012 # composition of supplementary+BMP