1# Copyright (C) 2016 and later: Unicode, Inc. and others. 2# License & terms of use: http://www.unicode.org/copyright.html 3# Copyright (C) 2010, International Business Machines 4# Corporation and others. All Rights Reserved. 5# 6# file name: testnorm.txt 7# encoding: US-ASCII 8# tab size: 8 (not used) 9# indentation:4 10# 11# created on: 2010feb15 12# created by: Markus W. Scherer 13# 14# Normalization test data, for improving code coverage. 15 16# Selection of Canonical_Combining_Class (ccc) values 170300..0314:230 180315:232 190316..0319:220 20031A:232 21031B:216 22031C..0320:220 230321..0322:202 240323..0326:220 250327..0328:202 260329..0333:220 270334..0338:1 280339..033C:220 29033D..0344:230 300345:240 310346:230 320347..0349:220 33034A..034C:230 34034D..034E:220 350350..0352:230 360353..0356:220 370357:230 380358:232 390359..035A:220 40035B:230 41035C:233 42035D..035E:234 43035F:233 440360..0361:234 450362:233 460363..036F:230 47D802:2 # surrogates with non-zero combining classes 48D803:3 49D804:4 50110B9:9 51110BA:7 52 53# Some interesting mappings 5400C0=0041 0300 5500C1=0041 0301 5600C2=0041 0302 5700C3=0041 0303 5800C4=0041 0308 5900C5=0041 030A 6000C7=0043 0327 61D800>D7FF # surrogates with mappings, and mappings to empty strings 62D801> 63DFFE> 64DFFF>FFFF 65E000> 66E001=61 338 # composition with trail<=33FF and composite>7FFF 67E002=E001 308 # recursive mapping needs reordering 68E003>62 307 327 337 # mapping needs reordering 69E011=E010 F0011 # composition of BMP+supplementary, and F0011 is maybe & combines-fwd 70E111>1101 # mapping ends in Jamo L 71E112>1102 62 # mapping starts with Jamo L 72FFF3>FFF4 73FFF4>FFF5 74FFF5>FFF7 75FFF7>10037 7610036>FFF6 7710077>10037 781109A=11099 110BA 791109C=1109B 110BA 80110AB=110A5 110BA 81F0010=F0011 E012 # composition of supplementary+BMP 82