1//******************************************************************************* 2//* 3//* Copyright (C) 2002-2007, International Business Machines 4//* Corporation and others. All Rights Reserved. 5//* 6//******************************************************************************* 7 8casing:table(nofallback) { 9 Info { 10 Description { "This is test data file for string casing." } 11 12 LongDescription { 13 "each item is an array with\n" 14 "input string, result string, locale ID[, break iterator]\n" 15 "the break iterator (only for titlecasing) is specified as an int, same as in UBreakIteratorType:\n" 16 "0=UBRK_CHARACTER 1=UBRK_WORD 2=UBRK_LINE 3=UBRK_SENTENCE 4=UBRK_TITLE -1=default (NULL=words) -2=no breaks (.*)\n" 17 "options: T=U_FOLD_CASE_EXCLUDE_SPECIAL_I L=U_TITLECASE_NO_LOWERCASE A=U_TITLECASE_NO_BREAK_ADJUSTMENT\n" 18 } 19 } 20 TestData { 21 lowercasing { 22 Headers { "Input", "Output", "Locale" } 23 Cases { 24 { " tHe QUIcK bRoWn", " the quick brown", "" }, 25 { "aBIΣßΣ/", "abiσßς/", "" }, 26 { "aBIΣßΣ/", "abıσßς/", "tur" } // tur: 3-letter code for Turkish 27 } 28 } 29 uppercasing { 30 Headers { "Input", "Output", "Locale" } 31 Cases { 32 { " tHe QUIcK bRoWn", " THE QUICK BROWN", "" }, 33 { "aBiσßς/ffi", "ABIΣSSΣ/FFI", "" }, 34 { "aBiσßς/ffi", "ABİΣSSΣ/FFI", "az" } // az same casing as tr 35 } 36 } 37 titlecasing { 38 Headers { "Input", "Output", "Locale", "Type", "Options" } 39 Cases { 40 { "ʻaMeLikA huI Pū ʻʻʻiA", "ʻAmelika Hui Pū ʻʻʻIa", "", "-1", "" }, // titlecase first _cased_ letter, j4933 41 { " tHe QUIcK bRoWn", " The Quick Brown", "", "4", "" }, 42 { "DŽDždžLJLjljNJNjnj", "DžDžDžLjLjLjNjNjNj", "", "0", "" }, // UBRK_CHARACTER 43 { "ljubav ljubav", "Ljubav Ljubav", "", "-1", "" }, // Lj vs. L+j 44 { "'oH dOn'T tItLeCaSe AfTeR lEtTeR+'", "'Oh Don't Titlecase After Letter+'", "", "-1", "" }, 45 46 { "a ʻCaT. A ʻdOg! ʻeTc.", "A ʻCat. A ʻDog! ʻEtc.", "", "-1", "" }, // default 47 { "a ʻCaT. A ʻdOg! ʻeTc.", "A ʻcat. A ʻdog! ʻetc.", "", "-1", "A" }, // U_TITLECASE_NO_BREAK_ADJUSTMENT 48 { "a ʻCaT. A ʻdOg! ʻeTc.", "A ʻCaT. A ʻdOg! ʻETc.", "", "3", "L" }, // UBRK_SENTENCE and U_TITLECASE_NO_LOWERCASE 49 50 { "ʻcAt! ʻeTc.", "ʻCat! ʻetc.", "", "-2", "" }, // -2=Trivial break iterator 51 { "ʻcAt! ʻeTc.", "ʻcat! ʻetc.", "", "-2", "A" }, // U_TITLECASE_NO_BREAK_ADJUSTMENT 52 { "ʻcAt! ʻeTc.", "ʻCAt! ʻeTc.", "", "-2", "L" }, // U_TITLECASE_NO_LOWERCASE 53 { "ʻcAt! ʻeTc.", "ʻcAt! ʻeTc.", "", "-2", "AL" } // Both options 54 } 55 } 56 casefolding { 57 Headers { "Input", "Output", "Options" } 58 Cases { 59 { "aBİIıϐßffi", "abi̇iıβssffi", "" }, 60 { "aBİIıϐßffi", "abiııβssffi", "T" } // U_FOLD_CASE_EXCLUDE_SPECIAL_I 61 } 62 } 63 } 64} 65