// © 2019 and later: Unicode, Inc. and others. // License & terms of use: http://www.unicode.org/copyright.html #include #include #include #include #include #include #include "fuzzer_utils.h" #include "unicode/unistr.h" // Taken from third_party/icu/source/data/mappings/convrtrs.txt file. static const std::array kConverters = { { "UTF-8", "utf-16be", "utf-16le", "UTF-32", "UTF-32BE", "UTF-32LE", "ibm866-html", "iso-8859-2-html", "iso-8859-3-html", "iso-8859-4-html", "iso-8859-5-html", "iso-8859-6-html", "iso-8859-7-html", "iso-8859-8-html", "ISO-8859-8-I", "iso-8859-10-html", "iso-8859-13-html", "iso-8859-14-html", "iso-8859-15-html", "iso-8859-16-html", "koi8-r-html", "koi8-u-html", "macintosh-html", "windows-874-html", "windows-1250-html", "windows-1251-html", "windows-1252-html", "windows-1253-html", "windows-1254-html", "windows-1255-html", "windows-1256-html", "windows-1257-html", "windows-1258-html", "x-mac-cyrillic-html", "windows-936-2000", "gb18030", "big5-html", "euc-jp-html", "ISO_2022,locale=ja,version=0", "shift_jis-html", "euc-kr-html", "ISO-2022-KR", "ISO-2022-CN", "ISO-2022-CN-EXT", "HZ-GB-2312" } }; IcuEnvironment* env = new IcuEnvironment(); extern "C" int LLVMFuzzerTestOneInput(const uint8_t* data, size_t size) { if (size < 1) { return 0; } // First byte is used for random converter selection. uint8_t rnd = *data; data++; size--; std::unique_ptr fuzzbuff(new char[size]); std::memcpy(fuzzbuff.get(), data, size); icu::UnicodeString str(fuzzbuff.get(), size, kConverters[rnd % kConverters.size()]); return 0; }