1 // This file is part of ICU4X. For terms of use, please see the file
2 // called LICENSE at the top level of the ICU4X source tree
3 // (online at: https://github.com/unicode-org/icu4x/blob/main/LICENSE ).
4
5 use criterion::{black_box, criterion_group, criterion_main, Criterion};
6 use icu_casemap::CaseMapper;
7 use icu_locale_core::langid;
8 use icu_normalizer::DecomposingNormalizerBorrowed;
9
10 const TEST_STRING_EN: &str = "One of the key design principles of ICU4X is to make locale data small and portable, allowing it to be pulled from multiple sources depending on the needs of the application. This document explains how that goal can be achieved.";
11
12 // First 50 lines of the Iliad, in precomposed Greek
13 // (The Iliad is thousands of years old and public domain)
14 // Sources can be found in https://www.perseus.tufts.edu/hopper/text?doc=Perseus:text:1999.01.0133 or https://www.sacred-texts.com/cla/homer/greek/ili01.htm
15 const ILIAD: &str = include_str!("data/Iliad.txt");
16
overview_bench(c: &mut Criterion)17 fn overview_bench(c: &mut Criterion) {
18 let casemapper = CaseMapper::new();
19 let root = langid!("und");
20 let tr = langid!("tr");
21 c.bench_function("icu_casemap/overview", |b| {
22 b.iter(|| {
23 black_box(casemapper.lowercase_to_string(black_box(TEST_STRING_EN), &root));
24 black_box(casemapper.uppercase_to_string(black_box(TEST_STRING_EN), &root));
25 });
26 });
27
28 c.bench_function("icu_casemap/titlecase_segment", |b| {
29 b.iter(|| {
30 for s in TEST_STRING_EN.split(' ') {
31 black_box(casemapper.titlecase_segment_with_only_case_data_to_string(
32 black_box(s),
33 &root,
34 Default::default(),
35 ));
36 }
37 });
38 });
39
40 c.bench_function("icu_casemap/folding", |b| {
41 b.iter(|| {
42 black_box(casemapper.fold_string(black_box(TEST_STRING_EN)));
43 });
44 });
45 c.bench_function("icu_casemap/uppercase_tr", |b| {
46 b.iter(|| {
47 black_box(casemapper.uppercase_to_string(black_box(TEST_STRING_EN), &tr));
48 });
49 });
50 }
greek_uppercasing(_c: &mut Criterion)51 fn greek_uppercasing(_c: &mut Criterion) {
52 {
53 let c = _c;
54 let casemapper = CaseMapper::new();
55 let root = langid!("und");
56 let el = langid!("el");
57
58 let iliad_lowercase = casemapper.lowercase_to_string(ILIAD, &root);
59 let decomposer = DecomposingNormalizerBorrowed::new_nfd();
60 let nfd = decomposer.normalize_utf8(ILIAD.as_bytes());
61 let nfd_lowercase = decomposer.normalize_utf8(iliad_lowercase.as_bytes());
62
63 let mut group =
64 c.benchmark_group("icu_casemap/greek_uppercasing/precomposed/upper_from_title");
65 group.bench_function("root", |b| {
66 b.iter(|| {
67 black_box(casemapper.uppercase_to_string(black_box(ILIAD), &root));
68 });
69 });
70 group.bench_function("greek", |b| {
71 b.iter(|| {
72 black_box(casemapper.uppercase_to_string(black_box(ILIAD), &el));
73 });
74 });
75 group.finish();
76
77 let mut group =
78 c.benchmark_group("icu_casemap/greek_uppercasing/precomposed/upper_from_lower");
79 group.bench_function("root", |b| {
80 b.iter(|| {
81 black_box(casemapper.uppercase_to_string(black_box(&iliad_lowercase), &root));
82 });
83 });
84 group.bench_function("greek", |b| {
85 b.iter(|| {
86 black_box(casemapper.uppercase_to_string(black_box(&iliad_lowercase), &el));
87 });
88 });
89 group.finish();
90
91 let mut group =
92 c.benchmark_group("icu_casemap/greek_uppercasing/decomposed/upper_from_title");
93 group.bench_function("root", |b| {
94 b.iter(|| {
95 black_box(casemapper.uppercase_to_string(black_box(&nfd), &root));
96 });
97 });
98 group.bench_function("greek", |b| {
99 b.iter(|| {
100 black_box(casemapper.uppercase_to_string(black_box(&nfd), &el));
101 });
102 });
103 group.finish();
104
105 let mut group =
106 c.benchmark_group("icu_casemap/greek_uppercasing/decomposed/upper_from_lower");
107 group.bench_function("root", |b| {
108 b.iter(|| {
109 black_box(casemapper.uppercase_to_string(black_box(&nfd_lowercase), &root));
110 });
111 });
112 group.bench_function("greek", |b| {
113 b.iter(|| {
114 black_box(casemapper.uppercase_to_string(black_box(&nfd_lowercase), &el));
115 });
116 });
117 group.finish();
118 }
119 }
120 criterion_group!(benches, overview_bench, greek_uppercasing);
121 criterion_main!(benches);
122