1 /*
2 * Copyright (C) 2018 The Android Open Source Project
3 *
4 * Licensed under the Apache License, Version 2.0 (the "License");
5 * you may not use this file except in compliance with the License.
6 * You may obtain a copy of the License at
7 *
8 * http://www.apache.org/licenses/LICENSE-2.0
9 *
10 * Unless required by applicable law or agreed to in writing, software
11 * distributed under the License is distributed on an "AS IS" BASIS,
12 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13 * See the License for the specific language governing permissions and
14 * limitations under the License.
15 */
16
17 #include "utils/codepoint-range.h"
18
19 #include <algorithm>
20
21 namespace libtextclassifier3 {
22
23 // Returns a sorted list of the codepoint ranges.
SortCodepointRanges(const std::vector<const CodepointRange * > & codepoint_ranges,std::vector<CodepointRangeStruct> * sorted_codepoint_ranges)24 void SortCodepointRanges(
25 const std::vector<const CodepointRange*>& codepoint_ranges,
26 std::vector<CodepointRangeStruct>* sorted_codepoint_ranges) {
27 sorted_codepoint_ranges->clear();
28 sorted_codepoint_ranges->reserve(codepoint_ranges.size());
29 for (const CodepointRange* range : codepoint_ranges) {
30 sorted_codepoint_ranges->push_back(
31 CodepointRangeStruct(range->start(), range->end()));
32 }
33
34 std::sort(sorted_codepoint_ranges->begin(), sorted_codepoint_ranges->end(),
35 [](const CodepointRangeStruct& a, const CodepointRangeStruct& b) {
36 return a.start < b.start;
37 });
38 }
39
40 // Returns true if given codepoint is covered by the given sorted vector of
41 // codepoint ranges.
IsCodepointInRanges(int codepoint,const std::vector<CodepointRangeStruct> & codepoint_ranges)42 bool IsCodepointInRanges(
43 int codepoint, const std::vector<CodepointRangeStruct>& codepoint_ranges) {
44 auto it = std::lower_bound(
45 codepoint_ranges.begin(), codepoint_ranges.end(), codepoint,
46 [](const CodepointRangeStruct& range, int codepoint) {
47 // This function compares range with the
48 // codepoint for the purpose of finding the first
49 // greater or equal range. Because of the use of
50 // std::lower_bound it needs to return true when
51 // range < codepoint; the first time it will
52 // return false the lower bound is found and
53 // returned.
54 //
55 // It might seem weird that the condition is
56 // range.end <= codepoint here but when codepoint
57 // == range.end it means it's actually just
58 // outside of the range, thus the range is less
59 // than the codepoint.
60 return range.end <= codepoint;
61 });
62 if (it != codepoint_ranges.end() && it->start <= codepoint &&
63 it->end > codepoint) {
64 return true;
65 } else {
66 return false;
67 }
68 }
69
70 } // namespace libtextclassifier3
71