• Home
  • Line#
  • Scopes#
  • Navigate#
  • Raw
  • Download
1 // Copyright (C) 2021 Google LLC
2 //
3 // Licensed under the Apache License, Version 2.0 (the "License");
4 // you may not use this file except in compliance with the License.
5 // You may obtain a copy of the License at
6 //
7 //      http://www.apache.org/licenses/LICENSE-2.0
8 //
9 // Unless required by applicable law or agreed to in writing, software
10 // distributed under the License is distributed on an "AS IS" BASIS,
11 // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 // See the License for the specific language governing permissions and
13 // limitations under the License.
14 
15 #ifndef ICING_TOKENIZATION_VERBATIM_H_
16 #define ICING_TOKENIZATION_VERBATIM_H_
17 
18 #include <memory>
19 #include <string_view>
20 #include <vector>
21 
22 #include "icing/text_classifier/lib3/utils/base/statusor.h"
23 #include "icing/tokenization/tokenizer.h"
24 
25 namespace icing {
26 namespace lib {
27 
28 // Provides verbatim tokenization on input text
29 class VerbatimTokenizer : public Tokenizer {
30  public:
31   libtextclassifier3::StatusOr<std::unique_ptr<Tokenizer::Iterator>> Tokenize(
32       std::string_view text) const override;
33 
34   libtextclassifier3::StatusOr<std::vector<Token>> TokenizeAll(
35       std::string_view text) const override;
36 };
37 
38 }  // namespace lib
39 }  // namespace icing
40 
41 #endif  // ICING_TOKENIZATION_VERBATIM_H_
42