// Copyright (C) 2019 Google LLC // // Licensed under the Apache License, Version 2.0 (the "License"); // you may not use this file except in compliance with the License. // You may obtain a copy of the License at // // http://www.apache.org/licenses/LICENSE-2.0 // // Unless required by applicable law or agreed to in writing, software // distributed under the License is distributed on an "AS IS" BASIS, // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. // See the License for the specific language governing permissions and // limitations under the License. #ifndef ICING_TOKENIZATION_RAW_QUERY_TOKENIZER_H_ #define ICING_TOKENIZATION_RAW_QUERY_TOKENIZER_H_ #include #include #include #include "icing/text_classifier/lib3/utils/base/statusor.h" #include "icing/tokenization/language-segmenter.h" #include "icing/tokenization/token.h" #include "icing/tokenization/tokenizer.h" namespace icing { namespace lib { class RawQueryTokenizer : public Tokenizer { public: explicit RawQueryTokenizer(const LanguageSegmenter* language_segmenter) : language_segmenter_(*language_segmenter) {} libtextclassifier3::StatusOr> Tokenize( std::string_view text) const override; libtextclassifier3::StatusOr> TokenizeAll( std::string_view text) const override; private: // Used to segment input texts based on language understanding const LanguageSegmenter& language_segmenter_; }; } // namespace lib } // namespace icing #endif // ICING_TOKENIZATION_RAW_QUERY_TOKENIZER_H_