Home
last modified time | relevance | path

Searched refs:sentence (Results 1 – 25 of 119) sorted by relevance

12345

/external/libtextclassifier/lang_id/
Dlang-id.cc70 int GetRealTextSize(const LightSentence &sentence) { in GetRealTextSize() argument
72 for (int i = 0; i < sentence.num_words(); ++i) { in GetRealTextSize()
73 TC_DCHECK(!sentence.word(i).empty()); in GetRealTextSize()
74 TC_DCHECK_EQ('^', sentence.word(i).front()); in GetRealTextSize()
75 TC_DCHECK_EQ('$', sentence.word(i).back()); in GetRealTextSize()
76 total += sentence.word(i).size() - 2; in GetRealTextSize()
204 LightSentence sentence; in ScoreLanguages() local
205 TokenizeTextForLangId(text, &sentence); in ScoreLanguages()
207 if (GetRealTextSize(sentence) < min_text_size_in_bytes_) { in ScoreLanguages()
214 lang_id_brain_interface_.GetFeatures(&sentence, &features); in ScoreLanguages()
Dlanguage-identifier-features.cc47 const LightSentence &sentence) const { in ComputeNgramCounts()
61 for (int i = 0; i < sentence.num_words(); ++i) { in ComputeNgramCounts()
62 const std::string &word = sentence.word(i); in ComputeNgramCounts()
118 const LightSentence &sentence, in Evaluate() argument
121 int total_count = ComputeNgramCounts(sentence); in Evaluate()
Dlang-id-brain-interface.h62 void GetFeatures(LightSentence *sentence, in GetFeatures() argument
66 feature_extractor_.Preprocess(&workspace, sentence); in GetFeatures()
67 return feature_extractor_.ExtractFeatures(workspace, *sentence, features); in GetFeatures()
Drelevant-script-feature.cc41 const LightSentence &sentence, in Evaluate() argument
53 for (int i = 0; i < sentence.num_words(); ++i) { in Evaluate()
54 const std::string &word = sentence.word(i); in Evaluate()
Dlanguage-identifier-features.h48 void Evaluate(const WorkspaceSet &workspaces, const LightSentence &sentence,
57 int ComputeNgramCounts(const LightSentence &sentence) const;
Dcustom-tokenizer.cc55 void TokenizeTextForLangId(const std::string &text, LightSentence *sentence) { in TokenizeTextForLangId() argument
80 std::string *word = sentence->add_word(); in TokenizeTextForLangId()
Dcustom-tokenizer.h36 void TokenizeTextForLangId(const std::string &text, LightSentence *sentence);
Drelevant-script-feature.h47 void Evaluate(const WorkspaceSet &workspaces, const LightSentence &sentence,
/external/python/cpython2/Lib/test/cjkencodings/
Dhz-utf8.txt1 This sentence is in ASCII.
2 The next sentence is in GB.己所不欲,勿施於人。Bye.
Dhz.txt1 This sentence is in ASCII.
2 The next sentence is in GB.~{<:Ky2;S{#,NpJ)l6HK!#~}Bye.
/external/icu/icu4c/source/test/testdata/break_rules/
Dsentence.txt6 # file: sentence.txt
8 type = sentence; # one of grapheme | word | line | sentence
/external/icu/icu4c/source/test/cintltst/
Dcbiapts.c151 UBreakIterator *word, *sentence, *line, *character, *b, *bogus; in TestBreakIteratorCAPI() local
180 sentence = ubrk_open(UBRK_SENTENCE, "en_US", text, u_strlen(text), &status); in TestBreakIteratorCAPI()
309 ubrk_first(sentence); in TestBreakIteratorCAPI()
310 pos = ubrk_current(sentence); in TestBreakIteratorCAPI()
312 pos = ubrk_last(sentence); in TestBreakIteratorCAPI()
316 ubrk_first(sentence); in TestBreakIteratorCAPI()
317 to = ubrk_following( sentence, 0 ); in TestBreakIteratorCAPI()
319 to = ubrk_preceding( sentence, to ); in TestBreakIteratorCAPI()
321 if (ubrk_first(sentence)!=ubrk_current(sentence)) { in TestBreakIteratorCAPI()
363 ubrk_close(sentence); in TestBreakIteratorCAPI()
/external/icu/icu4j/demos/src/com/ibm/icu/dev/demo/translit/
DDemo.java699 String sentence = coreSentence.substring(oldPos, pos).trim(); in genTestFile() local
703 addSentenceToTable(out, sentence, in genTestFile()
770 static void addSentenceToTable(PrintWriter out, String sentence, in addSentenceToTable() argument
773 if (sentence.length() == 0) return; // skip empty lines in addSentenceToTable()
775 String originalShow = sentence; in addSentenceToTable()
777 latin = tl.transliterate(saveAscii.transliterate(sentence)); in addSentenceToTable()
790 String NFKDSentence = Normalizer.normalize(sentence, Normalizer.NFKD); in addSentenceToTable()
803 if (minLen > sentence.length()) minLen = sentence.length(); in addSentenceToTable()
806 if (reverse.charAt(i) != sentence.charAt(i)) break; in addSentenceToTable()
812 : showDifference(sentence, reverse); in addSentenceToTable()
[all …]
/external/mesa3d/docs/specs/
DMESA_multithread_makecurrent.spec66 Replace the following sentence from section 2.2 Rendering Contexts:
78 Replace the following sentence from section 3.3.7 Rendering Contexts:
85 Replace the following sentence from section 3.5 Rendering Contexts:
/external/icu/icu4c/source/data/brkitr/
Del.txt6 sentence:process(dependency){"sent_el.brk"}
Droot.txt11 sentence:process(dependency){"sent.brk"}
/external/snakeyaml/src/test/resources/pyyaml/
Dspec-08-10.data7 This sentence
Dspec-08-10.canonical11 : !!str "This sentence
/external/llvm/test/YAMLParser/
Dspec-08-10.test9 This sentence
/external/svox/pico/tests/data/
Dtests_regressions_es-ES.txt12 # TEST (old bug: burst of noise at end of sentence)
/external/python/cpython2/Doc/library/
Dtextwrap.rst167 sentence endings and ensure that sentences are always separated by exactly
169 However, the sentence detection algorithm is imperfect: it assumes that a
170 sentence ending consists of a lowercase letter followed by one of ``'.'``,
183 Since the sentence detection algorithm relies on ``string.lowercase`` for
/external/python/cpython2/Misc/
DREADME.Emacs29 sentence-end-double-space: t
/external/icu/icu4c/source/test/testdata/
Drbbitst.txt14 # <sent> any following data is for sentence break testing
411 <data>•Here is a random sentence, no ending period<100></data>
414 <data>• (This is it). •Testing the sentence iterator. •\
416 •This is a simple sample sentence. •(This is it.) •This is a simple sample sentence. •\
418 Hi! •This is a simple sample sentence. •It does not have to make any sense as you can see. •Nel mez…
455 # Breaks around '(' following a sentence TERM. (Rule 9)
493 # test for bug #4152117: Make sure sentence breaking is handling
500 # sentence breaks for hindi which used Devanagari script
501 # make sure there is sentence break after ?,danda(hindi phrase separator),
513 # Try a few more of the less common sentence endings.
[all …]
/external/icu/android_icu4j/src/main/tests/android/icu/dev/test/rbbi/
Drbbitst.txt14 # <sent> any following data is for sentence break testing
411 <data>•Here is a random sentence, no ending period<100></data>
414 <data>• (This is it). •Testing the sentence iterator. •\
416 •This is a simple sample sentence. •(This is it.) •This is a simple sample sentence. •\
418 Hi! •This is a simple sample sentence. •It does not have to make any sense as you can see. •Nel mez…
455 # Breaks around '(' following a sentence TERM. (Rule 9)
493 # test for bug #4152117: Make sure sentence breaking is handling
500 # sentence breaks for hindi which used Devanagari script
501 # make sure there is sentence break after ?,danda(hindi phrase separator),
513 # Try a few more of the less common sentence endings.
[all …]
/external/icu/icu4j/main/tests/core/src/com/ibm/icu/dev/test/rbbi/
Drbbitst.txt14 # <sent> any following data is for sentence break testing
411 <data>•Here is a random sentence, no ending period<100></data>
414 <data>• (This is it). •Testing the sentence iterator. •\
416 •This is a simple sample sentence. •(This is it.) •This is a simple sample sentence. •\
418 Hi! •This is a simple sample sentence. •It does not have to make any sense as you can see. •Nel mez…
455 # Breaks around '(' following a sentence TERM. (Rule 9)
493 # test for bug #4152117: Make sure sentence breaking is handling
500 # sentence breaks for hindi which used Devanagari script
501 # make sure there is sentence break after ?,danda(hindi phrase separator),
513 # Try a few more of the less common sentence endings.
[all …]

12345