Home
last modified time | relevance | path

Searched defs:indexedDocument (Results 1 – 6 of 6) sorted by relevance

/external/licenseclassifier/v2/
Ddocument.go39 type indexedDocument struct { struct
40 Norm string // The normalized token sequence
41 Tokens []indexedToken // ordered tokens of the document
42 …// these are matches identified while processing the original, untokenized text via regexp matching
43 f *frequencyTable // frequencies computed for this document
44 dict *dictionary // The corpus dictionary for this document
45 s *searchSet // The searchset for this document
46 runes []rune
49 func (d *indexedDocument) generateSearchSet(q int) {
53 func (d *indexedDocument) size() int {
[all …]
Ddiff.go48 func docDiff(id string, doc1 *indexedDocument, doc1Start, doc1End int, doc2 *indexedDocument, doc2S…
60 func diffWordsToRunes(doc *indexedDocument, start, end int) []rune {
Dfrequencies.go41 func (d *indexedDocument) tokenSimilarity(o *indexedDocument) float64 {
Dscoring.go36 func (c *Classifier) score(id string, unknown, known *indexedDocument, unknownStart, unknownEnd int…
Dtokenizer.go240 func appendToDoc(doc *indexedDocument, dict *dictionary, line int, in []tokenID, ld *dictionary, no…
Dsearchset.go58 func newSearchSet(s *indexedDocument, q int) *searchSet {