From 2d447ad45b70fd5727040be82e0f61626c2dde0b Mon Sep 17 00:00:00 2001 From: Gea-Suan Lin Date: Fri, 9 Feb 2024 14:33:07 +0800 Subject: [PATCH] Change TF from [id][term] to [term][id]. --- cmd/ir-tfidf/main.go | 8 ++++---- 1 file changed, 4 insertions(+), 4 deletions(-) diff --git a/cmd/ir-tfidf/main.go b/cmd/ir-tfidf/main.go index 0a1ed64..8899b8e 100644 --- a/cmd/ir-tfidf/main.go +++ b/cmd/ir-tfidf/main.go @@ -21,12 +21,12 @@ func main() { bag := tokenizer.Tokenize(str) tokens[article.Id] = bag - // Init TF: - tf[article.Id] = make(map[string]int) - for _, w := range bag { // Handle TF: - tf[article.Id][w] = strings.Count(str, w) + if _, ok := tf[w]; !ok { + tf[w] = make(map[string]int) + } + tf[w][article.Id] += strings.Count(str, w) // Handle DF: df[w] += 1