From 1e5b1dcf9ab90fec1dd71a51e87c484a5abd8c32 Mon Sep 17 00:00:00 2001 From: Gea-Suan Lin Date: Sun, 11 Feb 2024 14:32:09 +0800 Subject: [PATCH] Use os.Args[1] as the query string; always lowercase article text and the query before tokenizing. --- cmd/ir-tfidf/main.go | 7 ++++--- 1 file changed, 4 insertions(+), 3 deletions(-) diff --git a/cmd/ir-tfidf/main.go b/cmd/ir-tfidf/main.go index f4f42a2..d6d7cc7 100644 --- a/cmd/ir-tfidf/main.go +++ b/cmd/ir-tfidf/main.go @@ -18,7 +18,7 @@ func main() { df := make(map[string]int) for _, article := range articles { - str := article.Title + "\n" + article.Body + str := strings.ToLower(article.Title + "\n" + article.Body) bag := tokenizer.Tokenize(str) tokens[article.Id] = bag @@ -37,11 +37,12 @@ func main() { fmt.Println("TF & DF Built") - q := os.Args[1:] + q := strings.ToLower(os.Args[1]) + q_tokens := tokenizer.Tokenize(q) for _, article := range articles { var score float64 = 0.0 - for _, w := range q { + for _, w := range q_tokens { if tf[w] != nil { score += float64(tf[w][article.Id]) * math.Log2(float64(len(articles) / df[w])) }