summaryrefslogtreecommitdiff
path: root/vendor/github.com/DavidBelicza/TextRank/v2/convert/builder.go
blob: db94cfc52fe4e56c57ad115b2d00008679dab6c0 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
package convert

import (
	"github.com/DavidBelicza/TextRank/v2/parse"
	"github.com/DavidBelicza/TextRank/v2/rank"
)

// TextToRank feeds one parsed sentence into ranks as preparation for later
// ranking. The sentence's original text is registered first, which yields its
// sentence ID; the sentence's words are then added to ranks under that ID,
// using lang to filter and normalise them.
func TextToRank(sentence parse.ParsedSentence, lang Language, ranks *rank.Rank) {
	// The sentence must be registered before its words so that every word
	// can be tagged with the sentence ID.
	sentenceID := addSentence(ranks, sentence)
	words := sentence.GetWords()

	addWord(ranks, words, lang, sentenceID)
}

// addWord walks words in order and records each non-stop word in ranks for
// the sentence identified by sentenceID. When lang reports a root form for a
// word, the root form is recorded instead. Each recorded word is linked to
// the previously recorded word of the same call via a relation and a right
// connection.
func addWord(ranks *rank.Rank, words []string, lang Language, sentenceID int) {
	// -1 is passed as the "previous word" for the first recorded word;
	// presumably the rank package treats it as "no predecessor" (verify there).
	lastID := -1

	for _, raw := range words {
		if lang.IsStopWord(raw) {
			continue
		}

		// Prefer the root form when the language knows one.
		term := raw
		if ok, root := lang.FindRootWord(raw); ok {
			term = root
		}

		var id int
		if ranks.IsWordExist(term) {
			id = ranks.UpdateWord(term, lastID, sentenceID)
		} else {
			id = ranks.AddNewWord(term, lastID, sentenceID)
		}

		ranks.Relation.AddRelation(id, lastID, sentenceID)
		ranks.UpdateRightConnection(lastID, id)

		// Stop words are skipped above, so this only advances on recorded words.
		lastID = id
	}
}

// addSentence stores the original text of sentence in ranks.SentenceMap and
// returns the key it was stored under. The key is the number of entries the
// map held before the insertion, so IDs are 0, 1, 2, ... as long as the map
// is only ever filled through this function.
func addSentence(ranks *rank.Rank, sentence parse.ParsedSentence) int {
	// Capture the key once and return that same value. Recomputing it as
	// len(map)-1 after the write would disagree with the key actually used
	// whenever the write overwrote an existing entry (length unchanged).
	sentenceID := len(ranks.SentenceMap)
	ranks.SentenceMap[sentenceID] = sentence.GetOriginal()

	return sentenceID
}