Simple keyword extraction
go install github.com/next-lucasmenende/interpretext-keyword-extraction
If you want to extend stopword list, create a file, named as language code, into a any folder (for example: en
file will contain English stopwords). Then, set env var STOPWORDS
to that folder path.
Extended stopword lists can be found in Stopwords ISO profile.
package main
import (
"fmt"
tokenizer "github.com/next-lucasmenendez/interpretext-tokenizer"
keywords "github.com/next-lucasmenendez/interpretext-keyword-extractor"
)
func main() {
var limit int = 15
var lang string = "<input-lang>"
var text string = "<input-text>"
var words [][]string
for _, s := range tokenizer.Sentences(text) {
words = append(words, tokenizer.Words(s))
}
if tags, err := keywords.GetTags(words, lang, limit); err != nil {
fmt.Println(err)
} else {
fmt.Printf("%q\n", tags)
}
}