mirror of
https://github.com/pds-nest/nest.git
synced 2024-11-22 21:14:18 +00:00
28 lines
636 B
JavaScript
28 lines
636 B
JavaScript
import sw from "stopword"
|
|
|
|
|
|
// Words that are never counted: the `it` and `en` lists exported by the "stopword" package,
// plus the literal token "rt" (presumably the retweet marker; confirm with the data source).
const stopwords = [
    ...sw.it,
    ...sw.en,
    "rt",
]
|
|
|
|
|
|
/**
 * Count how many times each word occurs across the `content` of the given tweets.
 *
 * Each tweet's content is lowercased and split on runs of whitespace. A token is skipped when it is
 * empty, is listed in the module-level `stopwords`, or starts with "https://".
 *
 * @param {Iterable<{content?: string}>} [tweets=[]] - Tweets to scan; tweets with a falsy `content` are ignored.
 * @returns {Object<string, number>} Plain object mapping each counted word to its number of occurrences.
 */
export default function countTweetWords(tweets = []) {
    // Build the lookup once per call instead of scanning the stopword array for every token.
    const ignored = new Set(stopwords)

    // Counting in a Map keeps tokens such as "__proto__" from touching the object prototype.
    const counts = new Map()

    for(const tweet of tweets) {
        if(!tweet.content) {
            continue
        }

        for(const word of tweet.content.toLowerCase().split(/\s+/)) {
            // Leading or trailing whitespace makes split() yield empty strings; they are not words.
            if(word === "" || ignored.has(word) || word.startsWith("https://")) {
                continue
            }

            counts.set(word, (counts.get(word) || 0) + 1)
        }
    }

    // Object.fromEntries defines own data properties, so every counted token survives as a key.
    return Object.fromEntries(counts)
}
|