1
Fork 0
mirror of https://github.com/pds-nest/nest.git synced 2024-10-17 04:17:26 +00:00
pds-2021-g2-nest/nest_frontend/utils/countTweetWords.js

28 lines
636 B
JavaScript

import sw from "stopword"
// Words that countTweetWords leaves out of its tally: the `it` and `en` lists
// exported by the "stopword" package (presumably Italian and English — confirm
// against the package docs) plus the literal token "rt" (presumably the
// retweet marker).
const stopwords = [...sw.it, ...sw.en, "rt"]
/**
 * Count how many times each word occurs in the `content` of the given tweets.
 *
 * Each tweet's content is lowercased and split on runs of whitespace. A token
 * is left out of the tally when it is empty, when it is listed in the
 * module-level `stopwords`, or when it starts with "https://".
 *
 * @param {Array<{content?: string}>} [tweets=[]] - Tweets to scan; entries with
 *     a falsy `content` are skipped.
 * @returns {Object<string, number>} Plain object mapping each remaining
 *     lowercase token to its number of occurrences.
 */
export default function countTweetWords(tweets = []) {
    // Built once per call so every membership check below is a constant-time
    // lookup instead of a scan over the whole stopword array.
    const ignored = new Set(stopwords)

    // Tally in a Map rather than directly on an object: assigning a key such
    // as "__proto__" on a plain object goes through the inherited accessor
    // and the count would be silently lost.
    const counts = new Map()

    for(const tweet of tweets) {
        if(!tweet.content) {
            continue
        }

        for(const word of tweet.content.toLowerCase().split(/\s+/)) {
            // Leading or trailing whitespace makes split() emit empty strings,
            // which are not words.
            if(word === "") {
                continue
            }
            if(ignored.has(word)) {
                continue
            }
            if(word.startsWith("https://")) {
                continue
            }

            counts.set(word, (counts.get(word) || 0) + 1)
        }
    }

    // Object.fromEntries defines own data properties, so every token
    // (including "__proto__") ends up as a regular key on a plain object.
    return Object.fromEntries(counts)
}