diff --git a/tools/words.py b/tools/words.py index d9f0a8c..3ca0778 100644 --- a/tools/words.py +++ b/tools/words.py @@ -27,7 +27,7 @@ class AsyncWordCloudGenerator: async def generate_word_frequency_and_cloud(self, data, save_words_prefix): all_text = ' '.join(item['content'] for item in data) - words = [word for word in jieba.lcut(all_text) if word not in self.stop_words] + words = [word for word in jieba.lcut(all_text) if word not in self.stop_words and len(word.strip()) > 0] word_freq = Counter(words) # Save word frequency to file