过滤空白字符
This commit is contained in:
parent
1c2237a66f
commit
fc16ab7c5d
|
@ -27,7 +27,7 @@ class AsyncWordCloudGenerator:
|
|||
|
||||
async def generate_word_frequency_and_cloud(self, data, save_words_prefix):
|
||||
all_text = ' '.join(item['content'] for item in data)
|
||||
words = [word for word in jieba.lcut(all_text) if word not in self.stop_words]
|
||||
words = [word for word in jieba.lcut(all_text) if word not in self.stop_words and len(word.strip()) > 0]
|
||||
word_freq = Counter(words)
|
||||
|
||||
# Save word frequency to file
|
||||
|
|
Loading…
Reference in New Issue