-
Notifications
You must be signed in to change notification settings - Fork 4
/
word_cloud.py
40 lines (31 loc) · 1.09 KB
/
word_cloud.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
#!/usr/bin/env python3
from wordcloud import WordCloud
from collections import Counter
import matplotlib.pyplot as plt
def open_file(path: str) -> str:
content = ""
with open(path, "r") as f:
content = f.readlines()
return " ".join(content)
all_words = ""
frase = open_file("texto.txt") # "hola a todos muchas palabras palabras hola muchas hola hola hola palabras palabras hola muchas hola hola hola palabras palabras hola muchas hola hola hola palabras palabras hola muchas hola hola hola"
palabras = frase.rstrip().split(" ")
# Counter(" ".join(palabras).split()).most_common(10)
# looping through all incidents and joining them to one text, to extract most common words
for arg in palabras:
tokens = arg.split()
all_words += " ".join(tokens) + " "
# print(all_words)
wordcloud = WordCloud(
background_color="white", min_font_size=5
).generate(all_words)
# print(all_words)
# plot the WordCloud image
plt.close()
plt.figure(figsize=(5, 5), facecolor=None)
plt.imshow(wordcloud)
plt.axis("off")
plt.tight_layout(pad=0)
# plt.show()
plt.savefig("img/word_cloud.png")
plt.close()