This commit is contained in:
Patrice Matz 2018-11-18 09:24:34 +01:00
parent d2020dd394
commit eab21fbf85
3 changed files with 45 additions and 1 deletions

View File

@ -1 +1,3 @@
words-over-length
# Wordcount
Plots, for each frequently used word, how many times it has occurred so far against its position in the text.
![](Unbenannt.PNG)

BIN
Unbenannt.PNG Normal file

Binary file not shown.

After

Width:  |  Height:  |  Size: 1.5 MiB

42
count.py Normal file
View File

@ -0,0 +1,42 @@
import matplotlib.pyplot as plt
import plotly.plotly as py
# Path to a Word document.
# NOTE(review): no active code in this file reads this value; main() opens
# "test.txt" instead. Confirm whether it is still needed.
filePath = "./test.docx"
def _word_positions(lines):
    """Map every word to the running word indexes at which it occurs.

    Args:
        lines: An iterable of text lines (for example an open text file).

    Returns:
        A dict whose keys are the distinct words and whose values are lists
        of 0-based positions, counted in words from the start of the text,
        in increasing order.
    """
    positions = {}
    index = 0
    for line in lines:
        # split() with no argument splits on any whitespace run, so the
        # trailing newline is not glued to the last word of a line and
        # repeated spaces do not yield empty "words".
        for word in line.split():
            positions.setdefault(word, []).append(index)
            index += 1
    return positions


def main(filename="test.txt", threshold=10):
    """Plot the cumulative use of frequent words over the length of a text.

    For every word that occurs more than ``threshold`` times, one line is
    drawn: x is the position (in words) of each occurrence, y is the number
    of earlier occurrences of that word (0 for the first one).

    Args:
        filename: Path of the plain-text file to analyse.
        threshold: A word is plotted only if it occurs more than this many
            times.

    Raises:
        OSError: If ``filename`` cannot be opened.
    """
    # The context manager closes the file even if reading fails part-way.
    with open(filename, 'r') as handle:
        positions = _word_positions(handle)

    plotted_words = []
    for word, occurrences in positions.items():
        if len(occurrences) > threshold:
            plt.plot(occurrences, list(range(len(occurrences))))
            plotted_words.append(word)

    # Legend entries are matched to the plotted lines in plotting order.
    plt.legend(plotted_words)
    plt.show()
# Run the analysis only when this file is executed as a script, not when it
# is imported as a module.
if __name__ == "__main__":
    main()