added ignored words

This commit is contained in:
Patrice Matz 2018-11-24 20:56:54 +01:00
parent 56195eeb25
commit edd27b63eb
2 changed files with 27 additions and 8 deletions

4
.gitignore vendored
View File

@ -1,2 +1,6 @@
\.vscode/
test\.txt
*.txt

View File

@ -1,6 +1,14 @@
import matplotlib.pyplot as plt
# Lower-case German filler words (articles, prepositions, auxiliaries, ...)
# that main() skips when choosing which words to plot; it tests
# `word.lower() not in filtered`, so every entry must be lower-case.
# Kept as a frozenset: the lookup is constant-time, the collection cannot be
# mutated by accident, and an entry cannot be listed twice.
# NOTE(review): "werde,", "werde." and "werden." carry trailing punctuation,
# presumably because the words are not stripped of punctuation before the
# lookup -- confirm against the tokenizing code.
filtered = frozenset({
    "der", "die", "das", "ein", "eine", "einer", "es", "ist", "für", "im",
    "wird", "auch", "mit", "aus", "von", "als", "in", "werden", "wurde",
    "oder", "auf", "wie", "den", "zu", "dieser", "nicht", "sind", "des",
    "einen", "um", "können", "nur", "diese", "eines", "über", "hier", "dem",
    "so", "werde,", "werde.", "werden.", "dies", "muss", "alle", "an", "nach",
    "zum", "gibt", "da", "mehr", "dass",
})
def main():
filename = "test.txt"
allWords = {}
@ -18,19 +26,26 @@ def main():
# x,y,z for ribbon Plot
wordArray = [] #x
indexes = [] #y
counts = [] #z
#indexes = [] #y
#counts = [] #z
for word in allWords:
if len(allWords[word]) > 10:
if len(allWords[word]) > 10 and word.lower() not in filtered:
tmpArray = []
for index in allWords[word]:
tmpArray.append(len(tmpArray))
counts.append(tmpArray)
indexes.append(allWords[word])
#counts.append(tmpArray)
#indexes.append(allWords[word])
wordArray.append(word)
plt.plot(allWords[word], tmpArray)
plt.scatter(allWords[word], tmpArray)
print(word, len(tmpArray))
#plt.yscale('log')
plt.legend(wordArray)
plt.show()