|
@@ -7,10 +7,10 @@ def get_value(pair): |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
def get_word(chunk): |
|
|
def get_word(chunk): |
|
|
if all(x.isalpha() for x in chunk): |
|
|
|
|
|
|
|
|
if all(x.isalpha() for x in chunk): # is_alpha() |
|
|
if len(chunk) < 4: |
|
|
if len(chunk) < 4: |
|
|
return None |
|
|
return None |
|
|
return chunk.lower() |
|
|
|
|
|
|
|
|
return chunk.lower() # lower() |
|
|
else: |
|
|
else: |
|
|
return None |
|
|
return None |
|
|
|
|
|
|
|
@@ -18,19 +18,28 @@ def get_word(chunk): |
|
|
def main(): |
|
|
def main(): |
|
|
filename = sys.argv[1] |
|
|
filename = sys.argv[1] |
|
|
file = open(filename, "r") |
|
|
file = open(filename, "r") |
|
|
|
|
|
lines = file.readlines() |
|
|
|
|
|
file.close() |
|
|
|
|
|
|
|
|
scores = {} |
|
|
scores = {} |
|
|
|
|
|
|
|
|
for line in file.readlines(): |
|
|
|
|
|
|
|
|
for line in lines: |
|
|
for chunk in line.split(): |
|
|
for chunk in line.split(): |
|
|
word = get_word(chunk) |
|
|
word = get_word(chunk) |
|
|
if word: |
|
|
if word: |
|
|
if not word in scores: |
|
|
if not word in scores: |
|
|
scores[word] = 0 |
|
|
|
|
|
|
|
|
scores[word] = 1 |
|
|
else: |
|
|
else: |
|
|
scores[word] += 1 |
|
|
scores[word] += 1 |
|
|
|
|
|
|
|
|
file.close() |
|
|
|
|
|
|
|
|
to_sort = [] |
|
|
|
|
|
for k in scores: # iterate on dicts |
|
|
|
|
|
v = scores[k] |
|
|
|
|
|
to_sort.append([v, k]) |
|
|
|
|
|
to_sort.sort() |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
print(to_sort[-10:]) |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
main() |
|
|
main() |