You cannot select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
39 lines
972 B
Python
39 lines
972 B
Python
import sys
|
|
|
|
from collections import Counter

# Punctuation that separates words.  Each character is mapped to a space so
# that str.split() breaks words apart wherever one of them occurs.
_SEPARATORS = str.maketrans(dict.fromkeys(",.—:;!?/\\", " "))


def count_words(text):
    """Return a Counter mapping each word in *text* to its frequency.

    The text is lower-cased, the punctuation in ``_SEPARATORS`` is turned
    into spaces, and the result is split on whitespace.  Keys appear in
    order of first occurrence, because Counter is a dict subclass.
    """
    # Every line boundary recognised by str.splitlines() is also whitespace
    # for str.split(), so splitting the whole text at once yields the same
    # words as splitting it line by line.
    return Counter(text.lower().translate(_SEPARATORS).split())


def main(argv=None):
    """Print word statistics for the file named by the first argument.

    Args:
        argv: Command-line arguments without the program name.  Defaults to
            ``sys.argv[1:]``.  Arguments after the first are ignored.

    Output (stdout): the total word count, the number of distinct words,
    then one ``word - count`` line per distinct word in order of first
    occurrence.

    Raises:
        SystemExit: With a usage message when no file name is given.
        OSError: If the file cannot be opened.
        UnicodeDecodeError: If the file is not valid UTF-8.
    """
    args = sys.argv[1:] if argv is None else argv
    if not args:
        sys.exit("usage: " + sys.argv[0] + " <file>")

    # Decode explicitly as UTF-8: the separator set contains the non-ASCII
    # em dash, which would never match under a legacy locale encoding.
    # The context manager guarantees the handle is closed.
    with open(args[0], "r", encoding="utf-8") as source:
        counts = count_words(source.read())

    print("Total Words:", sum(counts.values()))
    print("Unique Words:", len(counts))
    for word, occurrences in counts.items():
        print(word, "-", occurrences)


if __name__ == "__main__":
    main()
|