python-stuff/wordcount.py

39 lines
972 B
Python

import sys
# Punctuation treated as a word separator, in addition to ordinary whitespace.
# The double quote belongs in this set: replacing the empty string ("")
# instead would insert a space between every character and make each
# character count as its own word.
_SEPARATORS = ',."' + ":;!?/\\"
_SEPARATOR_TABLE = str.maketrans(_SEPARATORS, " " * len(_SEPARATORS))


def count_words(text):
    """Count case-insensitive word occurrences in *text*.

    The text is lowercased, every character in ``_SEPARATORS`` is turned
    into a space, and the result is split on whitespace (which includes
    line breaks, so no separate per-line pass is needed).

    Args:
        text: The full input text as a single string.

    Returns:
        A dict mapping each lowercased word to the number of times it
        occurs, with keys in order of first appearance.
    """
    counts = {}
    for word in text.lower().translate(_SEPARATOR_TABLE).split():
        counts[word] = counts.get(word, 0) + 1
    return counts


def main(argv):
    """Print word statistics for the file named by ``argv[1]``.

    Output is the total word count, the number of distinct words, and then
    one ``word - count`` line per distinct word in first-seen order.

    Args:
        argv: Command-line argument list; ``argv[0]`` is the program name
            and ``argv[1]`` is the path of the text file to analyse.

    Returns:
        Process exit status: 0 on success, 2 when the path is missing.

    Raises:
        OSError: If the file cannot be opened or read.
    """
    if len(argv) < 2:
        print("usage: " + (argv[0] if argv else "wordcount.py") + " FILE",
              file=sys.stderr)
        return 2

    # The context manager guarantees the file handle is closed, even when
    # reading fails part-way through.
    with open(argv[1], "r") as source:
        counts = count_words(source.read())

    # The total is the sum of all per-word counts; the number of unique
    # words is simply the number of keys.
    print("Total Words: " + str(sum(counts.values())))
    print("Unique Words: " + str(len(counts)))
    for word, occurrences in counts.items():
        print(word + " - " + str(occurrences))
    return 0


if __name__ == "__main__":
    sys.exit(main(sys.argv))