Counting word frequency in a text with Python: Difference between revisions
(New page: Exercise to produce a "word cloud" based on frequency of words in a text.) |
m (Michael Murtaugh moved page WordFreq.cgi to Counting word frequency in a text with Python) |
||
(One intermediate revision by the same user not shown) | |||
Line 1: | Line 1: | ||
<source lang="python"> | |||
import string | |||
wd = {} | |||
# for every line, every word in line, add it to the dictionary | |||
for line in open("text.txt"): | |||
for word in line.split(): | |||
word = word.strip(string.punctuation).lower() | |||
# wd[word] = True | |||
wd[word] = wd.get(word, 0) + 1 # for word counting | |||
# get the dictionary keys, and alphabetize | |||
allwords = wd.keys() | |||
allwords.sort() | |||
for word in allwords: | |||
# print w | |||
print word, wd[word] | |||
</source> |
Latest revision as of 11:34, 11 March 2014
import string


def count_words(lines):
    """Count how often each word occurs in an iterable of text lines.

    Each line is split on whitespace; every token has leading and trailing
    punctuation removed and is lower-cased before being counted.

    Args:
        lines: Any iterable of strings (an open text file works).

    Returns:
        A dict mapping each normalized word to its number of occurrences.
    """
    counts = {}
    for line in lines:
        for token in line.split():
            word = token.strip(string.punctuation).lower()
            # A token made only of punctuation (e.g. "--") strips down to
            # the empty string; it is not a word, so do not count it.
            if not word:
                continue
            counts[word] = counts.get(word, 0) + 1
    return counts


def main(path="text.txt"):
    """Print every word found in *path* with its count, alphabetically.

    Args:
        path: Text file to read; defaults to "text.txt".
    """
    # The context manager closes the file even if counting raises.
    with open(path) as source:
        counts = count_words(source)
    # sorted() works on both Python 2 and 3, unlike dict.keys().sort().
    for word in sorted(counts):
        # Single-argument print with %-formatting emits "word count"
        # identically under the Python 2 statement and the Python 3 function.
        print("%s %d" % (word, counts[word]))


if __name__ == "__main__":
    main()