updated from Atlas
This commit is contained in:
28
03-dict-set/index0.py
Normal file
28
03-dict-set/index0.py
Normal file
@@ -0,0 +1,28 @@
|
||||
# adapted from Alex Martelli's example in "Re-learning Python"
|
||||
# http://www.aleax.it/Python/accu04_Relearn_Python_alex.pdf
|
||||
# (slide 41) Ex: lines-by-word file index
|
||||
|
||||
# BEGIN INDEX0
|
||||
"""Build an index mapping word -> list of occurrences"""
|
||||
|
||||
import sys
|
||||
import re
|
||||
|
||||
WORD_RE = re.compile('\w+')
|
||||
|
||||
index = {}
|
||||
with open(sys.argv[1], encoding='utf-8') as fp:
|
||||
for line_no, line in enumerate(fp, 1):
|
||||
for match in WORD_RE.finditer(line):
|
||||
word = match.group()
|
||||
column_no = match.start()+1
|
||||
location = (line_no, column_no)
|
||||
# this is ugly; coded like this to make a point
|
||||
occurrences = index.get(word, []) # <1>
|
||||
occurrences.append(location) # <2>
|
||||
index[word] = occurrences # <3>
|
||||
|
||||
# print in alphabetical order
|
||||
for word in sorted(index, key=str.upper): # <4>
|
||||
print(word, index[word])
|
||||
# END INDEX0
|
||||
Reference in New Issue
Block a user