from whoosh import fields, index
import os.path
import csv
import codecs
# Field names, in the order the values appear on each input line.
columns = ["juza", "chapter", "verse", "analysis"]

# Index schema: the three position fields are numeric and the analysis text
# is a KEYWORD field.
# NOTE(review): no field is declared with stored=True, so search hits will
# presumably carry no retrievable values -- confirm this is intended.
schema = fields.Schema(juza=fields.NUMERIC,
                       chapter=fields.NUMERIC,
                       verse=fields.NUMERIC,
                       analysis=fields.KEYWORD)

# Create the Whoosh index; the target directory has to exist first.
indexname = "index"
if not os.path.exists(indexname):
    os.mkdir(indexname)
ix = index.create_in(indexname, schema)

# The writer is used as a context manager, which commits on a clean exit, so
# there is deliberately no explicit writer.commit() call: a second commit on
# the already-closed writer would fail.
with ix.writer() as writer:
    # Each non-blank line holds: juza chapter verse analysis
    # (whitespace-separated; the analysis part may itself contain spaces).
    with codecs.open("yom.csv", "rb", "utf8") as csvfile:
        for lineno, line in enumerate(csvfile, 1):
            line = line.strip()
            if not line:
                # Tolerate blank lines (e.g. a trailing newline at EOF).
                continue

            parts = line.split(None, len(columns) - 1)
            if len(parts) != len(columns):
                raise ValueError(
                    "yom.csv line %d: expected %d fields, got %d"
                    % (lineno, len(columns), len(parts)))
            juza, chapter, verse, analysis = parts

            # Pair every column name with the value parsed for it.  The
            # numeric fields are converted here so that a malformed number
            # fails at the offending line instead of inside the indexer.
            doc = dict(zip(columns,
                           (int(juza), int(chapter), int(verse), analysis)))

            # Pass the dictionary to the add_document method
            writer.add_document(**doc)