import codecs
import json
import os

from ox.text import findRe

# NOTE(review): the HTML tags inside the original string literals were lost
# (the literals contained fewer "%s" placeholders than arguments and spanned
# physical lines).  The templates below are a reconstruction based on the
# surviving text ("Time: %s", "View on Padma") and on the argument tuples
# that were passed to each literal -- confirm the exact markup, and in
# particular the Pad.ma URL scheme, against a known-good copy of the output.
_INDEX_ENTRY_TEMPLATE = u"<a href='%s'>%s</a><br />Time: %s<br />\n"
_PADMA_LINK_TEMPLATE = u"<a href='http://pad.ma/%s'>View on Padma</a><br />\n"
_AUDIO_TEMPLATE = u"<audio controls='controls'>\n<source src='%s' />\n</audio>\n\n"
_TAPE_PAGE_TEMPLATE = (
    u"<audio controls='controls'>\n<source src='%s' />\n</audio>\n"
    u"<pre>\n%s\n</pre>\n"
)

_TITLE_REGEX = r'Title: (.*?)\n'
_TIME_REGEX = r'Time: (.*?)\n'


def do():
    """Generate one HTML page per tape plus an ``index.html`` linking them.

    Reads ``ChronoArr_Srt.txt`` (UTF-8) and splits it on ``***`` into tape
    sections, and reads ``radia.json``, which is indexed by position and
    whose entries provide the ``hid`` and ``name`` keys.  Section *i* is
    paired with metadata entry *i*; sections beyond the end of the metadata
    are ignored.

    For every pair, ``tapes/<i>.html`` is written with an audio player for
    ``<name>.wav`` and the section text, and an entry (link, time, Pad.ma
    link, audio player) is appended to ``index.html`` in the current
    directory.  The title and the audio markup of each tape are printed as
    progress output.

    Text is inserted into the HTML verbatim, without escaping.
    """
    with codecs.open("ChronoArr_Srt.txt", mode="r", encoding="utf-8") as f:
        txt = f.read()
    with codecs.open("radia.json", mode="r", encoding="utf-8") as meta_file:
        data = json.load(meta_file)

    # The per-tape pages are written below this directory; create it up
    # front instead of failing on the first write.
    if not os.path.isdir("tapes"):
        os.makedirs("tapes")

    index_parts = []
    # zip() stops at the shorter input, which matches the original
    # "stop once we run out of metadata" guard.
    for counter, (tape, meta) in enumerate(zip(txt.split("***"), data)):
        padma_id = meta['hid']
        audio_file = meta['name'] + u'.wav'
        full_txt = tape.strip()

        # presumably findRe returns the first captured group of the
        # pattern -- confirm against ox.text
        title = findRe(full_txt, _TITLE_REGEX)
        time_str = findRe(full_txt, _TIME_REGEX)
        outfile = "tapes/%d.html" % (counter,)
        print(title)

        audio_html = _AUDIO_TEMPLATE % (audio_file,)
        print(audio_html)

        index_parts.append(_INDEX_ENTRY_TEMPLATE % (outfile, title, time_str))
        index_parts.append(_PADMA_LINK_TEMPLATE % (padma_id,))
        index_parts.append(audio_html)

        with codecs.open(outfile, mode="w", encoding="utf-8") as out:
            out.write(_TAPE_PAGE_TEMPLATE % (audio_file, full_txt))

    with codecs.open("index.html", mode="w", encoding="utf-8") as index_file:
        index_file.write(u''.join(index_parts))