"""Generate the static HTML index (and per-tape pages) for the tape archive.

Inputs, all read from the current working directory:

* ``radia.json``        -- list of metadata records (keys used here:
                           ``name``, ``hid``, ``title``, ``dt-time``).
* ``ChronoArr_Srt.txt`` -- transcripts, one per tape, separated by ``***``.
* ``header.html`` / ``footer.html`` -- wrapped around the generated index.

Outputs: ``index.html`` and, for ``do()``, ``tapes/<n>.html``.
"""
from ox.text import findRe
import json
import codecs

# NOTE(review): the HTML markup inside every template below was lost from the
# copy of this file that was reviewed (only the text between tags and the
# ``%`` argument tuples survived).  The tags, attribute names and the Padma
# URL are a reconstruction chosen so that each template has exactly as many
# placeholders as the original argument tuple -- confirm against the intended
# page design before shipping.
_ENTRY_OPEN_TMPL = u'<div class="tape" data-name="%s" data-hid="%s">\n'
_ENTRY_TITLE_TMPL = u'<h3>%d> %s</h3>\n'
_ENTRY_TIME_TMPL = u'<p>%s</p>\n'
_ENTRY_CLOSE_TMPL = u"</div>\n\n"

_INDEX_LINK_TMPL = u'<a href="%s">%s</a><br />Time: %s<br />\n'
_PADMA_LINK_TMPL = u'<a href="http://pad.ma/%s">View on Padma</a><br />\n'
_AUDIO_TMPL = u'<audio src="%s" controls="controls"></audio><br />\n\n'
_TAPE_PAGE_TMPL = u'<audio src="%s" controls="controls"></audio>\n<pre>\n%s\n</pre>'

# Patterns handed to findRe to pull the header fields out of a transcript.
_TITLE_RE = r'Title: (.*?)\n'
_TIME_RE = r'Time: (.*?)\n'


def _read_text(path):
    """Return the full content of *path* decoded as UTF-8."""
    with codecs.open(path, mode="r", encoding="utf-8") as handle:
        return handle.read()


def _load_metadata():
    """Return the parsed content of ``radia.json``."""
    return json.loads(_read_text("radia.json"))


def _write_index(body):
    """Write ``index.html`` as header.html + *body* + footer.html."""
    # Read both wrappers before opening the output so that a missing
    # header/footer does not leave a truncated index.html behind.
    header = _read_text("header.html")
    footer = _read_text("footer.html")
    with codecs.open("index.html", mode="w", encoding="utf-8") as index_file:
        index_file.write(header)
        index_file.write(body)
        index_file.write(footer)


def JSONtoHTML():
    """Build ``index.html`` from the records in ``radia.json`` alone.

    Each record contributes one entry showing its 1-based position, its
    ``title`` and its ``dt-time``; ``name`` and ``hid`` are embedded in the
    entry's opening markup.
    """
    parts = []
    for number, entry in enumerate(_load_metadata(), 1):
        parts.append(_ENTRY_OPEN_TMPL % (entry['name'], entry['hid'],))
        parts.append(_ENTRY_TITLE_TMPL % (number, entry['title'],))
        parts.append(_ENTRY_TIME_TMPL % (entry['dt-time'],))
        parts.append(_ENTRY_CLOSE_TMPL)
    _write_index(u''.join(parts))


def do():
    """Build ``index.html`` and one ``tapes/<n>.html`` page per transcript.

    Transcripts from ``ChronoArr_Srt.txt`` are paired positionally with the
    records in ``radia.json``; processing stops at the shorter of the two.
    The ``tapes/`` directory must already exist.
    """
    records = _load_metadata()
    transcripts = _read_text("ChronoArr_Srt.txt").split("***")

    parts = []
    # zip() stops at the shorter sequence, matching the original
    # "counter >= len(data)" guard.
    for index, (meta, raw) in enumerate(zip(records, transcripts)):
        padma_id = meta['hid']
        audio_file = meta['name'] + u'.wav'
        full_text = raw.strip()

        # findRe comes from ox.text; presumably it returns the first captured
        # group (or an empty string) -- verify against the installed version.
        tape_time = findRe(full_text, _TIME_RE)
        outfile = "tapes/%d.html" % (index,)
        title = findRe(full_text, _TITLE_RE)
        print(title)

        parts.append(_INDEX_LINK_TMPL % (outfile, title, tape_time,))
        parts.append(_PADMA_LINK_TMPL % (padma_id,))

        # NOTE(review): in the reviewed copy this assignment sat on a line
        # starting with '#', yet the value is printed and appended right
        # after; it is treated as live code here to avoid a NameError.
        audio_html = _AUDIO_TMPL % (audio_file,)
        print(audio_html)
        parts.append(audio_html)

        with codecs.open(outfile, mode="w", encoding="utf-8") as out:
            out.write(_TAPE_PAGE_TMPL % (audio_file, full_text,))

    _write_index(u''.join(parts))