aboutsummaryrefslogtreecommitdiffstats
path: root/web/utils.py
blob: e6f43096495cf31d7c5e25ca729a80d9db5b8565 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
import djvu_utils as du
import sys
import string_utils as su
from wikisource import get_page2


def gen_html(book, page_number):
    doc = du.get_document("../" + book)
    page = doc.pages[int(page_number) - 1]
    d = du.parse_page(page)
    elem, corrected_text = get_page2(open("test.txt").read())
    if d:
        orig_words, orig_coords = zip(*d)
        C = su.align(corrected_words, list(orig_words), list(orig_coords))
        corr_words = corrected_text.split()
        orig_coords_html = du.convert_to_htmlcoord(orig_coords, page.size[1])
    return orig_coords_html, orig_words, corr_words, C[1]

if __name__ == "__main__":
    gen_html(*sys.argv[1:3])