aboutsummaryrefslogtreecommitdiffstats
path: root/web/utils.py
blob: 583cd1cf7559f1099924a5640eabe2f2eba7e8f8 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
from parsedjvutext import parse_book
import sys


def gen_html(book, page_number):
    """Return the indexed coordinate strings and words for one page of a book.

    Args:
        book: Book file handed straight to ``parse_book``. A falsy value
            (``None`` or ``""``) falls back to the sample DjVu file that this
            function used to hard-code, so existing callers that relied on
            that default keep working.
        page_number: Page to parse. Converted with ``int()``, so a numeric
            string (e.g. a command-line argument) is accepted.

    Returns:
        A 2-tuple ``(areas, words)`` where ``areas`` is a list of
        ``(index, "c0,c1,...")`` pairs (each coordinate entry joined with
        commas) and ``words`` is a list of ``(index, word)`` pairs.

    Raises:
        ValueError, TypeError: If ``page_number`` cannot be converted by
            ``int()``.
    """
    # Previously the argument was overwritten unconditionally with this path,
    # which made the ``book`` parameter dead; keep it only as a fallback.
    default_book = "../Villiers_de_L'Isle-Adam_-_Tribulat_Bonhomet,_1908.djvu"
    book = book or default_book

    parsed = parse_book(book, page=int(page_number), html=True)
    # Only the first entry of each result list is used -- presumably the
    # single requested page; confirm against parse_book.
    coords, words = parsed["coords"][0], parsed["words"][0]

    areas = [
        (index, ",".join(map(str, coord)))
        for index, coord in enumerate(coords)
    ]
    return areas, list(enumerate(words))

if __name__ == "__main__":
    # Command-line entry: forward up to two positional arguments
    # (book, page number) to gen_html. The result is discarded, so this
    # only exercises the parsing path.
    cli_args = sys.argv[1:3]
    gen_html(*cli_args)