blob: 583cd1cf7559f1099924a5640eabe2f2eba7e8f8 (
plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
|
from parsedjvutext import parse_book
import sys
def gen_html(book, page_number):
    """Return the indexed word areas and words for one page of a DjVu book.

    Args:
        book: Path of the DjVu file handed to ``parse_book``. When it is
            falsy (``None`` or an empty string) the default book path
            below is used instead.
        page_number: Page to parse. It is converted with ``int()``, so a
            numeric string (e.g. a command-line argument) is accepted.

    Returns:
        A pair ``(areas, indexed_words)``. ``areas`` is a list of
        ``(index, "v0,v1,...")`` tuples, one per item of the first
        ``"coords"`` entry returned by ``parse_book``, with the item's
        values stringified and joined by commas. ``indexed_words`` is a
        list of ``(index, word)`` tuples built from the first ``"words"``
        entry.

    Raises:
        ValueError: If ``page_number`` cannot be converted by ``int()``.
    """
    # The previous version overwrote ``book`` unconditionally, so the
    # caller's argument was ignored. The hard-coded path is now only a
    # fallback for callers that pass no usable path.
    if not book:
        book = "../Villiers_de_L\'Isle-Adam_-_Tribulat_Bonhomet,_1908.djvu"

    parsed = parse_book(book, page=int(page_number), html=True)

    # Only the first entry of each list is used.
    # NOTE(review): presumably parse_book returns one entry per requested
    # page and a single page is requested here -- confirm against
    # parsedjvutext.
    coords, words = parsed["coords"][0], parsed["words"][0]

    areas = [
        (index, ",".join(map(str, coord)))
        for index, coord in enumerate(coords)
    ]
    return areas, list(enumerate(words))
if __name__ == "__main__":
    # Forward up to the first two command-line arguments positionally as
    # gen_html's ``book`` and ``page_number``; the returned value is
    # discarded.
    cli_args = sys.argv[1:3]
    gen_html(*cli_args)
|