-
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathexample.py
58 lines (46 loc) · 1.83 KB
/
example.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
import os
import sys
from time import time
start_time = time()
from ztml import validation, ztml
# Example configuration: three parallel lists with one entry per book.
books = [30123, 2600]  # IDs handed to gutenbergpy's get_text_by_id
book_mtf = [0, 80]  # per-book `mtf` argument forwarded to ztml.ztml
book_ect = [False, True]  # per-book `ect` argument forwarded to ztml.ztml
output_folder = 'output'
skip_download_exists = True  # when True, an existing raw file is reused instead of re-downloaded
element_id = ''  # forwarded to ztml.ztml and validate_files; when empty, `by` below becomes ''

# The three lists are zipped below, so they must have the same length.
assert len(books) == len(book_mtf) == len(book_ect)

# Loop-invariant, so create the output folder once rather than once per book.
os.makedirs(output_folder, exist_ok=True)

error = False
for item, mtf, ect in zip(books, book_mtf, book_ect):
    item_start_time = time()

    # Output name per artifact. The part of each key before the last '_' is
    # passed to ztml.ztml as `bin2txt`; the commented-out entries are the
    # optional .js variants of the same encodings.
    filenames = dict(raw=f'{item}.txt',
                     # base64_js=f'{item}_64.js',
                     base64_html=f'{item}_64.html',
                     # base125_js=f'{item}_125.js',
                     base125_html=f'{item}_125.html',
                     # crenc_js=f'{item}_cr.js',
                     crenc_html=f'{item}_cr.html')
    filenames = {k: os.path.join(output_folder, v) for k, v in filenames.items()}

    # If missing, download an example file from the web
    if not skip_download_exists or not os.path.exists(filenames['raw']):
        # Imported lazily so gutenbergpy is only required when a download is needed.
        from gutenbergpy.textget import get_text_by_id
        with open(filenames['raw'], 'wb') as f:
            f.write(get_text_by_id(item))

    with open(filenames['raw'], 'rb') as f:
        data = f.read()

    # Run every configured encoding on the raw bytes; 'raw' is the input, not an output.
    cnt = 0
    for label, filename in filenames.items():
        if label == 'raw':
            continue
        ztml.ztml(data, filename, mtf=mtf, ect=ect, bin2txt=label.rsplit('_', 1)[0], element_id=element_id)
        cnt += 1
    print(f'{cnt} encodings of {item} took {(time()-item_start_time) / 60 :.1f} min.')

    # Compare file sizes and validate data is recovered
    # NOTE(review): a truthy return is treated as failure here; the message
    # below suggests it signals a rendering timeout - confirm against validation.
    error |= validation.validate_files(filenames, by='id' * bool(element_id), element=element_id)
    print()

if error:
    print('Error: some renderings timed out')
else:
    print(f'Total of {len(books)} books took {(time()-start_time) / 60 :.1f} min.')

# Exit status is 1 when any validation reported an error, 0 otherwise.
sys.exit(int(error))