-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathbook.py
105 lines (76 loc) · 3.28 KB
/
book.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
import math # ceil
import collections # deque
import sys # argv
import PyPDF2
import io # StringIO
import argparse
def page_order(n_pages, section_size):
"""Compute page order for booklet printing."""
n_sections = math.ceil(n_pages / (section_size * 4))
pages = list(range(1, 1 + n_sections * section_size * 4))
out_order = []
for _ in range(n_sections):
section_order = []
section_pages, pages = collections.deque(pages[:section_size*4]), pages[section_size*4:]
for _ in range(section_size):
outside_left = section_pages.pop()
outside_right = section_pages.popleft()
inside_left = section_pages.popleft()
inside_right = section_pages.pop()
section_order = [inside_left, inside_right, outside_left, outside_right] + section_order
out_order += section_order
return out_order
def apply_padding(in_file, out_file, pad_to_length):
"""Pad PDF file to specified length with empty pages."""
writer = PyPDF2.PdfFileWriter()
reader = PyPDF2.PdfFileReader(in_file)
in_page_count = reader.getNumPages()
writer.appendPagesFromReader(reader)
for _ in range(pad_to_length - in_page_count):
writer.addBlankPage()
writer.write(out_file)
def reorder_pages(in_file, out_file, page_order):
"""Permute pages of in_file to out_file according to page_order."""
writer = PyPDF2.PdfFileWriter()
reader = PyPDF2.PdfFileReader(in_file)
n_leaves = reader.getNumPages()
assert n_leaves == len(page_order)
for i in page_order:
writer.addPage(reader.getPage(i-1))
writer.write(out_file)
def merge_sheets(in_file, out_file):
"""Merge page pairs into sheets for printing."""
writer = PyPDF2.PdfFileWriter()
reader = PyPDF2.PdfFileReader(in_file)
n_leaves = reader.getNumPages()
assert n_leaves % 2 == 0
for i in range(n_leaves // 2):
i_left = i*2
i_right = i*2 + 1
left_page = reader.getPage(i_left)
right_page = reader.getPage(i_right)
w = left_page.mediaBox.getWidth()
left_page.mergeTranslatedPage(right_page, w, 0, expand=True)
writer.addPage(left_page)
writer.write(out_file)
if __name__ == "__main__":
parser = argparse.ArgumentParser(description="A tool for reordering and merging pages for book(let) binding.")
parser.add_argument("infile", type=argparse.FileType('rb'),
help="Input document")
parser.add_argument("outfile", type=argparse.FileType('wb'),
help="Filepath for booklet-format output")
parser.add_argument("-s", "--section-size", type=int, default=4,
help="Sheets per bound section. Each sheet holds four pages of the input document, two front and two back.\
(e.g. with portraint A4-size input, sheets are landscape A3-size)")
args = parser.parse_args()
infile = args.infile
outfile = args.outfile
section_size = args.section_size
reader = PyPDF2.PdfFileReader(infile)
n_content_pages = reader.getNumPages()
order = page_order(n_content_pages, section_size)
padded_stream = io.BytesIO()
ordered_stream = io.BytesIO()
apply_padding(infile, padded_stream, len(order))
reorder_pages(padded_stream, ordered_stream, order)
merge_sheets(ordered_stream, outfile)