home · contact · privacy
To Bookmaker, add margin definition.
[misc] / bookmaker.py
#!/usr/bin/env python3
"""Build a print-ready book PDF from one (optionally two) input PDFs.

Two output modes exist:

* default: every selected input page becomes one output page, optionally
  cropped and zoomed back up to fill the page;
* ``--nup4``: four input pages are placed onto each A4 output page.  Pages
  are reordered in groups of eight (front and back of one sheet) and the
  input is padded with blank pages up to a multiple of eight.

All pages are first normalized to an A4 media box with any ``/Rotate`` entry
undone.
"""
import argparse
import contextlib
import io

import pypdf
from reportlab.lib.pagesizes import A4
from reportlab.pdfgen import canvas

a4_width, a4_height = A4

parser = argparse.ArgumentParser(description="build print-ready book PDF")
parser.add_argument("-i", "--input", dest="input_file", required=True, help="input PDF file")
parser.add_argument("-o", "--output", dest="output_file", required=True, help="output PDF file")
parser.add_argument("-p", "--pages", dest="page_range", help="page range, e.g., '3-end'")
parser.add_argument("-c", "--crop", dest="crop_range", help="crops left, bottom, right, top – e.g., '10,10,10,10'")
parser.add_argument("-n", "--nup4", dest="nup4", action='store_true', help="puts 4 input pages onto 1 output page")
parser.add_argument("-a", "--analyze", dest="analyze", action="store_true", help="print lines identifying spine, page borders")
parser.add_argument("-t", "--symmetry", dest="symmetry", action="store_true", help="alternate horizontal crops between odd and even pages")
parser.add_argument("-s", "--second", dest="second", help="append second file as input to append")
parser.add_argument("-r", "--rotate", dest="rotate", help="rotate page of number by 90°")
# the margin is multiplied by points_per_mm below, i.e. it is given in millimetres
parser.add_argument("-m", "--margin", type=float, default=4.3, help="print margin (default 4.3)")
args = parser.parse_args()

# Both input files have to stay open until the writer has written the output,
# so they are registered on one ExitStack that closes them on every exit path
# (including exceptions).
with contextlib.ExitStack() as open_files:
    file = open_files.enter_context(open(args.input_file, 'rb'))
    reader = pypdf.PdfReader(file)

    # determine page range (1-based and inclusive on the command line)
    start_page = 0
    end_page = len(reader.pages)
    if args.page_range:
        start, dash, end = args.page_range.partition('-')
        if not dash:
            # a bare number such as '5' selects exactly that page
            end = start
        if not (len(start) == 0 or start == "start"):
            start_page = int(start) - 1
        if not (len(end) == 0 or end == "end"):
            end_page = int(end)
        # a negative start index would silently wrap around to the last page
        if start_page < 0 or end_page > len(reader.pages):
            parser.error(f"page range '{args.page_range}' is outside 1-{len(reader.pages)}")
    pages_to_add = []
    for page_num in range(start_page, end_page):
        pages_to_add.append(reader.pages[page_num])
        print("read in page number", page_num+1)

    # add pages of second PDF
    if args.second:
        file2 = open_files.enter_context(open(args.second, 'rb'))
        reader2 = pypdf.PdfReader(file2)
        for page_num, page in enumerate(reader2.pages, start=1):
            pages_to_add.append(page)
            print("read second PDF's page number", page_num)

    # rotate page canvas: move the A4 centre to the origin, rotate, move back
    if args.rotate:
        page = pages_to_add[int(args.rotate) - 1]
        page.add_transformation(pypdf.Transformation().translate(tx=-a4_width/2, ty=-a4_height/2))
        page.add_transformation(pypdf.Transformation().rotate(-90))
        page.add_transformation(pypdf.Transformation().translate(tx=a4_width/2, ty=a4_height/2))

    # normalize all pages to portrait A4
    for page in pages_to_add:
        if "/Rotate" in page:
            # add the complementary angle so the stored rotation is cancelled
            page.rotate(360 - page["/Rotate"])
        page.mediabox.left = 0
        page.mediabox.bottom = 0
        page.mediabox.top = a4_height
        page.mediabox.right = a4_width
        page.cropbox = page.mediabox

    # determine page crop
    crop_left, crop_bottom, crop_right, crop_top = 0, 0, 0, 0
    if args.crop_range:
        crop_left, crop_bottom, crop_right, crop_top = [float(x) for x in args.crop_range.split(',')]
    cropped_width = a4_width - crop_left - crop_right
    cropped_height = a4_height - crop_bottom - crop_top
    zoom = 1
    if args.crop_range:
        zoom_horizontal = a4_width / (a4_width - crop_left - crop_right)
        zoom_vertical = a4_height / (a4_height - crop_bottom - crop_top)
        if (zoom_horizontal > 1 and zoom_vertical < 1) or (zoom_horizontal < 1 and zoom_vertical > 1):
            print("Error: opposing zooms.")
            # SystemExit instead of the site-provided exit() helper, which is
            # not guaranteed to be available
            raise SystemExit(1)
        elif zoom_horizontal + zoom_vertical > 2:
            # enlarging: take the smaller factor of the two axes
            zoom = min(zoom_horizontal, zoom_vertical)
        else:
            # shrinking: take the larger factor of the two axes
            zoom = max(zoom_horizontal, zoom_vertical)

    writer = pypdf.PdfWriter()
    if not args.nup4:
        for index, page in enumerate(pages_to_add):
            odd_page = index % 2 == 0  # first page counts as odd
            if args.symmetry and odd_page:
                page.add_transformation(pypdf.Transformation().translate(tx=-crop_right, ty=-crop_bottom))
            else:
                page.add_transformation(pypdf.Transformation().translate(tx=-crop_left, ty=-crop_bottom))
            page.add_transformation(pypdf.Transformation().scale(zoom, zoom))
            page.mediabox.right = cropped_width * zoom
            page.mediabox.top = cropped_height * zoom
            writer.add_page(page)
    else:
        n_pages_per_axis = 2
        points_per_mm = 2.83465
        printable_margin = args.margin * points_per_mm
        printable_scale = (a4_width - 2*printable_margin)/a4_width
        spine_limit = 10 * points_per_mm
        half_width = a4_width / n_pages_per_axis
        half_height = a4_height / n_pages_per_axis
        section_scale_factor = 1 / n_pages_per_axis
        spine_part_of_page = (spine_limit / half_width) / printable_scale
        bonus_shrink_factor = 1 - spine_part_of_page

        # pad with blank pages so the input splits evenly into groups of eight
        mod_to_8 = len(pages_to_add) % 8
        if mod_to_8 > 0:
            for _ in range(8 - mod_to_8):
                pages_to_add.append(pypdf.PageObject.create_blank_page(width=a4_width, height=a4_height))

        # reorder every group of eight input pages into sheet order
        imposition_order = (
            3,  # page front, upper left
            0,  # page front, upper right
            7,  # page front, lower left
            4,  # page front, lower right
            1,  # page back, upper left
            2,  # page back, upper right
            5,  # page back, lower left
            6,  # page back, lower right
        )
        new_page_order = []
        for base in range(0, len(pages_to_add), 8):
            eight_pack = pages_to_add[base:base + 8]
            new_page_order.extend(eight_pack[k] for k in imposition_order)

        front_page = True
        for page_count, page in enumerate(new_page_order, start=1):
            # slot on the output page: 0 upper left, 1 upper right, 2 lower left, 3 lower right
            slot = (page_count - 1) % 4
            is_left = slot in (0, 2)
            is_upper = slot in (0, 1)
            if slot == 0:
                new_page = pypdf.PageObject.create_blank_page(width=a4_width, height=a4_height)

            # in-section transformations: align pages on top, left-hand pages to left, right-hand to right
            page.add_transformation(pypdf.Transformation().translate(ty=(a4_height / zoom - (a4_height - crop_top))))
            # NOTE(review): without --symmetry both columns use crop_right and
            # crop_left only enters via zoom -- confirm this is intended.
            if is_left:
                if args.symmetry:
                    page.add_transformation(pypdf.Transformation().translate(tx=-crop_left))
                else:
                    page.add_transformation(pypdf.Transformation().translate(tx=-crop_right))
            else:
                if args.symmetry:
                    page.add_transformation(pypdf.Transformation().translate(tx=(a4_width / zoom - (a4_width - crop_left))))
                else:
                    page.add_transformation(pypdf.Transformation().translate(tx=(a4_width / zoom - (a4_width - crop_right))))
            page.add_transformation(pypdf.Transformation().scale(zoom * bonus_shrink_factor, zoom * bonus_shrink_factor))
            if not is_upper:
                page.add_transformation(pypdf.Transformation().translate(ty=-2*printable_margin/printable_scale))

            # outer section transformations
            page.add_transformation(pypdf.Transformation().translate(ty=(1-bonus_shrink_factor)*a4_height))
            if is_upper:
                y_section = a4_height
                page.mediabox.bottom = half_height
                page.mediabox.top = a4_height
            else:
                y_section = 0
                page.mediabox.bottom = 0
                page.mediabox.top = half_height
            if is_left:
                x_section = 0
                page.mediabox.left = 0
                page.mediabox.right = half_width
            else:
                page.add_transformation(pypdf.Transformation().translate(tx=(1-bonus_shrink_factor)*a4_width))
                x_section = a4_width
                page.mediabox.left = half_width
                page.mediabox.right = a4_width
            page.add_transformation(pypdf.Transformation().translate(tx=x_section, ty=y_section))
            page.add_transformation(pypdf.Transformation().scale(section_scale_factor, section_scale_factor))
            new_page.merge_page(page)
            print("merged page number", page_count)

            if slot < 3:
                continue

            # all four slots are filled: finish this output page
            if args.analyze:
                # borders
                packet = io.BytesIO()
                c = canvas.Canvas(packet, pagesize=A4)
                c.setLineWidth(0.1)
                c.line(0, a4_height, a4_width, a4_height)
                c.line(0, half_height, a4_width, half_height)
                c.line(0, 0, a4_width, 0)
                c.line(0, a4_height, 0, 0)
                c.line(half_width, a4_height, half_width, 0)
                c.line(a4_width, a4_height, a4_width, 0)
                c.save()
                new_pdf = pypdf.PdfReader(packet)
                new_page.merge_page(new_pdf.pages[0])

            # shrink the assembled page and shift it by the print margin
            printable_offset_x = printable_margin
            printable_offset_y = printable_margin * a4_height / a4_width
            new_page.add_transformation(pypdf.Transformation().scale(printable_scale, printable_scale))
            new_page.add_transformation(pypdf.Transformation().translate(tx=printable_offset_x, ty=printable_offset_y))

            x_left_spine_limit = half_width * bonus_shrink_factor
            x_right_spine_limit = a4_width - x_left_spine_limit
            # this overlay is merged after the scaling above, so it is drawn
            # in unscaled A4 coordinates
            if args.analyze or front_page:
                packet = io.BytesIO()
                c = canvas.Canvas(packet, pagesize=A4)
                if args.analyze:
                    # spine lines
                    c.setLineWidth(0.1)
                    c.line(x_left_spine_limit, a4_height, x_left_spine_limit, 0)
                    c.line(x_right_spine_limit, a4_height, x_right_spine_limit, 0)
                if front_page:
                    # marks on front pages only: one above the horizontal
                    # middle at the left spine limit, one below it at the right
                    c.setLineWidth(0.2)
                    cut_depth = 19.5 * points_per_mm
                    cut_width = 10.5 * points_per_mm
                    middle_point_depth = 4 * points_per_mm

                    start_up_left_left_x = x_left_spine_limit - 0.5 * cut_width
                    start_up_left_right_x = x_left_spine_limit + 0.5 * cut_width
                    middle_point_up_left_y = half_height + middle_point_depth
                    end_point_up_left_y = half_height + cut_depth
                    c.line(start_up_left_right_x, half_height, x_left_spine_limit, end_point_up_left_y)
                    c.line(x_left_spine_limit, end_point_up_left_y, x_left_spine_limit, middle_point_up_left_y)
                    c.line(x_left_spine_limit, middle_point_up_left_y, start_up_left_left_x, half_height)

                    start_down_right_left_x = x_right_spine_limit - 0.5 * cut_width
                    start_down_right_right_x = x_right_spine_limit + 0.5 * cut_width
                    middle_point_down_right_y = half_height - middle_point_depth
                    end_point_down_right_y = half_height - cut_depth
                    c.line(start_down_right_left_x, half_height, x_right_spine_limit, end_point_down_right_y)
                    c.line(x_right_spine_limit, end_point_down_right_y, x_right_spine_limit, middle_point_down_right_y)
                    c.line(x_right_spine_limit, middle_point_down_right_y, start_down_right_right_x, half_height)

                c.save()
                new_pdf = pypdf.PdfReader(packet)
                new_page.merge_page(new_pdf.pages[0])
            writer.add_page(new_page)
            front_page = not front_page

    with open(args.output_file, 'wb') as output_file:
        writer.write(output_file)