home · contact · privacy
Bookmaker: more expressive output.
[misc] / bookmaker.py
index ca3548bd702eb8425a001b420da2dc73b877a377..d9bf685c0967a492d941b15e25bcd9af6a720751 100755 (executable)
@@ -4,39 +4,61 @@ import argparse
 import io
 from reportlab.lib.pagesizes import A4
 a4_width, a4_height = A4
+points_per_cm = 10 * 72 / 25.4
+cut_depth = 1.95 * points_per_cm
+cut_width = 1.05 * points_per_cm
+middle_point_depth = 0.4 * points_per_cm
+spine_limit = 1 * points_per_cm
 
 parser = argparse.ArgumentParser(description="build print-ready book PDF")
-parser.add_argument("-i", "--input", dest="input_file", action="append", required=True, help="input PDF file")
-parser.add_argument("-o", "--output", dest="output_file", required=True, help="output PDF file")
-parser.add_argument("-p", "--pages", dest="page_range", action="append", help="page range, e.g., '3-end'")
-parser.add_argument("-c", "--crop", dest="crop_range", help="crops left, bottom, right, top – e.g., '10,10,10,10'")
-parser.add_argument("-n", "--nup4", dest="nup4", action='store_true', help="puts 4 input pages onto 1 output page")
-parser.add_argument("-a", "--analyze", dest="analyze", action="store_true", help="print lines identifying spine, page borders")
-parser.add_argument("-t", "--symmetry", dest="symmetry", action="store_true", help="alternate horizontal crops between odd and even pages")
+parser.add_argument("-i", "--input_file", action="append", required=True, help="input PDF file")
+parser.add_argument("-o", "--output_file", required=True, help="output PDF file")
+parser.add_argument("-p", "--page_range", action="append", help="page range, e.g., '3-end'")
+parser.add_argument("-c", "--crop_range", action="append", help="cm crops left, bottom, right, top – e.g., '10,10,10,10'; prefix with ':'-delimited page range to limit effect")
+parser.add_argument("-s", "--symmetry", action="store_true", help="alternate horizontal crops between odd and even pages")
 parser.add_argument("-r", "--rotate", dest="rotate", type=int, action="append", help="rotate page of number by 90° (usable multiple times on same page!)")
-parser.add_argument("-m", "--margin", type=float, default=4.3, help="print margin (default 4.3)")
+parser.add_argument("-n", "--nup4", action='store_true', help="puts 4 input pages onto 1 output page")
+parser.add_argument("-a", "--analyze", action="store_true", help="in --nup4, print lines identifying spine, page borders")
+parser.add_argument("-m", "--margin", type=float, default=0.43, help="print margin for --nup4 in cm (default 0.43)")
 args = parser.parse_args()
 
 
 # select pages from input files
+def parse_page_range(range_string, pages):
+    start_page = 0
+    end_page = len(pages)
+    if range_string:
+        start, end = range_string.split('-')
+        if not (len(start) == 0 or start == "start"):
+            start_page = int(start) - 1
+        if not (len(end) == 0 or end == "end"):
+            end_page = int(end)
+    return start_page, end_page
 pages_to_add = []
 opened_files = []
+new_page_num = 0
 for i, input_file in enumerate(args.input_file):
     file = open(input_file, 'rb')
     opened_files += [file]
     reader = pypdf.PdfReader(file)
-    start_page = 0
-    end_page = len(reader.pages)
+    range_string = None
     if args.page_range and len(args.page_range) > i:
-        start, end = args.page_range[i].split('-')
-        if not (len(start) == 0 or start == "start"):
-            start_page = int(start) - 1
-        if not (len(end) == 0 or end == "end"):
-            end_page = int(end)
-    for page_num in range(start_page, end_page):
-        page = reader.pages[page_num]
+        range_string = args.page_range[i]
+    start_page, end_page = parse_page_range(range_string, reader.pages)
+    for old_page_num in range(start_page, end_page):
+        new_page_num += 1
+        page = reader.pages[old_page_num]
         pages_to_add += [page]
-        print("read in %s page number %d" % (input_file, page_num+1))
+        print("-i, -p: read in %s page number %d as new page %d" % (input_file, old_page_num+1, new_page_num))
+
+# if necessary, pad pages to multiple of 8
+if args.nup4:
+    mod_to_8 = len(pages_to_add) % 8
+    if mod_to_8 > 0:
+        print("-n: number of input pages %d not multiple of 8, padding to that" % len(pages_to_add))
+        for _ in range(8 - mod_to_8):
+            new_page = pypdf.PageObject.create_blank_page(width=a4_width, height=a4_height)
+            pages_to_add += [new_page]
 
 # rotate page canvas
 if args.rotate:
@@ -45,6 +67,7 @@ if args.rotate:
         page.add_transformation(pypdf.Transformation().translate(tx=-a4_width/2, ty=-a4_height/2))
         page.add_transformation(pypdf.Transformation().rotate(-90))
         page.add_transformation(pypdf.Transformation().translate(tx=a4_width/2, ty=a4_height/2))
+        print("-r: rotating (by 90°) page", rotate)
 
 # normalize all pages to portrait A4
 for page in pages_to_add:
@@ -56,56 +79,83 @@ for page in pages_to_add:
     page.mediabox.right = a4_width
     page.cropbox = page.mediabox
 
-# determine page crop
-crop_left, crop_bottom, crop_right, crop_top = 0, 0, 0, 0
-if args.crop_range:
-    crop_left, crop_bottom, crop_right, crop_top = [float(x) for x in  args.crop_range.split(',')]
-cropped_width  = a4_width - crop_left - crop_right
-cropped_height = a4_height - crop_bottom - crop_top
-zoom = 1
+# determine page crops, zooms, crop symmetry
+crops_at_page = [(0,0,0,0)]*len(pages_to_add)
+zoom_at_page = [1]*len(pages_to_add)
 if args.crop_range:
-    zoom_horizontal = a4_width / (a4_width - crop_left - crop_right)
-    zoom_vertical = a4_height / (a4_height - crop_bottom - crop_top)
-    if (zoom_horizontal > 1 and zoom_vertical < 1) or (zoom_horizontal < 1 and zoom_vertical > 1):
-        print("Error: opposing zooms.")
-        exit(1)
-    elif zoom_horizontal + zoom_vertical > 2:
-        zoom = min(zoom_horizontal, zoom_vertical)
-    else:
-        zoom = max(zoom_horizontal, zoom_vertical)
+  for crop_range in args.crop_range:
+      initial_split = crop_range.split(':')
+      if len(initial_split) > 1:
+          page_range = initial_split[0]
+          crops = initial_split[1]
+      else:
+          page_range = None
+          crops = initial_split[0]
+      start_page, end_page = parse_page_range(page_range, pages_to_add)
+      crop_left_cm, crop_bottom_cm, crop_right_cm, crop_top_cm = [float(x) for x in  crops.split(',')]
+      crop_left = crop_left_cm * points_per_cm
+      crop_bottom = crop_bottom_cm * points_per_cm
+      crop_right = crop_right_cm * points_per_cm
+      crop_top = crop_top_cm * points_per_cm
+      if args.symmetry:
+          print("-c, -t: to pages %d to %d applying crops: left %.2fcm, bottom %.2fcm, right %.2fcm, top %.2fcm (but alternating left and right crop between even and odd pages)" % (start_page + 1, end_page, crop_left_cm, crop_bottom_cm, crop_right_cm, crop_top_cm))
+      else:
+          print("-c: to pages %d to %d applying crops: left %.2fcm, bottom %.2fcm, right %.2fcm, top %.2fcm" % (start_page + 1, end_page, crop_left_cm, crop_bottom_cm, crop_right_cm, crop_top_cm))
+      cropped_width  = a4_width - crop_left - crop_right
+      cropped_height = a4_height - crop_bottom - crop_top
+      zoom = 1
+      zoom_horizontal = a4_width / (a4_width - crop_left - crop_right)
+      zoom_vertical = a4_height / (a4_height - crop_bottom - crop_top)
+      if (zoom_horizontal > 1 and zoom_vertical < 1) or (zoom_horizontal < 1 and zoom_vertical > 1):
+          print("Error: opposing zooms.")
+          exit(1)
+      elif zoom_horizontal + zoom_vertical > 2:
+          zoom = min(zoom_horizontal, zoom_vertical)
+      else:
+          zoom = max(zoom_horizontal, zoom_vertical)
+      for page_num in range(start_page, end_page):
+          if args.symmetry and page_num % 2:
+              crops_at_page[page_num] = (crop_right, crop_bottom, crop_left, crop_top)
+          else:
+              crops_at_page[page_num] = (crop_left, crop_bottom, crop_right, crop_top)
+          zoom_at_page[page_num] = zoom
 
 writer = pypdf.PdfWriter()
 if not args.nup4:
+    # single-page output
+    print("building 1-input-page-per-output-page book")
     odd_page = True
-    for page in pages_to_add:
-        if args.symmetry and odd_page:
-            page.add_transformation(pypdf.Transformation().translate(tx=-crop_right, ty=-crop_bottom))
-        else:
-            page.add_transformation(pypdf.Transformation().translate(tx=-crop_left, ty=-crop_bottom))
+    for i, page in enumerate(pages_to_add):
+        crop_left, crop_bottom, crop_right, crop_top = crops_at_page[i]
+        zoom = zoom_at_page[i]
+        page.add_transformation(pypdf.Transformation().translate(tx=-crop_left, ty=-crop_bottom))
         page.add_transformation(pypdf.Transformation().scale(zoom, zoom))
+        cropped_width  = a4_width - crop_left - crop_right
+        cropped_height = a4_height - crop_bottom - crop_top
         page.mediabox.right = cropped_width * zoom
         page.mediabox.top = cropped_height * zoom
         writer.add_page(page)
         odd_page = not odd_page
+        print("built page number %d (of %d)" % (i+1, len(pages_to_add)))
+
 else:
+    print("-n: building 4-input-pages-per-output-page book")
+    print("-m: applying printable-area margin of %.2fcm" % args.margin)
+    if args.analyze:
+        print("-a: drawing page borders, spine limits")
     n_pages_per_axis = 2
-    points_per_mm = 2.83465
-    printable_margin = args.margin * points_per_mm
+    printable_margin = args.margin * points_per_cm
     printable_scale = (a4_width - 2*printable_margin)/a4_width
-    spine_limit = 10 * points_per_mm
     half_width = a4_width / n_pages_per_axis
     half_height = a4_height / n_pages_per_axis
     section_scale_factor = 1 / n_pages_per_axis
     spine_part_of_page = (spine_limit / half_width) / printable_scale
     bonus_shrink_factor = 1 - spine_part_of_page
     new_page_order = []
+    new_i_order = []
     eight_pack = []
-    mod_to_8 = len(pages_to_add) % 8
-    if mod_to_8 > 0:
-        for _ in range(8 - mod_to_8):
-            new_page = pypdf.PageObject.create_blank_page(width=a4_width, height=a4_height)
-            pages_to_add += [new_page]
     i = 0
+    n_eights = 0
     for page in pages_to_add:
         if i == 0:
             eight_pack = []
@@ -113,6 +163,15 @@ else:
         i += 1
         if i == 8:
             i = 0
+            new_i_order += [8 * n_eights + 3,
+                            8 * n_eights + 0,
+                            8 * n_eights + 7,
+                            8 * n_eights + 4,
+                            8 * n_eights + 1,
+                            8 * n_eights + 2,
+                            8 * n_eights + 5,
+                            8 * n_eights + 6]
+            n_eights += 1
             new_page_order += [eight_pack[3]]  # page front, upper left
             new_page_order += [eight_pack[0]]  # page front, upper right
             new_page_order += [eight_pack[7]]  # page front, lower left
@@ -124,22 +183,19 @@ else:
     i = 0
     page_count = 0
     front_page = True
-    for page in new_page_order:
+    for j, page in enumerate(new_page_order):
         if i == 0:
             new_page = pypdf.PageObject.create_blank_page(width=a4_width, height=a4_height)
 
         # in-section transformations: align pages on top, left-hand pages to left, right-hand to right
+        new_i = new_i_order[j]
+        crop_left, crop_bottom, crop_right, crop_top = crops_at_page[new_i]
+        zoom = zoom_at_page[new_i]
         page.add_transformation(pypdf.Transformation().translate(ty=(a4_height / zoom - (a4_height - crop_top))))
         if i == 0 or i == 2:
-            if args.symmetry:
-                page.add_transformation(pypdf.Transformation().translate(tx=-crop_left))
-            else:
-                page.add_transformation(pypdf.Transformation().translate(tx=-crop_right))
+            page.add_transformation(pypdf.Transformation().translate(tx=-crop_left))
         elif i == 1 or i == 3:
-            if args.symmetry:
-                page.add_transformation(pypdf.Transformation().translate(tx=(a4_width / zoom - (a4_width - crop_left))))
-            else:
-                page.add_transformation(pypdf.Transformation().translate(tx=(a4_width / zoom - (a4_width - crop_right))))
+            page.add_transformation(pypdf.Transformation().translate(tx=(a4_width / zoom - (a4_width - crop_right))))
         page.add_transformation(pypdf.Transformation().scale(zoom * bonus_shrink_factor, zoom * bonus_shrink_factor))
         if i == 2 or i == 3:
             page.add_transformation(pypdf.Transformation().translate(ty=-2*printable_margin/printable_scale))
@@ -167,7 +223,7 @@ else:
         page.add_transformation(pypdf.Transformation().scale(section_scale_factor, section_scale_factor))
         new_page.merge_page(page)
         page_count += 1
-        print("merged page number", page_count)
+        print("merged page number %d (of %d)" % (page_count, len(pages_to_add)))
         i += 1
         if i > 3:
             from reportlab.pdfgen import canvas
@@ -201,9 +257,6 @@ else:
                 c.line(x_right_spine_limit, a4_height, x_right_spine_limit, 0)
             if front_page:
                 c.setLineWidth(0.2)
-                cut_depth = 19.5 * points_per_mm
-                cut_width = 10.5 * points_per_mm
-                middle_point_depth = 4 * points_per_mm
 
                 start_up_left_left_x = x_left_spine_limit - 0.5 * cut_width
                 start_up_left_right_x = x_left_spine_limit + 0.5 * cut_width
@@ -228,8 +281,9 @@ else:
             writer.add_page(new_page)
             i = 0
             front_page = not front_page
+
+# write and close
 for file in opened_files:
     file.close()
-
 with open(args.output_file, 'wb') as output_file:
     writer.write(output_file)