2023-11-15 18:26:43 +01:00
|
|
|
open Pdfutil
|
|
|
|
open Cpdferror
|
|
|
|
|
2023-11-20 11:53:51 +01:00
|
|
|
(* Chop a single page into pieces. We prefer the cropbox when available. We set
|
2023-11-28 17:40:50 +01:00
|
|
|
mediabox only, and delete any other boxes. We delete /Annots, since
|
|
|
|
duplicate annotations are not allowed. *)
|
2023-11-29 12:11:09 +01:00
|
|
|
|
2023-11-20 15:12:33 +01:00
|
|
|
let get_box pdf page =
|
|
|
|
match Pdf.lookup_direct pdf "/CropBox" page.Pdfpage.rest with
|
|
|
|
| Some r -> Pdf.parse_rectangle pdf r
|
|
|
|
| None -> Pdf.parse_rectangle pdf page.Pdfpage.mediabox
|
|
|
|
|
|
|
|
let erase_boxes d =
|
|
|
|
let f = Pdf.remove_dict_entry in
|
2023-11-28 17:40:50 +01:00
|
|
|
f (f (f (f (f d "/CropBox") "/BleedBox") "/TrimBox") "/ArtBox") "/Annots"
|
|
|
|
|
|
|
|
let make_pages x y columns btt rtl w h ps move_page =
|
2023-11-29 12:11:09 +01:00
|
|
|
if columns then
|
|
|
|
let column tx =
|
|
|
|
if btt then
|
|
|
|
for ty = 0 to y - 1 do ps =| move_page (w *. float_of_int tx) (h *. float_of_int ty) done
|
|
|
|
else
|
|
|
|
for ty = y - 1 downto 0 do ps =| move_page (w *. float_of_int tx) (h *. float_of_int ty) done
|
|
|
|
in
|
|
|
|
if rtl then for tx = x - 1 downto 0 do column tx done else for tx = 0 to x - 1 do column tx done
|
|
|
|
else
|
|
|
|
let row ty =
|
|
|
|
if rtl then
|
|
|
|
for tx = x - 1 downto 0 do ps =| move_page (w *. float_of_int tx) (h *. float_of_int ty) done
|
|
|
|
else
|
|
|
|
for tx = 0 to x - 1 do ps =| move_page (w *. float_of_int tx) (h *. float_of_int ty) done
|
|
|
|
in
|
|
|
|
if btt then for ty = 0 to y - 1 do row ty done else for ty = y - 1 downto 0 do row ty done
|
2023-11-20 15:12:33 +01:00
|
|
|
|
2024-02-05 15:38:05 +01:00
|
|
|
let chop_boxes line pdf x y columns btt rtl p =
|
|
|
|
let move_page mx my p w h dx dy =
|
|
|
|
let nminx, nminy, nmaxx, nmaxy = (mx +. dx, my +. dy, mx +. w +. dx, my +. h +. dy) in
|
|
|
|
{p with
|
|
|
|
Pdfpage.mediabox = Pdf.Array [Pdf.Real nminx; Pdf.Real nminy; Pdf.Real nmaxx; Pdf.Real nmaxy];
|
|
|
|
Pdfpage.rest = erase_boxes p.Pdfpage.rest}
|
|
|
|
in
|
|
|
|
if x = 0 then
|
|
|
|
(* horizontal split at line *)
|
|
|
|
[]
|
|
|
|
else
|
|
|
|
if y = 0 then
|
|
|
|
(* vertical split at line *)
|
|
|
|
[]
|
|
|
|
else
|
|
|
|
let minx, miny, maxx, maxy = get_box pdf p in
|
|
|
|
let w, h = (maxx -. minx) /. float_of_int x, (maxy -. miny) /. float_of_int y in
|
|
|
|
let ps = ref [] in
|
|
|
|
make_pages x y columns btt rtl w h ps (move_page minx miny p w h);
|
|
|
|
rev !ps
|
2023-11-20 11:53:51 +01:00
|
|
|
|
2024-02-05 15:38:05 +01:00
|
|
|
let chop_inner ~line ~x ~y ~columns ~btt ~rtl pdf range =
|
2023-11-20 11:53:51 +01:00
|
|
|
let pages = Pdfpage.pages_of_pagetree pdf in
|
2023-11-28 17:14:07 +01:00
|
|
|
let pages_out =
|
2023-11-20 11:53:51 +01:00
|
|
|
flatten
|
|
|
|
(map2
|
2024-02-05 15:38:05 +01:00
|
|
|
(fun n p -> if mem n range then chop_boxes line pdf x y columns btt rtl p else [p])
|
2023-11-20 11:53:51 +01:00
|
|
|
(ilist 1 (Pdfpage.endpage pdf))
|
|
|
|
pages)
|
|
|
|
in
|
2023-11-28 17:14:07 +01:00
|
|
|
let changes =
|
|
|
|
let q = ref 0 in
|
|
|
|
flatten
|
|
|
|
(map2
|
|
|
|
(fun n p ->
|
|
|
|
if mem n range
|
|
|
|
then (q += 1; let r = combine (many n (x * y)) (ilist !q (!q + x * y - 1)) in q += (x * y - 1); r)
|
|
|
|
else (q += 1; [(n, !q)]))
|
|
|
|
(ilist 1 (Pdfpage.endpage pdf))
|
|
|
|
pages)
|
|
|
|
in
|
|
|
|
Pdfpage.change_pages ~changes true pdf pages_out
|
2024-02-05 15:01:16 +01:00
|
|
|
|
2024-02-05 15:38:05 +01:00
|
|
|
let chop ~x ~y ~columns ~btt ~rtl pdf range =
|
|
|
|
chop_inner ~line:0. ~x ~y ~columns ~btt ~rtl pdf range
|
2024-02-05 15:01:16 +01:00
|
|
|
|
2024-02-05 15:38:05 +01:00
|
|
|
let chop_hv ~is_h ~line ~columns pdf range =
|
|
|
|
chop_inner ~line ~x:(if is_h then 0 else 1) ~y:(if is_h then 1 else 0) ~columns ~btt:false ~rtl:false pdf range
|