cpdf-source/cpdftype.ml

165 lines
5.0 KiB
OCaml
Raw Normal View History

2021-11-18 20:09:09 +01:00
(* A typesetter for cpdf. A list of elements is manipulated zero or more times
to lay it out, paginate it, and so on. It is then typeset to produce a list
of pages *)
2021-11-18 23:48:25 +01:00
open Pdfutil
2021-11-18 20:09:09 +01:00
(* Text is represented as a list of unicode code points *)
type text = int list
(* Glue *)
type glue =
{glen : float;
stretch : float}
(* Main type *)
2021-11-18 23:48:25 +01:00
type element =
2021-11-18 20:09:09 +01:00
Text of text
| HGlue of glue
| VGlue of glue
| NewLine
| NewPage
2021-11-18 23:48:25 +01:00
| Font of Pdftext.font * float
let string_of_element = function
| Text t -> Pdftext.utf8_of_codepoints t
| HGlue _ -> "HGLUE"
| VGlue _ -> "VGLUE"
| NewLine -> "NewLine"
| NewPage -> "NewPage"
| Font _ -> "Font"
2021-11-18 20:09:09 +01:00
let indent x = HGlue {glen = x; stretch = 0.}
2021-11-18 23:48:25 +01:00
let newpara x = VGlue {glen = x; stretch = 0.}
2021-11-18 20:09:09 +01:00
2021-11-18 23:48:25 +01:00
type t = element list
2021-11-18 20:09:09 +01:00
let of_utf8 = Pdftext.codepoints_of_utf8
let example =
2021-11-18 23:48:25 +01:00
[Font (Pdftext.StandardFont (Pdftext.TimesRoman, Pdftext.WinAnsiEncoding), 12.);
Text (of_utf8 "Jackdaws love my Sphinx of Quartz. And this, this is the second sentence to provoke a line-break.");
NewLine;
2021-11-18 20:09:09 +01:00
newpara 10.;
indent 72.;
2021-11-19 00:32:58 +01:00
Font (Pdftext.StandardFont (Pdftext.TimesItalic, Pdftext.WinAnsiEncoding), 10.);
2021-11-18 20:09:09 +01:00
Text (of_utf8 "The second paragraph");
NewPage]
type state =
2021-11-18 23:48:25 +01:00
{mutable font : Pdftext.font option;
2021-11-18 20:09:09 +01:00
mutable xpos : float;
mutable ypos : float}
let initial_state () =
2021-11-18 23:48:25 +01:00
{font = None;
2021-11-18 20:09:09 +01:00
xpos = 0.;
ypos = 0.}
(* Split text into lines, resolve all hglue stretches to 0, remove Newlines. *)
2021-11-18 23:48:25 +01:00
let layout_element s xpos_max fo = function
2021-11-19 00:23:38 +01:00
| e -> fo e
2021-11-18 23:48:25 +01:00
2021-11-18 20:09:09 +01:00
let layout lmargin rmargin papersize i =
2021-11-19 00:23:38 +01:00
let width =
Pdfunits.convert 72. (Pdfpaper.unit papersize) Pdfunits.PdfPoint (Pdfpaper.width papersize)
in
let o = ref [] in
2021-11-18 23:48:25 +01:00
let s = initial_state () in
let xpos_max = Pdfpaper.width papersize -. lmargin in
2021-11-19 00:23:38 +01:00
s.xpos <- lmargin;
iter (layout_element s xpos_max (fun e -> o := e::!o)) i;
rev !o
2021-11-18 20:09:09 +01:00
(* Resolve all hglue stretches, insert NewPage as needed. *)
let paginate tmargin bmargin papersize i = i
2021-11-18 23:48:25 +01:00
let make_resources fontobjnums =
Pdf.Dictionary
[("/Font", Pdf.Dictionary (map (fun fo -> ("/F" ^ string_of_int fo, Pdf.Indirect fo)) fontobjnums))]
(* At this stage, just Font and Text and HGlue 0. and VGlue 0. and Newline and
NewPage elements. Split on NewPages, typeset each page, add font
dictionaries. New page only
creates a page when that page has content. *)
let typeset lmargin rmargin tmargin bmargin papersize pdf i =
let i = layout lmargin rmargin papersize i in
let i = paginate tmargin bmargin papersize i in
2021-11-19 00:23:38 +01:00
let height = Pdfunits.convert 72. (Pdfpaper.unit papersize) Pdfunits.PdfPoint (Pdfpaper.height papersize) in
2021-11-18 23:48:25 +01:00
let s = initial_state () in
s.xpos <- lmargin;
2021-11-19 00:23:38 +01:00
s.ypos <- tmargin;
2021-11-18 23:48:25 +01:00
let ops = ref [] in
let fonts = ref [] in
let thispagefontnums = ref [] in
let pages = ref [] in
let write_page () =
if !ops <> [] then
let page =
{Pdfpage.content = [Pdfops.stream_of_ops (rev !ops)];
Pdfpage.mediabox = Pdfpage.rectangle_of_paper papersize;
Pdfpage.resources = make_resources !thispagefontnums;
Pdfpage.rotate = Pdfpage.Rotate0;
Pdfpage.rest = Pdf.Dictionary []}
in
pages := page :: !pages
in
let typeset_element = function
| Text cps ->
let charcodestring =
match s.font with
| None -> failwith "font not set up"
| Some f ->
match List.assoc_opt f !fonts with
| Some objnum ->
let extractor =
Pdftext.charcode_extractor_of_font pdf (Pdf.lookup_obj pdf objnum)
in
implode (map char_of_int (option_map extractor cps))
| None -> failwith "font not found"
in
ops :=
2021-11-19 00:23:38 +01:00
Pdfops.Op_Q
::Pdfops.Op_ET
2021-11-18 23:48:25 +01:00
::Pdfops.Op_Tj charcodestring
::Pdfops.Op_BT
::Pdfops.Op_cm (Pdftransform.mktranslate s.xpos (height -. s.ypos))
2021-11-19 00:23:38 +01:00
::Pdfops.Op_q
2021-11-18 23:48:25 +01:00
::!ops
| Font (f, fontsize) ->
let name, objnum =
match List.assoc_opt f !fonts with
| Some objnum -> ("/F" ^ string_of_int objnum, objnum)
| None ->
let num = Pdftext.write_font pdf f in
let n = "/F" ^ string_of_int num in
fonts := (f, num) :: !fonts;
(n, num)
in
s.font <- Some f;
thispagefontnums := objnum :: !thispagefontnums;
ops := Pdfops.Op_Tf (name, fontsize)::!ops
| HGlue {glen} ->
s.xpos <- s.xpos +. glen
| VGlue {glen} ->
2021-11-19 00:23:38 +01:00
s.ypos <- s.ypos +. glen
2021-11-18 23:48:25 +01:00
| NewLine ->
s.xpos <- 0.
| NewPage ->
write_page ();
ops := [];
s.xpos <- 0.;
s.ypos <- 0.
in
iter typeset_element i;
write_page ();
rev !pages
let example_pdf () =
let pdf = Pdf.empty () in
2021-11-19 00:23:38 +01:00
let pages = typeset 20. 20. 20. 20. Pdfpaper.a4 pdf example in
2021-11-18 23:48:25 +01:00
let pdf, pageroot = Pdfpage.add_pagetree pages pdf in
Pdfpage.add_root pageroot [] pdf
2021-11-18 20:09:09 +01:00
2021-11-18 23:48:25 +01:00
let _ =
Pdfwrite.pdf_to_file (example_pdf ()) "out.pdf"