Switch PDF backend to `krilla` (#5420)

Co-authored-by: Laurenz <laurmaedje@gmail.com>
author: Laurenz Stampfl <47084093+LaurenzV@users.noreply.github.com> 2025-04-01 16:42:52 +0200
committer: GitHub <noreply@github.com> 2025-04-01 14:42:52 +0000
commit: 96dd67e011bb317cf78683bcf1edfdfca5e7b6b3 (patch)
tree: 900a0c4e7723af4289685af35d788041055ad4a2 /crates/typst-pdf/src/catalog.rs
parent: 012e14d40cb44997630cf6469a446f217f2e9057 (diff)
1 files changed, 0 insertions, 385 deletions
diff --git a/crates/typst-pdf/src/catalog.rs b/crates/typst-pdf/src/catalog.rs
deleted file mode 100644
index 709b0155..00000000
--- a/crates/typst-pdf/src/catalog.rs
+++ /dev/null
@@ -1,385 +0,0 @@
-use std::num::NonZeroUsize;
-
-use ecow::eco_format;
-use pdf_writer::types::Direction;
-use pdf_writer::writers::PageLabel;
-use pdf_writer::{Finish, Name, Pdf, Ref, Str, TextStr};
-use typst_library::diag::{bail, SourceResult};
-use typst_library::foundations::{Datetime, Smart};
-use typst_library::layout::Dir;
-use typst_library::text::Lang;
-use typst_syntax::Span;
-use xmp_writer::{DateTime, LangId, RenditionClass, XmpWriter};
-
-use crate::page::PdfPageLabel;
-use crate::{hash_base64, outline, TextStrExt, Timestamp, Timezone, WithEverything};
-
-/// Write the document catalog.
-pub fn write_catalog(
-    ctx: WithEverything,
-    pdf: &mut Pdf,
-    alloc: &mut Ref,
-) -> SourceResult<()> {
-    let lang = ctx
-        .resources
-        .languages
-        .iter()
-        .max_by_key(|(_, &count)| count)
-        .map(|(&l, _)| l);
-
-    let dir = if lang.map(Lang::dir) == Some(Dir::RTL) {
-        Direction::R2L
-    } else {
-        Direction::L2R
-    };
-
-    // Write the outline tree.
-    let outline_root_id = outline::write_outline(pdf, alloc, &ctx);
-
-    // Write the page labels.
-    let page_labels = write_page_labels(pdf, alloc, &ctx);
-
-    // Write the document information.
-    let info_ref = alloc.bump();
-    let mut info = pdf.document_info(info_ref);
-    let mut xmp = XmpWriter::new();
-    if let Some(title) = &ctx.document.info.title {
-        info.title(TextStr::trimmed(title));
-        xmp.title([(None, title.as_str())]);
-    }
-
-    if let Some(description) = &ctx.document.info.description {
-        info.subject(TextStr::trimmed(description));
-        xmp.description([(None, description.as_str())]);
-    }
-
-    let authors = &ctx.document.info.author;
-    if !authors.is_empty() {
-        // Turns out that if the authors are given in both the document
-        // information dictionary and the XMP metadata, Acrobat takes a little
-        // bit of both: The first author from the document information
-        // dictionary and the remaining authors from the XMP metadata.
-        //
-        // To fix this for Acrobat, we could omit the remaining authors or all
-        // metadata from the document information catalog (it is optional) and
-        // only write XMP. However, not all other tools (including Apple
-        // Preview) read the XMP data. This means we do want to include all
-        // authors in the document information dictionary.
-        //
-        // Thus, the only alternative is to fold all authors into a single
-        // `<rdf:li>` in the XMP metadata. This is, in fact, exactly what the
-        // PDF/A spec Part 1 section 6.7.3 has to say about the matter. It's a
-        // bit weird to not use the array (and it makes Acrobat show the author
-        // list in quotes), but there's not much we can do about that.
-        let joined = authors.join(", ");
-        info.author(TextStr::trimmed(&joined));
-        xmp.creator([joined.as_str()]);
-    }
-
-    let creator = eco_format!("Typst {}", env!("CARGO_PKG_VERSION"));
-    info.creator(TextStr(&creator));
-    xmp.creator_tool(&creator);
-
-    let keywords = &ctx.document.info.keywords;
-    if !keywords.is_empty() {
-        let joined = keywords.join(", ");
-        info.keywords(TextStr::trimmed(&joined));
-        xmp.pdf_keywords(&joined);
-    }
-    let (date, tz) = document_date(ctx.document.info.date, ctx.options.timestamp);
-    if let Some(pdf_date) = date.and_then(|date| pdf_date(date, tz)) {
-        info.creation_date(pdf_date);
-        info.modified_date(pdf_date);
-    }
-
-    info.finish();
-
-    // A unique ID for this instance of the document. Changes if anything
-    // changes in the frames.
-    let instance_id = hash_base64(&pdf.as_bytes());
-
-    // Determine the document's ID. It should be as stable as possible.
-    const PDF_VERSION: &str = "PDF-1.7";
-    let doc_id = if let Smart::Custom(ident) = ctx.options.ident {
-        // We were provided with a stable ID. Yay!
-        hash_base64(&(PDF_VERSION, ident))
-    } else if ctx.document.info.title.is_some() && !ctx.document.info.author.is_empty() {
-        // If not provided from the outside, but title and author were given, we
-        // compute a hash of them, which should be reasonably stable and unique.
-        hash_base64(&(PDF_VERSION, &ctx.document.info.title, &ctx.document.info.author))
-    } else {
-        // The user provided no usable metadata which we can use as an `/ID`.
-        instance_id.clone()
-    };
-
-    xmp.document_id(&doc_id);
-    xmp.instance_id(&instance_id);
-    xmp.format("application/pdf");
-    xmp.pdf_version("1.7");
-    xmp.language(ctx.resources.languages.keys().map(|lang| LangId(lang.as_str())));
-    xmp.num_pages(ctx.document.pages.len() as u32);
-    xmp.rendition_class(RenditionClass::Proof);
-
-    if let Some(xmp_date) = date.and_then(|date| xmp_date(date, tz)) {
-        xmp.create_date(xmp_date);
-        xmp.modify_date(xmp_date);
-
-        if ctx.options.standards.pdfa {
-            let mut history = xmp.history();
-            history
-                .add_event()
-                .action(xmp_writer::ResourceEventAction::Saved)
-                .when(xmp_date)
-                .instance_id(&eco_format!("{instance_id}_source"));
-            history
-                .add_event()
-                .action(xmp_writer::ResourceEventAction::Converted)
-                .when(xmp_date)
-                .instance_id(&instance_id)
-                .software_agent(&creator);
-        }
-    }
-
-    // Assert dominance.
-    if let Some((part, conformance)) = ctx.options.standards.pdfa_part {
-        let mut extension_schemas = xmp.extension_schemas();
-        extension_schemas
-            .xmp_media_management()
-            .properties()
-            .describe_instance_id();
-        extension_schemas.pdf().properties().describe_all();
-        extension_schemas.finish();
-        xmp.pdfa_part(part);
-        xmp.pdfa_conformance(conformance);
-    }
-
-    let xmp_buf = xmp.finish(None);
-    let meta_ref = alloc.bump();
-    pdf.stream(meta_ref, xmp_buf.as_bytes())
-        .pair(Name(b"Type"), Name(b"Metadata"))
-        .pair(Name(b"Subtype"), Name(b"XML"));
-
-    // Set IDs only now, so that we don't need to clone them.
-    pdf.set_file_id((doc_id.into_bytes(), instance_id.into_bytes()));
-
-    // Write the document catalog.
-    let catalog_ref = alloc.bump();
-    let mut catalog = pdf.catalog(catalog_ref);
-    catalog.pages(ctx.page_tree_ref);
-    catalog.viewer_preferences().direction(dir);
-    catalog.metadata(meta_ref);
-
-    let has_dests = !ctx.references.named_destinations.dests.is_empty();
-    let has_embeddings = !ctx.references.embedded_files.is_empty();
-
-    // Write the `/Names` dictionary.
-    if has_dests || has_embeddings {
-        // Write the named destination tree if there are any entries.
-        let mut name_dict = catalog.names();
-        if has_dests {
-            let mut dests_name_tree = name_dict.destinations();
-            let mut names = dests_name_tree.names();
-            for &(name, dest_ref, ..) in &ctx.references.named_destinations.dests {
-                names.insert(Str(name.resolve().as_bytes()), dest_ref);
-            }
-        }
-
-        if has_embeddings {
-            let mut embedded_files = name_dict.embedded_files();
-            let mut names = embedded_files.names();
-            for (name, file_ref) in &ctx.references.embedded_files {
-                names.insert(Str(name.as_bytes()), *file_ref);
-            }
-        }
-    }
-
-    if has_embeddings && ctx.options.standards.pdfa {
-        // PDF 2.0, but ISO 19005-3 (PDF/A-3) Annex E allows it for PDF/A-3.
-        let mut associated_files = catalog.insert(Name(b"AF")).array().typed();
-        for (_, file_ref) in ctx.references.embedded_files {
-            associated_files.item(file_ref).finish();
-        }
-    }
-
-    // Insert the page labels.
-    if !page_labels.is_empty() {
-        let mut num_tree = catalog.page_labels();
-        let mut entries = num_tree.nums();
-        for (n, r) in &page_labels {
-            entries.insert(n.get() as i32 - 1, *r);
-        }
-    }
-
-    if let Some(outline_root_id) = outline_root_id {
-        catalog.outlines(outline_root_id);
-    }
-
-    if let Some(lang) = lang {
-        catalog.lang(TextStr(lang.as_str()));
-    }
-
-    if ctx.options.standards.pdfa {
-        catalog
-            .output_intents()
-            .push()
-            .subtype(pdf_writer::types::OutputIntentSubtype::PDFA)
-            .output_condition(TextStr("sRGB"))
-            .output_condition_identifier(TextStr("Custom"))
-            .info(TextStr("sRGB IEC61966-2.1"))
-            .dest_output_profile(ctx.globals.color_functions.srgb.unwrap());
-    }
-
-    catalog.finish();
-
-    if ctx.options.standards.pdfa && pdf.refs().count() > 8388607 {
-        bail!(Span::detached(), "too many PDF objects");
-    }
-
-    Ok(())
-}
-
-/// Write the page labels.
-pub(crate) fn write_page_labels(
-    chunk: &mut Pdf,
-    alloc: &mut Ref,
-    ctx: &WithEverything,
-) -> Vec<(NonZeroUsize, Ref)> {
-    // If there is no exported page labeled, we skip the writing
-    if !ctx.pages.iter().filter_map(Option::as_ref).any(|p| {
-        p.label
-            .as_ref()
-            .is_some_and(|l| l.prefix.is_some() || l.style.is_some())
-    }) {
-        return Vec::new();
-    }
-
-    let empty_label = PdfPageLabel::default();
-    let mut result = vec![];
-    let mut prev: Option<&PdfPageLabel> = None;
-
-    // Skip non-exported pages for numbering.
-    for (i, page) in ctx.pages.iter().filter_map(Option::as_ref).enumerate() {
-        let nr = NonZeroUsize::new(1 + i).unwrap();
-        // If there are pages with empty labels between labeled pages, we must
-        // write empty PageLabel entries.
-        let label = page.label.as_ref().unwrap_or(&empty_label);
-
-        if let Some(pre) = prev {
-            if label.prefix == pre.prefix
-                && label.style == pre.style
-                && label.offset == pre.offset.map(|n| n.saturating_add(1))
-            {
-                prev = Some(label);
-                continue;
-            }
-        }
-
-        let id = alloc.bump();
-        let mut entry = chunk.indirect(id).start::<PageLabel>();
-
-        // Only add what is actually provided. Don't add empty prefix string if
-        // it wasn't given for example.
-        if let Some(prefix) = &label.prefix {
-            entry.prefix(TextStr::trimmed(prefix));
-        }
-
-        if let Some(style) = label.style {
-            entry.style(style.to_pdf_numbering_style());
-        }
-
-        if let Some(offset) = label.offset {
-            entry.offset(offset.get() as i32);
-        }
-
-        result.push((nr, id));
-        prev = Some(label);
-    }
-
-    result
-}
-
-/// Resolve the document date.
-///
-/// (1) If the `document.date` is set to specific `datetime` or `none`, use it.
-/// (2) If the `document.date` is set to `auto` or not set, try to use the
-///     date from the options.
-/// (3) Otherwise, we don't write date metadata.
-pub fn document_date(
-    document_date: Smart<Option<Datetime>>,
-    timestamp: Option<Timestamp>,
-) -> (Option<Datetime>, Option<Timezone>) {
-    match (document_date, timestamp) {
-        (Smart::Custom(date), _) => (date, None),
-        (Smart::Auto, Some(timestamp)) => {
-            (Some(timestamp.datetime), Some(timestamp.timezone))
-        }
-        _ => (None, None),
-    }
-}
-
-/// Converts a datetime to a pdf-writer date.
-pub fn pdf_date(datetime: Datetime, tz: Option<Timezone>) -> Option<pdf_writer::Date> {
-    let year = datetime.year().filter(|&y| y >= 0)? as u16;
-
-    let mut pdf_date = pdf_writer::Date::new(year);
-
-    if let Some(month) = datetime.month() {
-        pdf_date = pdf_date.month(month);
-    }
-
-    if let Some(day) = datetime.day() {
-        pdf_date = pdf_date.day(day);
-    }
-
-    if let Some(h) = datetime.hour() {
-        pdf_date = pdf_date.hour(h);
-    }
-
-    if let Some(m) = datetime.minute() {
-        pdf_date = pdf_date.minute(m);
-    }
-
-    if let Some(s) = datetime.second() {
-        pdf_date = pdf_date.second(s);
-    }
-
-    match tz {
-        Some(Timezone::UTC) => {
-            pdf_date = pdf_date.utc_offset_hour(0).utc_offset_minute(0)
-        }
-        Some(Timezone::Local { hour_offset, minute_offset }) => {
-            pdf_date =
-                pdf_date.utc_offset_hour(hour_offset).utc_offset_minute(minute_offset)
-        }
-        None => {}
-    }
-
-    Some(pdf_date)
-}
-
-/// Converts a datetime to an xmp-writer datetime.
-fn xmp_date(
-    datetime: Datetime,
-    timezone: Option<Timezone>,
-) -> Option<xmp_writer::DateTime> {
-    let year = datetime.year().filter(|&y| y >= 0)? as u16;
-    let timezone = timezone.map(|tz| match tz {
-        Timezone::UTC => xmp_writer::Timezone::Utc,
-        Timezone::Local { hour_offset, minute_offset } => {
-            // The xmp-writer use signed integers for the minute offset, which
-            // can be buggy if the minute offset is negative. And because our
-            // minute_offset is ensured to be `0 <= minute_offset < 60`, we can
-            // safely cast it to a signed integer.
-            xmp_writer::Timezone::Local { hour: hour_offset, minute: minute_offset as i8 }
-        }
-    });
-    Some(DateTime {
-        year,
-        month: datetime.month(),
-        day: datetime.day(),
-        hour: datetime.hour(),
-        minute: datetime.minute(),
-        second: datetime.second(),
-        timezone,
-    })
-}
author	Laurenz Stampfl <47084093+LaurenzV@users.noreply.github.com>	2025-04-01 16:42:52 +0200
committer	GitHub <noreply@github.com>	2025-04-01 14:42:52 +0000
commit	96dd67e011bb317cf78683bcf1edfdfca5e7b6b3 (patch)
tree	900a0c4e7723af4289685af35d788041055ad4a2 /crates/typst-pdf/src/catalog.rs
parent	012e14d40cb44997630cf6469a446f217f2e9057 (diff)