From 2d95e886ee35dcc6dc0030da910c9bc6e8ec7722 Mon Sep 17 00:00:00 2001 From: Ana Gelez Date: Wed, 17 Apr 2024 16:37:08 +0200 Subject: [PATCH] Use a trait to support both u8 and u16 when writing CMaps --- src/font.rs | 85 +++++++++++++++++++++++++++++++++++------------------ 1 file changed, 57 insertions(+), 28 deletions(-) diff --git a/src/font.rs b/src/font.rs index 3b27437..39295f0 100644 --- a/src/font.rs +++ b/src/font.rs @@ -1,3 +1,5 @@ +use std::marker::PhantomData; + use super::*; /// Writer for a _Type-1 font dictionary_. @@ -653,27 +655,19 @@ impl<'a> Cmap<'a> { deref!('a, Cmap<'a> => Stream<'a>, stream); /// A builder for a `/ToUnicode` character map stream. -pub struct UnicodeCmap { +pub struct UnicodeCmap { buf: Vec, mappings: Vec, count: i32, - /// Are the glyphs IDs represented using one byte only? - one_byte_gids: bool, + glyph_id: PhantomData, } -impl UnicodeCmap { +impl UnicodeCmap +where + G: GlyphId, +{ /// Create a new, empty unicode character map. - pub fn new(name: Name, info: SystemInfo) -> Self { - Self::new_with_dimension(name, info, false) - } - - /// Create a new, empty unicode character map, that supports either one-byte - /// or two-bytes glyph IDs. - /// - /// Most fonts will use two bytes, but for Type3 fonts (which can only contain - /// up to 256 glyphs) some readers (Adobe Acrobat) will only accept one-byte - /// glyph IDs. - pub fn new_with_dimension(name: Name, info: SystemInfo, one_byte_gids: bool) -> Self { + pub fn new_with_dimension(name: Name, info: SystemInfo) -> Self { // https://www.adobe.com/content/dam/acom/en/devnet/font/pdfs/5014.CIDFont_Spec.pdf let mut buf = Vec::new(); @@ -722,33 +716,34 @@ impl UnicodeCmap { // We just cover the whole unicode codespace. buf.extend(b"1 begincodespacerange\n"); - if one_byte_gids { - buf.extend(b"<00> \n"); - } else { - buf.extend(b"<0000> \n"); - } + buf.push(b'<'); + G::MIN.push(&mut buf); + buf.extend(b"> <"); + G::MAX.push(&mut buf); + buf.extend(b">\n"); buf.extend(b"endcodespacerange\n"); - Self { buf, mappings: vec![], count: 0, one_byte_gids } + Self { + buf, + mappings: vec![], + count: 0, + glyph_id: PhantomData, + } } /// Add a mapping from a glyph ID to a codepoint. - pub fn pair(&mut self, glyph: u16, codepoint: char) { + pub fn pair(&mut self, glyph: G, codepoint: char) { self.pair_with_multiple(glyph, [codepoint]); } /// Add a mapping from a glyph ID to multiple codepoints. pub fn pair_with_multiple( &mut self, - glyph: u16, + glyph: G, codepoints: impl IntoIterator, ) { self.mappings.push(b'<'); - if self.one_byte_gids { - self.mappings.push_hex(glyph as u8); - } else { - self.mappings.push_hex_u16(glyph); - } + glyph.push(&mut self.mappings); self.mappings.extend(b"> <"); for c in codepoints { @@ -795,6 +790,40 @@ impl UnicodeCmap { } } +/// Type3 fonts require (in Acrobat at least) IDs in CMaps to be encoded with one byte only, whereas other font types use two bytes. +/// +/// This trait provides an abstraction to support both. +pub trait GlyphId: private::Sealed { + const MIN: Self; + const MAX: Self; + fn push(self, buf: &mut Vec); +} + +impl GlyphId for u8 { + const MIN: Self = u8::MIN; + const MAX: Self = u8::MAX; + + fn push(self, buf: &mut Vec) { + buf.push_hex(self); + } +} + +impl GlyphId for u16 { + const MIN: Self = u16::MIN; + const MAX: Self = u16::MAX; + + fn push(self, buf: &mut Vec) { + buf.push_hex_u16(self); + } +} + +/// Module to seal the `GlyphId` trait. +mod private { + pub trait Sealed {} + impl Sealed for u8 {} + impl Sealed for u16 {} +} + /// Specifics about a character collection. #[derive(Debug, Copy, Clone, Eq, PartialEq, Hash)] pub struct SystemInfo<'a> {