# -*- encoding: utf-8; frozen_string_literal: true -*- # #-- # This file is part of HexaPDF. # # HexaPDF - A Versatile PDF Creation and Manipulation Library For Ruby # Copyright (C) 2014-2022 Thomas Leitner # # HexaPDF is free software: you can redistribute it and/or modify it # under the terms of the GNU Affero General Public License version 3 as # published by the Free Software Foundation with the addition of the # following permission added to Section 15 as permitted in Section 7(a): # FOR ANY PART OF THE COVERED WORK IN WHICH THE COPYRIGHT IS OWNED BY # THOMAS LEITNER, THOMAS LEITNER DISCLAIMS THE WARRANTY OF NON # INFRINGEMENT OF THIRD PARTY RIGHTS. # # HexaPDF is distributed in the hope that it will be useful, but WITHOUT # ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or # FITNESS FOR A PARTICULAR PURPOSE. See the GNU Affero General Public # License for more details. # # You should have received a copy of the GNU Affero General Public License # along with HexaPDF. If not, see . # # The interactive user interfaces in modified source and object code # versions of HexaPDF must display Appropriate Legal Notices, as required # under Section 5 of the GNU Affero General Public License version 3. # # In accordance with Section 7(b) of the GNU Affero General Public # License, a covered work must retain the producer line in every PDF that # is created or manipulated using HexaPDF. # # If the GNU Affero General Public License doesn't fit your need, # commercial licenses are available at . #++ require 'hexapdf/type/font' require 'hexapdf/stream' require 'hexapdf/font/cmap' module HexaPDF module Type # Represents a composite PDF font. # # Composites fonts wrap a descendant CIDFont and use CIDs to identify glyphs. A CID can be # encoded in one or more bytes and an associated CMap specifies how this encoding is done. # Composite fonts also allow for vertical writing mode and support TrueType as well as OpenType # fonts. # # See: PDF1.7 s9.7 class FontType0 < Font define_field :Subtype, type: Symbol, required: true, default: :Type0 define_field :BaseFont, type: Symbol, required: true define_field :Encoding, type: [Stream, Symbol], required: true define_field :DescendantFonts, type: PDFArray, required: true # Returns the CID font of this type 0 font. def descendant_font cache(:descendant_font) do document.wrap(self[:DescendantFonts][0]) end end # Returns the writing mode which is either :horizontal or :vertical. def writing_mode cmap.wmode == 0 ? :horizontal : :vertical end # Decodes the given string into an array of CIDs. def decode(string) cmap.read_codes(string) end # Returns the UTF-8 string for the given code, or calls the configuration option # 'font.on_missing_unicode_mapping' if no mapping was found. def to_utf8(code) to_unicode_cmap&.to_unicode(code) || ucs2_cmap&.to_unicode(code) || missing_unicode_mapping(code) end # Returns the unscaled width of the given CID in glyph units, or 0 if the width for the code # point is missing. def width(code) descendant_font.width(cmap.to_cid(code)) end # Returns the bounding box of the font or +nil+ if it is not found. def bounding_box descendant_font.bounding_box end # Returns +true+ if the font is embedded. def embedded? descendant_font.embedded? end # Returns the embeeded font file object or +nil+ if the font is not embedded. def font_file descendant_font.font_file end # Returns whether word spacing is applicable when using this font. # # Note that the return value is cached when accessed the first time. # # See: PDF1.7 s9.3.3 def word_spacing_applicable? @word_spacing_applicable ||= ((cmap.read_codes("\x20") && true) rescue false) end private # Returns the CMap used for decoding strings for this font. # # Note that the CMap is cached internally when accessed the first time. def cmap cache(:cmap) do val = self[:Encoding] if val.kind_of?(Symbol) HexaPDF::Font::CMap.for_name(val.to_s) elsif val.kind_of?(HexaPDF::Stream) HexaPDF::Font::CMap.parse(val.stream) else raise HexaPDF::Error, "Unknown value for font's encoding: #{self[:Encoding]}" end end end # Returns the UCS-2 CMap used for extracting text when no ToUnicode CMap is available, or # +nil+ if the UCS-2 CMap could not be determined. # # Note that the CMap is cached internally when accessed the first time. # # See: PDF1.7 s9.10.2 def ucs2_cmap cache(:ucs2_cmap) do encoding = self[:Encoding] system_info = descendant_font[:CIDSystemInfo] registry = system_info[:Registry] ordering = system_info[:Ordering] if (encoding.kind_of?(Symbol) && HexaPDF::Font::CMap.predefined?(encoding.to_s) && encoding != :'Identity-H' && encoding != :'Identity-V') || (registry == "Adobe" && ['GB1', 'CNS1', 'Japan1', 'Korea1'].include?(ordering)) HexaPDF::Font::CMap.for_name("#{registry}-#{ordering}-UCS2") end end end end end end