# -*- encoding: utf-8; frozen_string_literal: true -*-
#
#--
# This file is part of HexaPDF.
#
# HexaPDF - A Versatile PDF Creation and Manipulation Library For Ruby
# Copyright (C) 2014-2022 Thomas Leitner
#
# HexaPDF is free software: you can redistribute it and/or modify it
# under the terms of the GNU Affero General Public License version 3 as
# published by the Free Software Foundation with the addition of the
# following permission added to Section 15 as permitted in Section 7(a):
# FOR ANY PART OF THE COVERED WORK IN WHICH THE COPYRIGHT IS OWNED BY
# THOMAS LEITNER, THOMAS LEITNER DISCLAIMS THE WARRANTY OF NON
# INFRINGEMENT OF THIRD PARTY RIGHTS.
#
# HexaPDF is distributed in the hope that it will be useful, but WITHOUT
# ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
# FITNESS FOR A PARTICULAR PURPOSE. See the GNU Affero General Public
# License for more details.
#
# You should have received a copy of the GNU Affero General Public License
# along with HexaPDF. If not, see .
#
# The interactive user interfaces in modified source and object code
# versions of HexaPDF must display Appropriate Legal Notices, as required
# under Section 5 of the GNU Affero General Public License version 3.
#
# In accordance with Section 7(b) of the GNU Affero General Public
# License, a covered work must retain the producer line in every PDF that
# is created or manipulated using HexaPDF.
#
# If the GNU Affero General Public License doesn't fit your need,
# commercial licenses are available at .
#++
require 'hexapdf/font/type1/font_metrics'
require 'hexapdf/error'
module HexaPDF
module Font
module Type1
# Parses files in the AFM file format.
#
# Note that this implementation isn't a full AFM parser, only what is needed for parsing the
# AFM files for the 14 PDF core fonts is implemented. However, if need be it should be
# adaptable to other AFM files.
#
# For information on the AFM file format have a look at Adobe technical note #5004 - Adobe
# Font Metrics File Format Specification Version 4.1, available at the Adobe website.
#
# == How Parsing Works
#
# AFM is a line oriented format. Each line consists of one or more values of supported types
# (string, name, number, integer, array, boolean) which are separated by whitespace characters
# (space, newline, tab) except for the string type which just uses everything until the end of
# the line.
#
# This parser reads in line by line and the type parsing functions parse a value from the
# front of the line and then remove the parsed part from the line, including trailing
# whitespace characters.
class AFMParser
# :call-seq:
# Parser.parse(filename) -> font_metrics
# Parser.parse(io) -> font_metrics
#
# Parses the IO or file and returns a FontMetrics object.
def self.parse(source)
if source.respond_to?(:read)
new(source).parse
else
File.open(source) {|file| new(file).parse }
end
end
# Creates a new parse for the given IO stream.
def initialize(io)
@io = io
end
# Parses the AFM file and returns a FontMetrics object.
def parse
@metrics = FontMetrics.new
sections = []
each_line do
case (command = parse_name)
when /\AStart/
sections.push(command)
case command
when 'StartCharMetrics' then parse_character_metrics
when 'StartKernPairs' then parse_kerning_pairs
end
when /\AEnd/
sections.pop
break if sections.empty? && command == 'EndFontMetrics'
else
if sections.empty?
parse_global_font_information(command.to_sym)
end
end
end
if @metrics.bounding_box && !@metrics.descender
@metrics.descender = @metrics.bounding_box[1]
end
if @metrics.bounding_box && !@metrics.ascender
@metrics.ascender = @metrics.bounding_box[3]
end
@metrics
end
private
# Parses global font information line for the given +command+ (a symbol).
#
# It is assumed that the command name has already been parsed from the line.
#
# Note that writing direction metrics are also processed here since the standard 14 core
# fonts' AFM files don't have an extra StartDirection section.
def parse_global_font_information(command)
case command
when :FontName then @metrics.font_name = parse_string
when :FullName then @metrics.full_name = parse_string
when :FamilyName then @metrics.family_name = parse_string
when :CharacterSet then @metrics.character_set = parse_string
when :EncodingScheme then @metrics.encoding_scheme = parse_string
when :Weight then @metrics.weight = parse_string
when :FontBBox
@metrics.bounding_box = [parse_number, parse_number, parse_number, parse_number]
when :CapHeight then @metrics.cap_height = parse_number
when :XHeight then @metrics.x_height = parse_number
when :Ascender then @metrics.ascender = parse_number
when :Descender then @metrics.descender = parse_number
when :StdHW then @metrics.dominant_horizontal_stem_width = parse_number
when :StdVW then @metrics.dominant_vertical_stem_width = parse_number
when :UnderlinePosition then @metrics.underline_position = parse_number
when :UnderlineThickness then @metrics.underline_thickness = parse_number
when :ItalicAngle then @metrics.italic_angle = parse_number
when :IsFixedPitch then @metrics.is_fixed_pitch = parse_boolean
end
end
# Parses the character metrics in a StartCharMetrics section.
#
# It is assumed that the StartCharMetrics name has already been parsed from the line.
def parse_character_metrics
parse_integer.times do
read_line
char = CharacterMetrics.new
if @line =~ /C (\S+) ; WX (\S+) ; N (\S+) ; B (\S+) (\S+) (\S+) (\S+) ;((?: L \S+ \S+ ;)+)?/
char.code = $1.to_i
char.width = $2.to_f
char.name = $3.to_sym
char.bbox = [$4.to_i, $5.to_i, $6.to_i, $7.to_i]
if $8
@metrics.ligature_pairs[char.name] = {}
$8.scan(/L (\S+) (\S+)/).each do |name, ligature|
@metrics.ligature_pairs[char.name][name.to_sym] = ligature.to_sym
end
end
end
@metrics.character_metrics[char.name] = char if char.name
@metrics.character_metrics[char.code] = char if char.code != -1
end
end
# Parses the kerning pairs in a StartKernPairs section.
#
# It is assumed that the StartKernPairs name has already been parsed from the line.
def parse_kerning_pairs
parse_integer.times do
read_line
if @line =~ /KPX (\S+) (\S+) (\S+)/
(@metrics.kerning_pairs[$1.to_sym] ||= {})[$2.to_sym] = $3.to_i
end
end
end
# Iterates over all the lines in the IO, yielding every time a line has been read into the
# internal buffer.
def each_line
read_line
unless parse_name == 'StartFontMetrics'
raise HexaPDF::Error, "The AFM file has to start with StartFontMetrics, not #{@line}"
end
until @io.eof?
read_line
yield
end
end
# Reads the next line into the current line variable.
def read_line
@line = @io.readline
end
# Parses and returns the name at the start of the line, with whitespace stripped.
def parse_name
result = @line[/\S+\s*/].to_s
@line[0, result.size] = ''
result.strip!
result
end
# Returns the rest of the line, with whitespace stripped.
def parse_string
@line.strip!
line = @line
@line = ''
line
end
# Parses the integer at the start of the line.
def parse_integer
parse_name.to_i
end
# Parses the float number at the start of the line.
def parse_number
parse_name.to_f
end
# Parses the boolean at the start of the line.
def parse_boolean
parse_name == 'true'
end
end
end
end
end