font/sfnt/sfnt.go - image - Git at Google

 // Copyright 2016 The Go Authors. All rights reserved.
 // Use of this source code is governed by a BSD-style
 // license that can be found in the LICENSE file.

 //go:generate go run gen.go

 // Package sfnt implements a decoder for SFNT font file formats, including
 // TrueType and OpenType.
 package sfnt // import "golang.org/x/image/font/sfnt"

 // This implementation was written primarily to the
 // https://www.microsoft.com/en-us/Typography/OpenTypeSpecification.aspx
 // specification. Additional documentation is at
 // http://developer.apple.com/fonts/TTRefMan/
 //
 // The pyftinspect tool from https://github.com/fonttools/fonttools is useful
 // for inspecting SFNT fonts.
 //
 // The ttfdump tool is also useful. For example:
 //	ttfdump -t cmap ../testdata/CFFTest.otf dump.txt

 import (
 	"errors"
 	"io"

 	"golang.org/x/image/font"
 	"golang.org/x/image/math/fixed"
 	"golang.org/x/text/encoding/charmap"
 )

 // These constants are not part of the specifications, but are limitations used
 // by this implementation.
 const (
 	// This value is arbitrary, but defends against parsing malicious font
 	// files causing excessive memory allocations. For reference, Adobe's
 	// SourceHanSansSC-Regular.otf has 65535 glyphs and:
 	//	- its format-4  cmap table has  1581 segments.
 	//	- its format-12 cmap table has 16498 segments.
 	//
 	// TODO: eliminate this constraint? If the cmap table is very large, load
 	// some or all of it lazily (at the time Font.GlyphIndex is called) instead
 	// of all of it eagerly (at the time Font.initialize is called), while
 	// keeping an upper bound on the memory used? This will make the code in
 	// cmap.go more complicated, considering that all of the Font methods are
 	// safe to call concurrently, as long as each call has a different *Buffer.
 	maxCmapSegments = 20000

 	maxCompoundRecursionDepth = 8
 	maxCompoundStackSize      = 64
 	maxGlyphDataLength        = 64 * 1024
 	maxHintBits               = 256
 	maxNumFonts               = 256
 	maxNumTables              = 256
 	maxRealNumberStrLen       = 64 // Maximum length in bytes of the "-123.456E-7" representation.

 	// (maxTableOffset + maxTableLength) will not overflow an int32.
 	maxTableLength = 1 << 29
 	maxTableOffset = 1 << 29
 )

 var (
 	// ErrNotFound indicates that the requested value was not found.
 	ErrNotFound = errors.New("sfnt: not found")

 	errInvalidBounds         = errors.New("sfnt: invalid bounds")
 	errInvalidCFFTable       = errors.New("sfnt: invalid CFF table")
 	errInvalidCmapTable      = errors.New("sfnt: invalid cmap table")
 	errInvalidFont           = errors.New("sfnt: invalid font")
 	errInvalidFontCollection = errors.New("sfnt: invalid font collection")
 	errInvalidGlyphData      = errors.New("sfnt: invalid glyph data")
 	errInvalidHeadTable      = errors.New("sfnt: invalid head table")
 	errInvalidKernTable      = errors.New("sfnt: invalid kern table")
 	errInvalidLocaTable      = errors.New("sfnt: invalid loca table")
 	errInvalidLocationData   = errors.New("sfnt: invalid location data")
 	errInvalidMaxpTable      = errors.New("sfnt: invalid maxp table")
 	errInvalidNameTable      = errors.New("sfnt: invalid name table")
 	errInvalidPostTable      = errors.New("sfnt: invalid post table")
 	errInvalidSingleFont     = errors.New("sfnt: invalid single font (data is a font collection)")
 	errInvalidSourceData     = errors.New("sfnt: invalid source data")
 	errInvalidTableOffset    = errors.New("sfnt: invalid table offset")
 	errInvalidTableTagOrder  = errors.New("sfnt: invalid table tag order")
 	errInvalidUCS2String     = errors.New("sfnt: invalid UCS-2 string")

 	errUnsupportedCFFVersion           = errors.New("sfnt: unsupported CFF version")
 	errUnsupportedCmapEncodings        = errors.New("sfnt: unsupported cmap encodings")
 	errUnsupportedCompoundGlyph        = errors.New("sfnt: unsupported compound glyph")
 	errUnsupportedGlyphDataLength      = errors.New("sfnt: unsupported glyph data length")
 	errUnsupportedKernTable            = errors.New("sfnt: unsupported kern table")
 	errUnsupportedRealNumberEncoding   = errors.New("sfnt: unsupported real number encoding")
 	errUnsupportedNumberOfCmapSegments = errors.New("sfnt: unsupported number of cmap segments")
 	errUnsupportedNumberOfFonts        = errors.New("sfnt: unsupported number of fonts")
 	errUnsupportedNumberOfHints        = errors.New("sfnt: unsupported number of hints")
 	errUnsupportedNumberOfTables       = errors.New("sfnt: unsupported number of tables")
 	errUnsupportedPlatformEncoding     = errors.New("sfnt: unsupported platform encoding")
 	errUnsupportedPostTable            = errors.New("sfnt: unsupported post table")
 	errUnsupportedTableOffsetLength    = errors.New("sfnt: unsupported table offset or length")
 	errUnsupportedType2Charstring      = errors.New("sfnt: unsupported Type 2 Charstring")
 )

 // GlyphIndex is a glyph index in a Font.
 type GlyphIndex uint16

 // NameID identifies a name table entry.
 //
 // See the "Name IDs" section of
 // https://www.microsoft.com/typography/otspec/name.htm
 type NameID uint16

 const (
 	NameIDCopyright                  NameID = 0
 	NameIDFamily                            = 1
 	NameIDSubfamily                         = 2
 	NameIDUniqueIdentifier                  = 3
 	NameIDFull                              = 4
 	NameIDVersion                           = 5
 	NameIDPostScript                        = 6
 	NameIDTrademark                         = 7
 	NameIDManufacturer                      = 8
 	NameIDDesigner                          = 9
 	NameIDDescription                       = 10
 	NameIDVendorURL                         = 11
 	NameIDDesignerURL                       = 12
 	NameIDLicense                           = 13
 	NameIDLicenseURL                        = 14
 	NameIDTypographicFamily                 = 16
 	NameIDTypographicSubfamily              = 17
 	NameIDCompatibleFull                    = 18
 	NameIDSampleText                        = 19
 	NameIDPostScriptCID                     = 20
 	NameIDWWSFamily                         = 21
 	NameIDWWSSubfamily                      = 22
 	NameIDLightBackgroundPalette            = 23
 	NameIDDarkBackgroundPalette             = 24
 	NameIDVariationsPostScriptPrefix        = 25
 )

 // Units are an integral number of abstract, scalable "font units". The em
 // square is typically 1000 or 2048 "font units". This would map to a certain
 // number (e.g. 30 pixels) of physical pixels, depending on things like the
 // display resolution (DPI) and font size (e.g. a 12 point font).
 type Units int32

 // scale returns x divided by unitsPerEm, rounded to the nearest fixed.Int26_6
 // value (1/64th of a pixel).
 func scale(x fixed.Int26_6, unitsPerEm Units) fixed.Int26_6 {
 	if x >= 0 {
 		x += fixed.Int26_6(unitsPerEm) / 2
 	} else {
 		x -= fixed.Int26_6(unitsPerEm) / 2
 	}
 	return x / fixed.Int26_6(unitsPerEm)
 }

 func u16(b []byte) uint16 {
 	_ = b[1] // Bounds check hint to compiler.
 	return uint16(b[0])<<8 | uint16(b[1])<<0
 }

 func u32(b []byte) uint32 {
 	_ = b[3] // Bounds check hint to compiler.
 	return uint32(b[0])<<24 | uint32(b[1])<<16 | uint32(b[2])<<8 | uint32(b[3])<<0
 }

 // source is a source of byte data. Conceptually, it is like an io.ReaderAt,
 // except that a common source of SFNT font data is in-memory instead of
 // on-disk: a []byte containing the entire data, either as a global variable
 // (e.g. "goregular.TTF") or the result of an ioutil.ReadFile call. In such
 // cases, as an optimization, we skip the io.Reader / io.ReaderAt model of
 // copying from the source to a caller-supplied buffer, and instead provide
 // direct access to the underlying []byte data.
 type source struct {
 	b []byte
 	r io.ReaderAt

 	// TODO: add a caching layer, if we're using the io.ReaderAt? Note that
 	// this might make a source no longer safe to use concurrently.
 }

 // valid returns whether exactly one of s.b and s.r is nil.
 func (s *source) valid() bool {
 	return (s.b == nil) != (s.r == nil)
 }

 // viewBufferWritable returns whether the []byte returned by source.view can be
 // written to by the caller, including by passing it to the same method
 // (source.view) on other receivers (i.e. different sources).
 //
 // In other words, it returns whether the source's underlying data is an
 // io.ReaderAt, not a []byte.
 func (s *source) viewBufferWritable() bool {
 	return s.b == nil
 }

 // view returns the length bytes at the given offset. buf is an optional
 // scratch buffer to reduce allocations when calling view multiple times. A nil
 // buf is valid. The []byte returned may be a sub-slice of buf[:cap(buf)], or
 // it may be an unrelated slice. In any case, the caller should not modify the
 // contents of the returned []byte, other than passing that []byte back to this
 // method on the same source s.
 func (s *source) view(buf []byte, offset, length int) ([]byte, error) {
 	if 0 > offset || offset > offset+length {
 		return nil, errInvalidBounds
 	}

 	// Try reading from the []byte.
 	if s.b != nil {
 		if offset+length > len(s.b) {
 			return nil, errInvalidBounds
 		}
 		return s.b[offset : offset+length], nil
 	}

 	// Read from the io.ReaderAt.
 	if length <= cap(buf) {
 		buf = buf[:length]
 	} else {
 		// Round length up to the nearest KiB. The slack can lead to fewer
 		// allocations if the buffer is re-used for multiple source.view calls.
 		n := length
 		n += 1023
 		n &^= 1023
 		buf = make([]byte, length, n)
 	}
 	if n, err := s.r.ReadAt(buf, int64(offset)); n != length {
 		return nil, err
 	}
 	return buf, nil
 }

 // u16 returns the uint16 in the table t at the relative offset i.
 //
 // buf is an optional scratch buffer as per the source.view method.
 func (s *source) u16(buf []byte, t table, i int) (uint16, error) {
 	if i < 0 || uint(t.length) < uint(i+2) {
 		return 0, errInvalidBounds
 	}
 	buf, err := s.view(buf, int(t.offset)+i, 2)
 	if err != nil {
 		return 0, err
 	}
 	return u16(buf), nil
 }

 // u32 returns the uint32 in the table t at the relative offset i.
 //
 // buf is an optional scratch buffer as per the source.view method.
 func (s *source) u32(buf []byte, t table, i int) (uint32, error) {
 	if i < 0 || uint(t.length) < uint(i+4) {
 		return 0, errInvalidBounds
 	}
 	buf, err := s.view(buf, int(t.offset)+i, 4)
 	if err != nil {
 		return 0, err
 	}
 	return u32(buf), nil
 }

 // table is a section of the font data.
 type table struct {
 	offset, length uint32
 }

 // ParseCollection parses an SFNT font collection, such as TTC or OTC data,
 // from a []byte data source.
 //
 // If passed data for a single font, a TTF or OTF instead of a TTC or OTC, it
 // will return a collection containing 1 font.
 func ParseCollection(src []byte) (*Collection, error) {
 	c := &Collection{src: source{b: src}}
 	if err := c.initialize(); err != nil {
 		return nil, err
 	}
 	return c, nil
 }

 // ParseCollectionReaderAt parses an SFNT collection, such as TTC or OTC data,
 // from an io.ReaderAt data source.
 //
 // If passed data for a single font, a TTF or OTF instead of a TTC or OTC, it
 // will return a collection containing 1 font.
 func ParseCollectionReaderAt(src io.ReaderAt) (*Collection, error) {
 	c := &Collection{src: source{r: src}}
 	if err := c.initialize(); err != nil {
 		return nil, err
 	}
 	return c, nil
 }

 // Collection is a collection of one or more fonts.
 //
 // All of the Collection methods are safe to call concurrently.
 type Collection struct {
 	src     source
 	offsets []uint32
 }

 // NumFonts returns the number of fonts in the collection.
 func (c *Collection) NumFonts() int { return len(c.offsets) }

 func (c *Collection) initialize() error {
 	// The https://www.microsoft.com/typography/otspec/otff.htm "Font
 	// Collections" section describes the TTC Header.
 	buf, err := c.src.view(nil, 0, 12)
 	if err != nil {
 		return err
 	}
 	// These cases match the switch statement in Font.initializeTables.
 	switch u32(buf) {
 	default:
 		return errInvalidFontCollection
 	case 0x00010000, 0x4f54544f:
 		// Try parsing it as a single font instead of a collection.
 		c.offsets = []uint32{0}
 	case 0x74746366: // "ttcf".
 		numFonts := u32(buf[8:])
 		if numFonts == 0 || numFonts > maxNumFonts {
 			return errUnsupportedNumberOfFonts
 		}
 		buf, err = c.src.view(nil, 12, int(4*numFonts))
 		if err != nil {
 			return err
 		}
 		c.offsets = make([]uint32, numFonts)
 		for i := range c.offsets {
 			o := u32(buf[4*i:])
 			if o > maxTableOffset {
 				return errUnsupportedTableOffsetLength
 			}
 			c.offsets[i] = o
 		}
 	}
 	return nil
 }

 // Font returns the i'th font in the collection.
 func (c *Collection) Font(i int) (*Font, error) {
 	if i < 0 || len(c.offsets) <= i {
 		return nil, ErrNotFound
 	}
 	f := &Font{src: c.src}
 	if err := f.initialize(int(c.offsets[i])); err != nil {
 		return nil, err
 	}
 	return f, nil
 }

 // Parse parses an SFNT font, such as TTF or OTF data, from a []byte data
 // source.
 func Parse(src []byte) (*Font, error) {
 	f := &Font{src: source{b: src}}
 	if err := f.initialize(0); err != nil {
 		return nil, err
 	}
 	return f, nil
 }

 // ParseReaderAt parses an SFNT font, such as TTF or OTF data, from an
 // io.ReaderAt data source.
 func ParseReaderAt(src io.ReaderAt) (*Font, error) {
 	f := &Font{src: source{r: src}}
 	if err := f.initialize(0); err != nil {
 		return nil, err
 	}
 	return f, nil
 }

 // Font is an SFNT font.
 //
 // Many of its methods take a *Buffer argument, as re-using buffers can reduce
 // the total memory allocation of repeated Font method calls, such as measuring
 // and rasterizing every unique glyph in a string of text. If efficiency is not
 // a concern, passing a nil *Buffer is valid, and implies using a temporary
 // buffer for a single call.
 //
 // It is valid to re-use a *Buffer with multiple Font method calls, even with
 // different *Font receivers, as long as they are not concurrent calls.
 //
 // All of the Font methods are safe to call concurrently, as long as each call
 // has a different *Buffer (or nil).
 //
 // The Font methods that don't take a *Buffer argument are always safe to call
 // concurrently.
 //
 // Some methods provide lengths or coordinates, e.g. bounds, font metrics and
 // control points. All of these methods take a ppem parameter, which is the
 // number of pixels in 1 em, expressed as a 26.6 fixed point value. For
 // example, if 1 em is 10 pixels then ppem is fixed.I(10), which equals
 // fixed.Int26_6(10 << 6).
 //
 // To get those lengths or coordinates in terms of font units instead of
 // pixels, use ppem = fixed.Int26_6(f.UnitsPerEm()) and if those methods take a
 // font.Hinting parameter, use font.HintingNone. The return values will have
 // type fixed.Int26_6, but those numbers can be converted back to Units with no
 // further scaling necessary.
 type Font struct {
 	src source

 	// https://www.microsoft.com/typography/otspec/otff.htm#otttables
 	// "Required Tables".
 	cmap table
 	head table
 	hhea table
 	hmtx table
 	maxp table
 	name table
 	os2  table
 	post table

 	// https://www.microsoft.com/typography/otspec/otff.htm#otttables
 	// "Tables Related to TrueType Outlines".
 	//
 	// This implementation does not support hinting, so it does not read the
 	// cvt, fpgm gasp or prep tables.
 	glyf table
 	loca table

 	// https://www.microsoft.com/typography/otspec/otff.htm#otttables
 	// "Tables Related to PostScript Outlines".
 	//
 	// TODO: cff2, vorg?
 	cff table

 	// https://www.microsoft.com/typography/otspec/otff.htm#otttables
 	// "Advanced Typographic Tables".
 	//
 	// TODO: base, gdef, gpos, gsub, jstf, math?

 	// https://www.microsoft.com/typography/otspec/otff.htm#otttables
 	// "Other OpenType Tables".
 	//
 	// TODO: hdmx, vmtx? Others?
 	kern table

 	cached struct {
 		glyphIndex       glyphIndexFunc
 		indexToLocFormat bool // false means short, true means long.
 		isPostScript     bool
 		kernNumPairs     int32
 		kernOffset       int32
 		postTableVersion uint32
 		unitsPerEm       Units

 		// The glyph data for the glyph index i is in
 		// src[locations[i+0]:locations[i+1]].
 		locations []uint32
 	}
 }

 // NumGlyphs returns the number of glyphs in f.
 func (f *Font) NumGlyphs() int { return len(f.cached.locations) - 1 }

 // UnitsPerEm returns the number of units per em for f.
 func (f *Font) UnitsPerEm() Units { return f.cached.unitsPerEm }

 func (f *Font) initialize(offset int) error {
 	if !f.src.valid() {
 		return errInvalidSourceData
 	}
 	buf, isPostScript, err := f.initializeTables(offset)
 	if err != nil {
 		return err
 	}

 	// The order of these parseXxx calls matters. Later calls may depend on
 	// information parsed by earlier calls, such as the maxp table's numGlyphs.
 	// To enforce these dependencies, such information is passed and returned
 	// explicitly, and the f.cached fields are only set afterwards.
 	//
 	// When implementing new parseXxx methods, take care not to call methods
 	// such as Font.NumGlyphs that implicitly depend on f.cached fields.

 	buf, indexToLocFormat, unitsPerEm, err := f.parseHead(buf)
 	if err != nil {
 		return err
 	}
 	buf, numGlyphs, locations, err := f.parseMaxp(buf, indexToLocFormat, isPostScript)
 	if err != nil {
 		return err
 	}
 	buf, glyphIndex, err := f.parseCmap(buf)
 	if err != nil {
 		return err
 	}
 	buf, kernNumPairs, kernOffset, err := f.parseKern(buf)
 	if err != nil {
 		return err
 	}
 	buf, postTableVersion, err := f.parsePost(buf, numGlyphs)
 	if err != nil {
 		return err
 	}

 	f.cached.glyphIndex = glyphIndex
 	f.cached.indexToLocFormat = indexToLocFormat
 	f.cached.isPostScript = isPostScript
 	f.cached.kernNumPairs = kernNumPairs
 	f.cached.kernOffset = kernOffset
 	f.cached.postTableVersion = postTableVersion
 	f.cached.unitsPerEm = unitsPerEm
 	f.cached.locations = locations

 	return nil
 }

 func (f *Font) initializeTables(offset int) (buf1 []byte, isPostScript bool, err error) {
 	// https://www.microsoft.com/typography/otspec/otff.htm "Organization of an
 	// OpenType Font" says that "The OpenType font starts with the Offset
 	// Table", which is 12 bytes.
 	buf, err := f.src.view(nil, offset, 12)
 	if err != nil {
 		return nil, false, err
 	}
 	// When updating the cases in this switch statement, also update the
 	// Collection.initialize method.
 	switch u32(buf) {
 	default:
 		return nil, false, errInvalidFont
 	case 0x00010000:
 		// No-op.
 	case 0x4f54544f: // "OTTO".
 		isPostScript = true
 	case 0x74746366: // "ttcf".
 		return nil, false, errInvalidSingleFont
 	}
 	numTables := int(u16(buf[4:]))
 	if numTables > maxNumTables {
 		return nil, false, errUnsupportedNumberOfTables
 	}

 	// "The Offset Table is followed immediately by the Table Record entries...
 	// sorted in ascending order by tag", 16 bytes each.
 	buf, err = f.src.view(buf, offset+12, 16*numTables)
 	if err != nil {
 		return nil, false, err
 	}
 	for b, first, prevTag := buf, true, uint32(0); len(b) > 0; b = b[16:] {
 		tag := u32(b)
 		if first {
 			first = false
 		} else if tag <= prevTag {
 			return nil, false, errInvalidTableTagOrder
 		}
 		prevTag = tag

 		o, n := u32(b[8:12]), u32(b[12:16])
 		if o > maxTableOffset || n > maxTableLength {
 			return nil, false, errUnsupportedTableOffsetLength
 		}
 		// We ignore the checksums, but "all tables must begin on four byte
 		// boundries [sic]".
 		if o&3 != 0 {
 			return nil, false, errInvalidTableOffset
 		}

 		// Match the 4-byte tag as a uint32. For example, "OS/2" is 0x4f532f32.
 		switch tag {
 		case 0x43464620:
 			f.cff = table{o, n}
 		case 0x4f532f32:
 			f.os2 = table{o, n}
 		case 0x636d6170:
 			f.cmap = table{o, n}
 		case 0x676c7966:
 			f.glyf = table{o, n}
 		case 0x68656164:
 			f.head = table{o, n}
 		case 0x68686561:
 			f.hhea = table{o, n}
 		case 0x686d7478:
 			f.hmtx = table{o, n}
 		case 0x6b65726e:
 			f.kern = table{o, n}
 		case 0x6c6f6361:
 			f.loca = table{o, n}
 		case 0x6d617870:
 			f.maxp = table{o, n}
 		case 0x6e616d65:
 			f.name = table{o, n}
 		case 0x706f7374:
 			f.post = table{o, n}
 		}
 	}
 	return buf, isPostScript, nil
 }

 func (f *Font) parseCmap(buf []byte) (buf1 []byte, glyphIndex glyphIndexFunc, err error) {
 	// https://www.microsoft.com/typography/OTSPEC/cmap.htm

 	const headerSize, entrySize = 4, 8
 	if f.cmap.length < headerSize {
 		return nil, nil, errInvalidCmapTable
 	}
 	u, err := f.src.u16(buf, f.cmap, 2)
 	if err != nil {
 		return nil, nil, err
 	}
 	numSubtables := int(u)
 	if f.cmap.length < headerSize+entrySize*uint32(numSubtables) {
 		return nil, nil, errInvalidCmapTable
 	}

 	var (
 		bestWidth  int
 		bestOffset uint32
 		bestLength uint32
 		bestFormat uint16
 	)

 	// Scan all of the subtables, picking the widest supported one. See the
 	// platformEncodingWidth comment for more discussion of width.
 	for i := 0; i < numSubtables; i++ {
 		buf, err = f.src.view(buf, int(f.cmap.offset)+headerSize+entrySize*i, entrySize)
 		if err != nil {
 			return nil, nil, err
 		}
 		pid := u16(buf)
 		psid := u16(buf[2:])
 		width := platformEncodingWidth(pid, psid)
 		if width <= bestWidth {
 			continue
 		}
 		offset := u32(buf[4:])

 		if offset > f.cmap.length-4 {
 			return nil, nil, errInvalidCmapTable
 		}
 		buf, err = f.src.view(buf, int(f.cmap.offset+offset), 4)
 		if err != nil {
 			return nil, nil, err
 		}
 		format := u16(buf)
 		if !supportedCmapFormat(format, pid, psid) {
 			continue
 		}
 		length := uint32(u16(buf[2:]))

 		bestWidth = width
 		bestOffset = offset
 		bestLength = length
 		bestFormat = format
 	}

 	if bestWidth == 0 {
 		return nil, nil, errUnsupportedCmapEncodings
 	}
 	return f.makeCachedGlyphIndex(buf, bestOffset, bestLength, bestFormat)
 }

 func (f *Font) parseHead(buf []byte) (buf1 []byte, indexToLocFormat bool, unitsPerEm Units, err error) {
 	// https://www.microsoft.com/typography/otspec/head.htm

 	if f.head.length != 54 {
 		return nil, false, 0, errInvalidHeadTable
 	}
 	u, err := f.src.u16(buf, f.head, 18)
 	if err != nil {
 		return nil, false, 0, err
 	}
 	if u == 0 {
 		return nil, false, 0, errInvalidHeadTable
 	}
 	unitsPerEm = Units(u)
 	u, err = f.src.u16(buf, f.head, 50)
 	if err != nil {
 		return nil, false, 0, err
 	}
 	indexToLocFormat = u != 0
 	return buf, indexToLocFormat, unitsPerEm, nil
 }

 func (f *Font) parseKern(buf []byte) (buf1 []byte, kernNumPairs, kernOffset int32, err error) {
 	// https://www.microsoft.com/typography/otspec/kern.htm

 	if f.kern.length == 0 {
 		return buf, 0, 0, nil
 	}
 	const headerSize = 4
 	if f.kern.length < headerSize {
 		return nil, 0, 0, errInvalidKernTable
 	}
 	buf, err = f.src.view(buf, int(f.kern.offset), headerSize)
 	if err != nil {
 		return nil, 0, 0, err
 	}
 	offset := int(f.kern.offset) + headerSize
 	length := int(f.kern.length) - headerSize

 	switch version := u16(buf); version {
 	case 0:
 		// TODO: support numTables != 1. Testing that requires finding such a font.
 		if numTables := int(u16(buf[2:])); numTables != 1 {
 			return nil, 0, 0, errUnsupportedKernTable
 		}
 		return f.parseKernVersion0(buf, offset, length)
 	case 1:
 		if buf[2] != 0 || buf[3] != 0 {
 			return nil, 0, 0, errUnsupportedKernTable
 		}
 		// Microsoft's https://www.microsoft.com/typography/otspec/kern.htm
 		// says that "Apple has extended the definition of the 'kern' table to
 		// provide additional functionality. The Apple extensions are not
 		// supported on Windows."
 		//
 		// The format is relatively complicated, including encoding a state
 		// machine, but rarely seen. We follow Microsoft's and FreeType's
 		// behavior and simply ignore it. Theoretically, we could follow
 		// https://developer.apple.com/fonts/TrueType-Reference-Manual/RM06/Chap6kern.html
 		// but it doesn't seem worth the effort.
 		return buf, 0, 0, nil
 	}
 	return nil, 0, 0, errUnsupportedKernTable
 }

 func (f *Font) parseKernVersion0(buf []byte, offset, length int) (buf1 []byte, kernNumPairs, kernOffset int32, err error) {
 	const headerSize = 6
 	if length < headerSize {
 		return nil, 0, 0, errInvalidKernTable
 	}
 	buf, err = f.src.view(buf, offset, headerSize)
 	if err != nil {
 		return nil, 0, 0, err
 	}
 	if version := u16(buf); version != 0 {
 		return nil, 0, 0, errUnsupportedKernTable
 	}
 	subtableLength := int(u16(buf[2:]))
 	if subtableLength < headerSize || length < subtableLength {
 		return nil, 0, 0, errInvalidKernTable
 	}
 	if coverageBits := buf[5]; coverageBits != 0x01 {
 		// We only support horizontal kerning.
 		return nil, 0, 0, errUnsupportedKernTable
 	}
 	offset += headerSize
 	length -= headerSize
 	subtableLength -= headerSize

 	switch format := buf[4]; format {
 	case 0:
 		return f.parseKernFormat0(buf, offset, subtableLength)
 	case 2:
 		// If we could find such a font, we could write code to support it, but
 		// a comment in the equivalent FreeType code (sfnt/ttkern.c) says that
 		// they've never seen such a font.
 	}
 	return nil, 0, 0, errUnsupportedKernTable
 }

 func (f *Font) parseKernFormat0(buf []byte, offset, length int) (buf1 []byte, kernNumPairs, kernOffset int32, err error) {
 	const headerSize, entrySize = 8, 6
 	if length < headerSize {
 		return nil, 0, 0, errInvalidKernTable
 	}
 	buf, err = f.src.view(buf, offset, headerSize)
 	if err != nil {
 		return nil, 0, 0, err
 	}
 	kernNumPairs = int32(u16(buf))
 	if length != headerSize+entrySize*int(kernNumPairs) {
 		return nil, 0, 0, errInvalidKernTable
 	}
 	return buf, kernNumPairs, int32(offset) + headerSize, nil
 }

 func (f *Font) parseMaxp(buf []byte, indexToLocFormat, isPostScript bool) (buf1 []byte, numGlyphs int, locations []uint32, err error) {
 	// https://www.microsoft.com/typography/otspec/maxp.htm

 	if isPostScript {
 		if f.maxp.length != 6 {
 			return nil, 0, nil, errInvalidMaxpTable
 		}
 	} else {
 		if f.maxp.length != 32 {
 			return nil, 0, nil, errInvalidMaxpTable
 		}
 	}
 	u, err := f.src.u16(buf, f.maxp, 4)
 	if err != nil {
 		return nil, 0, nil, err
 	}
 	numGlyphs = int(u)

 	if isPostScript {
 		p := cffParser{
 			src:    &f.src,
 			base:   int(f.cff.offset),
 			offset: int(f.cff.offset),
 			end:    int(f.cff.offset + f.cff.length),
 		}
 		locations, err = p.parse()
 		if err != nil {
 			return nil, 0, nil, err
 		}
 	} else {
 		locations, err = parseLoca(&f.src, f.loca, f.glyf.offset, indexToLocFormat, numGlyphs)
 		if err != nil {
 			return nil, 0, nil, err
 		}
 	}
 	if len(locations) != numGlyphs+1 {
 		return nil, 0, nil, errInvalidLocationData
 	}

 	return buf, numGlyphs, locations, nil
 }

 func (f *Font) parsePost(buf []byte, numGlyphs int) (buf1 []byte, postTableVersion uint32, err error) {
 	// https://www.microsoft.com/typography/otspec/post.htm

 	const headerSize = 32
 	if f.post.length < headerSize {
 		return nil, 0, errInvalidPostTable
 	}
 	u, err := f.src.u32(buf, f.post, 0)
 	if err != nil {
 		return nil, 0, err
 	}
 	switch u {
 	case 0x20000:
 		if f.post.length < headerSize+2+2*uint32(numGlyphs) {
 			return nil, 0, errInvalidPostTable
 		}
 	case 0x30000:
 		// No-op.
 	default:
 		return nil, 0, errUnsupportedPostTable
 	}
 	return buf, u, nil
 }

 // TODO: API for looking up glyph variants?? For example, some fonts may
 // provide both slashed and dotted zero glyphs ('0'), or regular and 'old
 // style' numerals, and users can direct software to choose a variant.

 type glyphIndexFunc func(f *Font, b *Buffer, r rune) (GlyphIndex, error)

 // GlyphIndex returns the glyph index for the given rune.
 //
 // It returns (0, nil) if there is no glyph for r.
 // https://www.microsoft.com/typography/OTSPEC/cmap.htm says that "Character
 // codes that do not correspond to any glyph in the font should be mapped to
 // glyph index 0. The glyph at this location must be a special glyph
 // representing a missing character, commonly known as .notdef."
 func (f *Font) GlyphIndex(b *Buffer, r rune) (GlyphIndex, error) {
 	return f.cached.glyphIndex(f, b, r)
 }

 func (f *Font) viewGlyphData(b *Buffer, x GlyphIndex) ([]byte, error) {
 	xx := int(x)
 	if f.NumGlyphs() <= xx {
 		return nil, ErrNotFound
 	}
 	i := f.cached.locations[xx+0]
 	j := f.cached.locations[xx+1]
 	if j-i > maxGlyphDataLength {
 		return nil, errUnsupportedGlyphDataLength
 	}
 	return b.view(&f.src, int(i), int(j-i))
 }

 // LoadGlyphOptions are the options to the Font.LoadGlyph method.
 type LoadGlyphOptions struct {
 	// TODO: transform / hinting.
 }

 // LoadGlyph returns the vector segments for the x'th glyph. ppem is the number
 // of pixels in 1 em.
 //
 // If b is non-nil, the segments become invalid to use once b is re-used.
 //
 // It returns ErrNotFound if the glyph index is out of range.
 func (f *Font) LoadGlyph(b *Buffer, x GlyphIndex, ppem fixed.Int26_6, opts *LoadGlyphOptions) ([]Segment, error) {
 	if b == nil {
 		b = &Buffer{}
 	}

 	b.segments = b.segments[:0]
 	if f.cached.isPostScript {
 		buf, err := f.viewGlyphData(b, x)
 		if err != nil {
 			return nil, err
 		}
 		b.psi.type2Charstrings.initialize(b.segments)
 		if err := b.psi.run(psContextType2Charstring, buf); err != nil {
 			return nil, err
 		}
 		b.segments = b.psi.type2Charstrings.segments
 	} else {
 		if err := loadGlyf(f, b, x, 0, 0); err != nil {
 			return nil, err
 		}
 	}

 	// Scale the segments. If we want to support hinting, we'll have to push
 	// the scaling computation into the PostScript / TrueType specific glyph
 	// loading code, such as the appendGlyfSegments body, since TrueType
 	// hinting bytecode works on the scaled glyph vectors. For now, though,
 	// it's simpler to scale as a post-processing step.
 	for i := range b.segments {
 		s := &b.segments[i]
 		for j := range s.Args {
 			s.Args[j] = scale(s.Args[j]*ppem, f.cached.unitsPerEm)
 		}
 	}

 	// TODO: look at opts to transform / hint the Buffer.segments.

 	return b.segments, nil
 }

 // GlyphName returns the name of the x'th glyph.
 //
 // Not every font contains glyph names. If not present, GlyphName will return
 // ("", nil).
 //
 // If present, the glyph name, provided by the font, is assumed to follow the
 // Adobe Glyph List Specification:
 // https://github.com/adobe-type-tools/agl-specification/blob/master/README.md
 //
 // This is also known as the "Adobe Glyph Naming convention", the "Adobe
 // document [for] Unicode and Glyph Names" or "PostScript glyph names".
 //
 // It returns ErrNotFound if the glyph index is out of range.
 func (f *Font) GlyphName(b *Buffer, x GlyphIndex) (string, error) {
 	if int(x) >= f.NumGlyphs() {
 		return "", ErrNotFound
 	}
 	if f.cached.postTableVersion != 0x20000 {
 		return "", nil
 	}
 	if b == nil {
 		b = &Buffer{}
 	}

 	// The wire format for a Version 2 post table is documented at:
 	// https://www.microsoft.com/typography/otspec/post.htm
 	const glyphNameIndexOffset = 34

 	buf, err := b.view(&f.src, int(f.post.offset)+glyphNameIndexOffset+2*int(x), 2)
 	if err != nil {
 		return "", err
 	}
 	u := u16(buf)
 	if u < numBuiltInPostNames {
 		i := builtInPostNamesOffsets[u+0]
 		j := builtInPostNamesOffsets[u+1]
 		return builtInPostNamesData[i:j], nil
 	}
 	// https://developer.apple.com/fonts/TrueType-Reference-Manual/RM06/Chap6post.html
 	// says that "32768 through 65535 are reserved for future use".
 	if u > 32767 {
 		return "", errUnsupportedPostTable
 	}
 	u -= numBuiltInPostNames

 	// Iterate through the list of Pascal-formatted strings. A linear scan is
 	// clearly O(u), which isn't great (as the obvious loop, calling
 	// Font.GlyphName, to get all of the glyph names in a font has quadratic
 	// complexity), but the wire format doesn't suggest a better alternative.

 	offset := glyphNameIndexOffset + 2*f.NumGlyphs()
 	buf, err = b.view(&f.src, int(f.post.offset)+offset, int(f.post.length)-offset)
 	if err != nil {
 		return "", err
 	}

 	for {
 		if len(buf) == 0 {
 			return "", errInvalidPostTable
 		}
 		n := 1 + int(buf[0])
 		if len(buf) < n {
 			return "", errInvalidPostTable
 		}
 		if u == 0 {
 			return string(buf[1:n]), nil
 		}
 		buf = buf[n:]
 		u--
 	}
 }

 // Kern returns the horizontal adjustment for the kerning pair (x0, x1). A
 // positive kern means to move the glyphs further apart. ppem is the number of
 // pixels in 1 em.
 //
 // It returns ErrNotFound if either glyph index is out of range.
 func (f *Font) Kern(b *Buffer, x0, x1 GlyphIndex, ppem fixed.Int26_6, h font.Hinting) (fixed.Int26_6, error) {
 	// TODO: how should this work with the GPOS table and CFF fonts?
 	// https://www.microsoft.com/typography/otspec/kern.htm says that
 	// "OpenType™ fonts containing CFF outlines are not supported by the 'kern'
 	// table and must use the 'GPOS' OpenType Layout table."

 	if n := f.NumGlyphs(); int(x0) >= n || int(x1) >= n {
 		return 0, ErrNotFound
 	}
 	// Not every font has a kern table. If it doesn't, or if that table is
 	// ignored, there's no need to allocate a Buffer.
 	if f.cached.kernNumPairs == 0 {
 		return 0, nil
 	}
 	if b == nil {
 		b = &Buffer{}
 	}

 	key := uint32(x0)<<16 | uint32(x1)
 	lo, hi := int32(0), f.cached.kernNumPairs
 	for lo < hi {
 		i := (lo + hi) / 2

 		// TODO: this view call inside the inner loop can lead to many small
 		// reads instead of fewer larger reads, which can be expensive. We
 		// should be able to do better, although we don't want to make (one)
 		// arbitrarily large read. Perhaps we should round up reads to 4K or 8K
 		// chunks. For reference, Arial.ttf's kern table is 5472 bytes.
 		// Times_New_Roman.ttf's kern table is 5220 bytes.
 		const entrySize = 6
 		buf, err := b.view(&f.src, int(f.cached.kernOffset+i*entrySize), entrySize)
 		if err != nil {
 			return 0, err
 		}

 		k := u32(buf)
 		if k < key {
 			lo = i + 1
 		} else if k > key {
 			hi = i
 		} else {
 			kern := fixed.Int26_6(int16(u16(buf[4:])))
 			kern = scale(kern*ppem, f.cached.unitsPerEm)
 			if h == font.HintingFull {
 				// Quantize the fixed.Int26_6 value to the nearest pixel.
 				kern = (kern + 32) &^ 63
 			}
 			return kern, nil
 		}
 	}
 	return 0, nil
 }

 // Name returns the name value keyed by the given NameID.
 //
 // It returns ErrNotFound if there is no value for that key.
 func (f *Font) Name(b *Buffer, id NameID) (string, error) {
 	if b == nil {
 		b = &Buffer{}
 	}

 	const headerSize, entrySize = 6, 12
 	if f.name.length < headerSize {
 		return "", errInvalidNameTable
 	}
 	buf, err := b.view(&f.src, int(f.name.offset), headerSize)
 	if err != nil {
 		return "", err
 	}
 	numSubtables := u16(buf[2:])
 	if f.name.length < headerSize+entrySize*uint32(numSubtables) {
 		return "", errInvalidNameTable
 	}
 	stringOffset := u16(buf[4:])

 	seen := false
 	for i, n := 0, int(numSubtables); i < n; i++ {
 		buf, err := b.view(&f.src, int(f.name.offset)+headerSize+entrySize*i, entrySize)
 		if err != nil {
 			return "", err
 		}
 		if u16(buf[6:]) != uint16(id) {
 			continue
 		}
 		seen = true

 		var stringify func([]byte) (string, error)
 		switch u32(buf) {
 		default:
 			continue
 		case pidMacintosh<<16 | psidMacintoshRoman:
 			stringify = stringifyMacintosh
 		case pidWindows<<16 | psidWindowsUCS2:
 			stringify = stringifyUCS2
 		}

 		nameLength := u16(buf[8:])
 		nameOffset := u16(buf[10:])
 		buf, err = b.view(&f.src, int(f.name.offset)+int(nameOffset)+int(stringOffset), int(nameLength))
 		if err != nil {
 			return "", err
 		}
 		return stringify(buf)
 	}

 	if seen {
 		return "", errUnsupportedPlatformEncoding
 	}
 	return "", ErrNotFound
 }

 func stringifyMacintosh(b []byte) (string, error) {
 	for _, c := range b {
 		if c >= 0x80 {
 			// b contains some non-ASCII bytes.
 			s, _ := charmap.Macintosh.NewDecoder().Bytes(b)
 			return string(s), nil
 		}
 	}
 	// b contains only ASCII bytes.
 	return string(b), nil
 }

 func stringifyUCS2(b []byte) (string, error) {
 	if len(b)&1 != 0 {
 		return "", errInvalidUCS2String
 	}
 	r := make([]rune, len(b)/2)
 	for i := range r {
 		r[i] = rune(u16(b))
 		b = b[2:]
 	}
 	return string(r), nil
 }

 // Buffer holds re-usable buffers that can reduce the total memory allocation
 // of repeated Font method calls.
 //
 // See the Font type's documentation comment for more details.
 type Buffer struct {
 	// buf is a byte buffer for when a Font's source is an io.ReaderAt.
 	buf []byte
 	// segments holds glyph vector path segments.
 	segments []Segment
 	// compoundStack holds the components of a TrueType compound glyph.
 	compoundStack [maxCompoundStackSize]struct {
 		glyphIndex   GlyphIndex
 		dx, dy       int16
 		hasTransform bool
 		transformXX  int16
 		transformXY  int16
 		transformYX  int16
 		transformYY  int16
 	}
 	// psi is a PostScript interpreter for when the Font is an OpenType/CFF
 	// font.
 	psi psInterpreter
 }

 func (b *Buffer) view(src *source, offset, length int) ([]byte, error) {
 	buf, err := src.view(b.buf, offset, length)
 	if err != nil {
 		return nil, err
 	}
 	// Only update b.buf if it is safe to re-use buf.
 	if src.viewBufferWritable() {
 		b.buf = buf
 	}
 	return buf, nil
 }

 // Segment is a segment of a vector path.
 type Segment struct {
 	Op   SegmentOp
 	Args [6]fixed.Int26_6
 }

 // SegmentOp is a vector path segment's operator.
 type SegmentOp uint32

 const (
 	SegmentOpMoveTo SegmentOp = iota
 	SegmentOpLineTo
 	SegmentOpQuadTo
 	SegmentOpCubeTo
 )

 // translateArgs applies a translation to args.
 func translateArgs(args *[6]fixed.Int26_6, dx, dy fixed.Int26_6) {
 	args[0] += dx
 	args[1] += dy
 	args[2] += dx
 	args[3] += dy
 	args[4] += dx
 	args[5] += dy
 }

 // transformArgs applies an affine transformation to args. The t?? arguments
 // are 2.14 fixed point values.
 func transformArgs(args *[6]fixed.Int26_6, txx, txy, tyx, tyy int16, dx, dy fixed.Int26_6) {
 	args[0], args[1] = tform(txx, txy, tyx, tyy, dx, dy, args[0], args[1])
 	args[2], args[3] = tform(txx, txy, tyx, tyy, dx, dy, args[2], args[3])
 	args[4], args[5] = tform(txx, txy, tyx, tyy, dx, dy, args[4], args[5])
 }

 func tform(txx, txy, tyx, tyy int16, dx, dy, x, y fixed.Int26_6) (newX, newY fixed.Int26_6) {
 	const half = 1 << 13
 	newX = dx +
 		fixed.Int26_6((int64(x)*int64(txx)+half)>>14) +
 		fixed.Int26_6((int64(y)*int64(tyx)+half)>>14)
 	newY = dy +
 		fixed.Int26_6((int64(x)*int64(txy)+half)>>14) +
 		fixed.Int26_6((int64(y)*int64(tyy)+half)>>14)
 	return newX, newY
 }