unipdf/pdf/model/font_test.go

package model_test

import (
	"errors"
	"fmt"
	"io"
	"io/ioutil"
	"testing"

	"github.com/unidoc/unidoc/common"
	"github.com/unidoc/unidoc/pdf/core"
	"github.com/unidoc/unidoc/pdf/model"
	"github.com/unidoc/unidoc/pdf/model/fonts"
)

func init() {
	// common.SetLogger(common.NewConsoleLogger(common.LogLevelDebug))
}

var simpleFontDicts = []string{
	`<< /Type /Font
		/BaseFont /Helvetica
		/Subtype /Type1
		/Encoding /WinAnsiEncoding
		>>`,
	`<< /Type /Font
		/BaseFont /Helvetica-Oblique
		/Subtype /Type1
		/Encoding /WinAnsiEncoding
		>>`,
	`<< /Type /Font
		/Subtype /Type1
		/FirstChar 71
		/LastChar 79
		/Widths [ 778 722 278 500 667 556 833 722 778 ]
		/Encoding /WinAnsiEncoding
		/BaseFont /AOMFKK+Helvetica
		>>`,
	`<< /Type /Font
		/Subtype /Type1
		/FirstChar 71
		/LastChar 79
		/Widths [ 778 722 278 500 667 556 833 722 778 ]
		/Encoding /WinAnsiEncoding
		/BaseFont /PETER+Helvetica
		/FontDescriptor <<
			/Type /FontDescriptor
			/Ascent 718
			/CapHeight 718
			/Descent -207
			/Flags 32
			/FontBBox [ -166 -225 1000 931 ]
			/FontName /PETER+Helvetica
			/ItalicAngle 0
			/StemV 88
			/XHeight 523
			/StemH 88
			/CharSet (/G/O)
			%/FontFile3 19 0 R
			>>
		>>`,
}

var compositeFontDicts = []string{
	`<< /Type /Font
		/Subtype /Type0
		/Encoding /Identity-H
		/DescendantFonts [<<
			/Type /Font
			/Subtype /CIDFontType2
			/BaseFont /FLDOLC+PingFangSC-Regular
			/CIDSystemInfo << /Registry (Adobe) /Ordering (Identity) /Supplement 0 >>
			/W [ ]
			/DW 1000
			/FontDescriptor <<
				/Type /FontDescriptor
				/FontName /FLDOLC+PingFangSC-Regular
				/Flags 4
				/FontBBox [-123 -263 1177 1003]
				/ItalicAngle 0
				/Ascent 972
				/Descent -232
				/CapHeight 864
				/StemV 70
				/XHeight 648
				/StemH 64
				/AvgWidth 1000
				/MaxWidth 1300
				% /FontFile3 182 0 R
				>>
			>>]
		/BaseFont /FLDOLC+PingFangSC-Regular
		>>`,
}

func TestNewStandard14Font(t *testing.T) {
	type expect struct {
		subtype  string
		basefont string
		fonts.CharMetrics
	}
	tests := map[string]expect{
		"Courier": expect{
			subtype:     "Type1",
			basefont:    "Courier",
			CharMetrics: fonts.CharMetrics{Wx: 600, Wy: 0}},
	}

	for in, expect := range tests {
		font, err := model.NewStandard14Font(in)
		if err != nil {
			t.Fatalf("%s: %v", in, err)
		}
		if font.Subtype() != expect.subtype || font.BaseFont() != expect.basefont {
			t.Fatalf("%s: expected BaseFont=%s SubType=%s, but got BaseFont=%s SubType=%s",
				in, expect.basefont, expect.subtype, font.BaseFont(), font.Subtype())
		}

		metrics, ok := font.GetGlyphCharMetrics("space")
		if !ok {
			t.Fatalf("%s: failed to get glyph metric", in)
		}
		if metrics.Wx != expect.Wx || metrics.Wy != expect.Wy {
			t.Fatalf("%s: expected glyph metrics is Wx=%f Wy=%f, but got Wx=%f Wy=%f",
				in, expect.Wx, expect.Wy, metrics.Wx, metrics.Wy)
		}
	}
}

// TestSimpleFonts checks that we correctly recreate simple fonts that we parse.
func TestSimpleFonts(t *testing.T) {
	for _, d := range simpleFontDicts {
		objFontObj(t, d)
	}
}

// TestCompositeFonts checks that we correctly recreate composite fonts that we parse.
func TestCompositeFonts(t *testing.T) {
	for _, d := range compositeFontDicts {
		objFontObj(t, d)
	}
}

// TestCharcodeBytesToUnicode checks that CharcodeBytesToUnicode is working for the tests in
// ToUnicode cmap.
func TestCharcodeBytesToUnicode(t *testing.T) {
	for _, test := range charcodeBytesToUnicodeTest {
		test.check(t)
	}
}

var charcodeBytesToUnicodeTest = []fontFragmentTest{
	fontFragmentTest{"Test beginbfchar and beginbfrange cmap entries",
		"testdata/Yemeni.txt", 470,
		[]byte{0x1, 0xa8, 0x1, 0xb3, 0x1, 0xc2, 0x1, 0xcc, 0x1, 0xe7, 0x1, 0xef, 0x1, 0xf3, 0x0,
			0x20, 0x1, 0xa2, 0x1, 0xfc, 0x2, 0x8, 0x1, 0xa6, 0x1, 0xe7, 0x0, 0x20, 0x2, 0xb, 0x0,
			0x20, 0x2, 0xf, 0x0, 0x20, 0x0, 0x20, 0x1, 0xdd, 0x0, 0x20, 0x0, 0xcd, 0x0, 0xce, 0x0,
			0xcf, 0x0, 0xd0, 0x0, 0xd1, 0x1, 0xa1, 0x0, 0x20, 0x1, 0xa9, 0x2, 0x1},
		"ﺔﺟﺮﺸﻓﻛﻟ ﺎﻨﻴﺒﻓ ﻷ ﻻ  ﻉ ٠١٢٣٤ﺍ ﺕﻭ",
	},
	fontFragmentTest{"TrueType font with ToUnicode cmap",
		"testdata/print_alerts.txt", 9,
		[]byte{43, 40, 41, 34, 37, 42, 38, 49, 36, 38, 48, 34, 35, 36, 37, 35, 36, 58},
		"Alerts on printing",
	},
	fontFragmentTest{"Type0 font with ToUnicode cmap",
		"testdata/CollazoBio.txt", 7,
		[]byte{255, 50, 255, 65, 255, 78, 255, 68, 255, 79, 255, 77, 0, 32, 0, 32, 255, 77, 255, 65,
			255, 84, 255, 82, 255, 73, 255, 67, 255, 69, 255, 83, 0, 46},
		"Ｒａｎｄｏｍ  ｍａｔｒｉｃｅｓ.",
	},
	fontFragmentTest{"Type1 font with FontFile entry",
		"testdata/lm.txt", 7,
		[]byte{102, 65, 106, 66, 103},
		"{A|B}",
	},
}

type fontFragmentTest struct {
	description string
	filename    string
	objNum      int
	data        []byte
	expected    string
}

func (f *fontFragmentTest) String() string {
	return fmt.Sprintf("TEST{%q file=%q obj=%d|", f.description, f.filename, f.objNum)
}

// check loads the font in PDF fragment `filename`, object number `objNum`, runs
// CharcodeBytesToUnicode on `data` and checks that output equals `expected`.
func (f *fontFragmentTest) check(t *testing.T) {
	common.Log.Debug("fontFragmentTest: %s", f.description)
	numObj, err := parsePdfFragment(f.filename)
	if err != nil {
		t.Errorf("Failed to parse. %s err=%v", f, err)
		return
	}
	fontObj := numObj[f.objNum]
	font, err := model.NewPdfFontFromPdfObject(fontObj)
	if err != nil {
		t.Errorf("Failed to create font. %s err=%v", f, err)
		return
	}

	actualText, numChars, numMisses := font.CharcodeBytesToUnicode(f.data)
	if numMisses != 0 {
		t.Errorf("Some codes not decoded. numMisses=%d", numMisses)
		return
	}
	if actualText != f.expected {
		t.Errorf("Incorrect decoding. %s\nexpected=%q\n  actual=%q",
			f, f.expected, actualText)
	}
	if numChars != len([]rune(actualText)) {
		t.Errorf("Incorrect numChars. %s numChars=%d expected=%d",
			f, numChars, len(actualText))
	}
}

// objFontObj parses `fontDict` to a make a Font, creates a PDF object from the Font and checks that
// the new PDF object is the same as the input object
func objFontObj(t *testing.T, fontDict string) error {

	parser := core.NewParserFromString(fontDict)
	obj, err := parser.ParseDict()
	if err != nil {
		t.Errorf("objFontObj: Failed to parse dict obj. fontDict=%q err=%v", fontDict, err)
		return err
	}
	font, err := model.NewPdfFontFromPdfObject(obj)
	if err != nil {
		t.Errorf("Failed to parse font object. obj=%s err=%v", obj, err)
		return err
	}

	// Resolve all the indirect references in the font objects so we can compare their contents.
	obj1 := core.FlattenObject(obj)
	obj2 := core.FlattenObject(font.ToPdfObject())

	// Check that the reconstituted font is the same as the original.
	if !core.EqualObjects(obj1, obj2) {
		t.Errorf("Different objects.\nobj1=%s\nobj2=%s\nfont=%s", obj1, obj2, font)
		return errors.New("different objects")
	}

	return nil
}

// parsePdfFragment parses a file containing fragments of a PDF `filename` (see
// charcodeBytesToUnicodeTest) and returns a map of {object number: object} with indirect objects
// replaced by their values if they are in `filename`.
func parsePdfFragment(filename string) (map[int]core.PdfObject, error) {
	data, err := ioutil.ReadFile(filename)
	if err != nil {
		return nil, err
	}
	return parsePdfObjects(string(data))
}

// parsePdfObjects parses a fragment of a PDF `text` and returns a map of {object number: object}
// with indirect objects replaced by their values if they are in `text`.
func parsePdfObjects(text string) (map[int]core.PdfObject, error) {
	numObj := map[int]core.PdfObject{}
	parser := core.NewParserFromString(text)

	// Build the numObj {object number: object} map
	nums := []int{}
	for {
		obj, err := parser.ParseIndirectObject()
		if err != nil {
			if err == io.EOF {
				break
			}
			return numObj, err
		}
		switch t := obj.(type) {
		case *core.PdfIndirectObject:
			numObj[int(t.ObjectNumber)] = obj
			nums = append(nums, int(t.ObjectNumber))
		case *core.PdfObjectStream:
			numObj[int(t.ObjectNumber)] = obj
			nums = append(nums, int(t.ObjectNumber))
		}
	}

	common.Log.Debug("parsePdfObjects: Parsed %d objects %+v", len(numObj), nums)

	// Replace the indirect objects in all dicts and arrays with their values, if they are in numObj.
	for n, obj := range numObj {
		common.Log.Debug("-- 0 %d obj %T", n, obj)
		iobj, ok := obj.(*core.PdfIndirectObject)
		if !ok {
			continue
		}
		common.Log.Debug("   -- %T", iobj.PdfObject)
		iobj.PdfObject, ok = replaceReferences(numObj, iobj.PdfObject)
		if !ok {
			common.Log.Debug("ERROR: unresolved reference")
		}
	}
	return numObj, nil
}

// replaceReferences replaces the object references in all dicts and arrays with their values, if
// they are in numObj. The boolean return is true if all object references were successfuly
// replaced.
func replaceReferences(numObj map[int]core.PdfObject, obj core.PdfObject) (core.PdfObject, bool) {
	var ok bool
	switch t := obj.(type) {
	case *core.PdfObjectReference:
		o, ok := numObj[int(t.ObjectNumber)]
		common.Log.Debug("    %d 0 R  %t ", t.ObjectNumber, ok)
		return o, ok
	case *core.PdfObjectDictionary:
		for _, k := range t.Keys() {
			o := t.Get(k)
			o, ok = replaceReferences(numObj, o)
			if !ok {
				return o, ok
			}
			t.Set(k, o)
		}
	case *core.PdfObjectArray:
		for i, o := range *t {
			o, ok = replaceReferences(numObj, o)
			if !ok {
				return o, ok
			}
			(*t)[i] = o
		}
	}
	return obj, true
}
-												Add basic test cases

											
										
										
											2018-07-09 18:01:22 +10:00
+								package model_test
-												Major changes to font code
- Added Type1 font parsing.
- Added Standard 14 font parsing.
- Fixed some bugs in cmap code.
- Started re-structuring of font code. Moved common font fields to `fontSkeleton`

											
										
										
											2018-06-27 12:25:59 +10:00
 								import (
 									"errors"
-												Added a test for CharcodeBytesToUnicode for TrueType fonts with ToUnicode cmaps

											
										
										
											2018-07-17 17:43:11 +10:00
+									"fmt"
 									"io"
-												Added a test for Type1 FontFile decoding

											
										
										
											2018-07-18 14:30:43 +10:00
+									"io/ioutil"
-												Major changes to font code
- Added Type1 font parsing.
- Added Standard 14 font parsing.
- Fixed some bugs in cmap code.
- Started re-structuring of font code. Moved common font fields to `fontSkeleton`

											
										
										
											2018-06-27 12:25:59 +10:00
+									"testing"
-												Added a test for CharcodeBytesToUnicode for Type0 ToUnicode cmaps

											
										
										
											2018-07-19 10:28:23 +10:00
+									"github.com/unidoc/unidoc/common"
-												Don't import core anonymously

											
										
										
											2018-07-15 17:29:27 +10:00
+									"github.com/unidoc/unidoc/pdf/core"
-												Add basic test cases

											
										
										
											2018-07-09 18:01:22 +10:00
+									"github.com/unidoc/unidoc/pdf/model"
 									"github.com/unidoc/unidoc/pdf/model/fonts"
-												Major changes to font code
- Added Type1 font parsing.
- Added Standard 14 font parsing.
- Fixed some bugs in cmap code.
- Started re-structuring of font code. Moved common font fields to `fontSkeleton`

											
										
										
											2018-06-27 12:25:59 +10:00
+								)
 								func init() {
-												Added a test for Type1 FontFile decoding

											
										
										
											2018-07-18 14:30:43 +10:00
+									// common.SetLogger(common.NewConsoleLogger(common.LogLevelDebug))
-												Major changes to font code
- Added Type1 font parsing.
- Added Standard 14 font parsing.
- Fixed some bugs in cmap code.
- Started re-structuring of font code. Moved common font fields to `fontSkeleton`

											
										
										
											2018-06-27 12:25:59 +10:00
+								}
-												Simplified font.go. Made ToUnicode cmap private. Removed duplicate ToUnicode from Type0 font

											
										
										
											2018-06-28 11:06:23 +10:00
+								var simpleFontDicts = []string{
-												Major changes to font code
- Added Type1 font parsing.
- Added Standard 14 font parsing.
- Fixed some bugs in cmap code.
- Started re-structuring of font code. Moved common font fields to `fontSkeleton`

											
										
										
											2018-06-27 12:25:59 +10:00
+									`<< /Type /Font
 										/BaseFont /Helvetica
 										/Subtype /Type1
 										/Encoding /WinAnsiEncoding
 										>>`,
 									`<< /Type /Font
 										/BaseFont /Helvetica-Oblique
 										/Subtype /Type1
 										/Encoding /WinAnsiEncoding
 										>>`,
 									`<< /Type /Font
 										/Subtype /Type1
 										/FirstChar 71
 										/LastChar 79
 										/Widths [ 778 722 278 500 667 556 833 722 778 ]
 										/Encoding /WinAnsiEncoding
 										/BaseFont /AOMFKK+Helvetica
 										>>`,
 									`<< /Type /Font
 										/Subtype /Type1
 										/FirstChar 71
 										/LastChar 79
 										/Widths [ 778 722 278 500 667 556 833 722 778 ]
 										/Encoding /WinAnsiEncoding
 										/BaseFont /PETER+Helvetica
 										/FontDescriptor <<
 											/Type /FontDescriptor
 											/Ascent 718
 											/CapHeight 718
 											/Descent -207
 											/Flags 32
 											/FontBBox [ -166 -225 1000 931 ]
 											/FontName /PETER+Helvetica
 											/ItalicAngle 0
 											/StemV 88
 											/XHeight 523
 											/StemH 88
 											/CharSet (/G/O)
 											%/FontFile3 19 0 R
 											>>
 										>>`,
 								}
-												Got Type0 font -> obj -> font test passing

											
										
										
											2018-06-29 18:09:44 +10:00
+								var compositeFontDicts = []string{
 									`<< /Type /Font
 										/Subtype /Type0
 										/Encoding /Identity-H
 										/DescendantFonts [<<
 											/Type /Font
 											/Subtype /CIDFontType2
 											/BaseFont /FLDOLC+PingFangSC-Regular
 											/CIDSystemInfo << /Registry (Adobe) /Ordering (Identity) /Supplement 0 >>
 											/W [ ]
 											/DW 1000
 											/FontDescriptor <<
 												/Type /FontDescriptor
 												/FontName /FLDOLC+PingFangSC-Regular
 												/Flags 4
 												/FontBBox [-123 -263 1177 1003]
 												/ItalicAngle 0
 												/Ascent 972
 												/Descent -232
 												/CapHeight 864
 												/StemV 70
 												/XHeight 648
 												/StemH 64
 												/AvgWidth 1000
 												/MaxWidth 1300
 												% /FontFile3 182 0 R
 												>>
 											>>]
 										/BaseFont /FLDOLC+PingFangSC-Regular
 										>>`,
 								}
-												Modify log messages

											
										
										
											2018-07-09 18:10:38 +10:00
+								func TestNewStandard14Font(t *testing.T) {
-												Add basic test cases

											
										
										
											2018-07-09 18:01:22 +10:00
+									type expect struct {
 										subtype  string
 										basefont string
 										fonts.CharMetrics
 									}
 									tests := map[string]expect{
 										"Courier": expect{
 											subtype:     "Type1",
 											basefont:    "Courier",
 											CharMetrics: fonts.CharMetrics{Wx: 600, Wy: 0}},
 									}
 									for in, expect := range tests {
-												Modify log messages

											
										
										
											2018-07-09 18:10:38 +10:00
+										font, err := model.NewStandard14Font(in)
-												Add basic test cases

											
										
										
											2018-07-09 18:01:22 +10:00
+										if err != nil {
-												Modify log messages

											
										
										
											2018-07-09 18:10:38 +10:00
+											t.Fatalf("%s: %v", in, err)
-												Add basic test cases

											
										
										
											2018-07-09 18:01:22 +10:00
+										}
-												Modify log messages

											
										
										
											2018-07-09 18:10:38 +10:00
+										if font.Subtype() != expect.subtype || font.BaseFont() != expect.basefont {
 											t.Fatalf("%s: expected BaseFont=%s SubType=%s, but got BaseFont=%s SubType=%s",
 												in, expect.basefont, expect.subtype, font.BaseFont(), font.Subtype())
-												Add basic test cases

											
										
										
											2018-07-09 18:01:22 +10:00
+										}
-												Modify log messages

											
										
										
											2018-07-09 18:10:38 +10:00
+										metrics, ok := font.GetGlyphCharMetrics("space")
-												Add basic test cases

											
										
										
											2018-07-09 18:01:22 +10:00
+										if !ok {
-												Modify log messages

											
										
										
											2018-07-09 18:10:38 +10:00
+											t.Fatalf("%s: failed to get glyph metric", in)
-												Add basic test cases

											
										
										
											2018-07-09 18:01:22 +10:00
+										}
 										if metrics.Wx != expect.Wx || metrics.Wy != expect.Wy {
-												Abort test if error occurs

											
										
										
											2018-07-10 08:57:16 +10:00
+											t.Fatalf("%s: expected glyph metrics is Wx=%f Wy=%f, but got Wx=%f Wy=%f",
-												Add basic test cases

											
										
										
											2018-07-09 18:01:22 +10:00
+												in, expect.Wx, expect.Wy, metrics.Wx, metrics.Wy)
 										}
 									}
 								}
-												Simplified font.go. Made ToUnicode cmap private. Removed duplicate ToUnicode from Type0 font

											
										
										
											2018-06-28 11:06:23 +10:00
+								// TestSimpleFonts checks that we correctly recreate simple fonts that we parse.
-												Major changes to font code
- Added Type1 font parsing.
- Added Standard 14 font parsing.
- Fixed some bugs in cmap code.
- Started re-structuring of font code. Moved common font fields to `fontSkeleton`

											
										
										
											2018-06-27 12:25:59 +10:00
+								func TestSimpleFonts(t *testing.T) {
-												Simplified font.go. Made ToUnicode cmap private. Removed duplicate ToUnicode from Type0 font

											
										
										
											2018-06-28 11:06:23 +10:00
+									for _, d := range simpleFontDicts {
-												Major changes to font code
- Added Type1 font parsing.
- Added Standard 14 font parsing.
- Fixed some bugs in cmap code.
- Started re-structuring of font code. Moved common font fields to `fontSkeleton`

											
										
										
											2018-06-27 12:25:59 +10:00
+										objFontObj(t, d)
 									}
 								}
-												Got Type0 font -> obj -> font test passing

											
										
										
											2018-06-29 18:09:44 +10:00
+								// TestCompositeFonts checks that we correctly recreate composite fonts that we parse.
 								func TestCompositeFonts(t *testing.T) {
 									for _, d := range compositeFontDicts {
 										objFontObj(t, d)
 									}
 								}
-												Added a test for Type1 FontFile decoding

											
										
										
											2018-07-18 14:30:43 +10:00
+								// TestCharcodeBytesToUnicode checks that CharcodeBytesToUnicode is working for the tests in
-												Added a test for CharcodeBytesToUnicode for TrueType fonts with ToUnicode cmaps

											
										
										
											2018-07-17 17:43:11 +10:00
+								// ToUnicode cmap.
-												Added a test for Type1 FontFile decoding

											
										
										
											2018-07-18 14:30:43 +10:00
+								func TestCharcodeBytesToUnicode(t *testing.T) {
 									for _, test := range charcodeBytesToUnicodeTest {
 										test.check(t)
 									}
 								}
 								var charcodeBytesToUnicodeTest = []fontFragmentTest{
-												Added a test for cmap beginbfchar and beginbfrange entries

											
										
										
											2018-07-20 11:39:41 +10:00
+									fontFragmentTest{"Test beginbfchar and beginbfrange cmap entries",
 										"testdata/Yemeni.txt", 470,
 										[]byte{0x1, 0xa8, 0x1, 0xb3, 0x1, 0xc2, 0x1, 0xcc, 0x1, 0xe7, 0x1, 0xef, 0x1, 0xf3, 0x0,
 x20, 0x1, 0xa2, 0x1, 0xfc, 0x2, 0x8, 0x1, 0xa6, 0x1, 0xe7, 0x0, 0x20, 0x2, 0xb, 0x0,
 x20, 0x2, 0xf, 0x0, 0x20, 0x0, 0x20, 0x1, 0xdd, 0x0, 0x20, 0x0, 0xcd, 0x0, 0xce, 0x0,
 xcf, 0x0, 0xd0, 0x0, 0xd1, 0x1, 0xa1, 0x0, 0x20, 0x1, 0xa9, 0x2, 0x1},
 										"ﺔﺟﺮﺸﻓﻛﻟ ﺎﻨﻴﺒﻓ ﻷ ﻻ  ﻉ ٠١٢٣٤ﺍ ﺕﻭ",
 									},
-												Added a test for CharcodeBytesToUnicode for Type0 ToUnicode cmaps

											
										
										
											2018-07-19 10:28:23 +10:00
+									fontFragmentTest{"TrueType font with ToUnicode cmap",
-												Added a test for Type1 FontFile decoding

											
										
										
											2018-07-18 14:30:43 +10:00
+										"testdata/print_alerts.txt", 9,
 										[]byte{43, 40, 41, 34, 37, 42, 38, 49, 36, 38, 48, 34, 35, 36, 37, 35, 36, 58},
 										"Alerts on printing",
 									},
-												Added a test for CharcodeBytesToUnicode for Type0 ToUnicode cmaps

											
										
										
											2018-07-19 10:28:23 +10:00
+									fontFragmentTest{"Type0 font with ToUnicode cmap",
 										"testdata/CollazoBio.txt", 7,
 										[]byte{255, 50, 255, 65, 255, 78, 255, 68, 255, 79, 255, 77, 0, 32, 0, 32, 255, 77, 255, 65,
 , 84, 255, 82, 255, 73, 255, 67, 255, 69, 255, 83, 0, 46},
 										"Ｒａｎｄｏｍ  ｍａｔｒｉｃｅｓ.",
 									},
 									fontFragmentTest{"Type1 font with FontFile entry",
-												Added a test for Type1 FontFile decoding

											
										
										
											2018-07-18 14:30:43 +10:00
+										"testdata/lm.txt", 7,
 										[]byte{102, 65, 106, 66, 103},
 										"{A|B}",
 									},
 								}
 								type fontFragmentTest struct {
 									description string
 									filename    string
 									objNum      int
 									data        []byte
 									expected    string
 								}
 								func (f *fontFragmentTest) String() string {
 									return fmt.Sprintf("TEST{%q file=%q obj=%d|", f.description, f.filename, f.objNum)
 								}
 								// check loads the font in PDF fragment `filename`, object number `objNum`, runs
 								// CharcodeBytesToUnicode on `data` and checks that output equals `expected`.
 								func (f *fontFragmentTest) check(t *testing.T) {
-												Added a test for CharcodeBytesToUnicode for Type0 ToUnicode cmaps

											
										
										
											2018-07-19 10:28:23 +10:00
+									common.Log.Debug("fontFragmentTest: %s", f.description)
-												Added a test for Type1 FontFile decoding

											
										
										
											2018-07-18 14:30:43 +10:00
+									numObj, err := parsePdfFragment(f.filename)
-												Added a test for CharcodeBytesToUnicode for TrueType fonts with ToUnicode cmaps

											
										
										
											2018-07-17 17:43:11 +10:00
+									if err != nil {
-												Added a test for Type1 FontFile decoding

											
										
										
											2018-07-18 14:30:43 +10:00
+										t.Errorf("Failed to parse. %s err=%v", f, err)
-												Added a test for CharcodeBytesToUnicode for TrueType fonts with ToUnicode cmaps

											
										
										
											2018-07-17 17:43:11 +10:00
+										return
 									}
-												Added a test for Type1 FontFile decoding

											
										
										
											2018-07-18 14:30:43 +10:00
+									fontObj := numObj[f.objNum]
-												Added a test for CharcodeBytesToUnicode for TrueType fonts with ToUnicode cmaps

											
										
										
											2018-07-17 17:43:11 +10:00
+									font, err := model.NewPdfFontFromPdfObject(fontObj)
 									if err != nil {
-												Added a test for Type1 FontFile decoding

											
										
										
											2018-07-18 14:30:43 +10:00
+										t.Errorf("Failed to create font. %s err=%v", f, err)
-												Added a test for CharcodeBytesToUnicode for TrueType fonts with ToUnicode cmaps

											
										
										
											2018-07-17 17:43:11 +10:00
+										return
 									}
-												Added a test for Type1 FontFile decoding

											
										
										
											2018-07-18 14:30:43 +10:00
+									actualText, numChars, numMisses := font.CharcodeBytesToUnicode(f.data)
-												Added a test for CharcodeBytesToUnicode for TrueType fonts with ToUnicode cmaps

											
										
										
											2018-07-17 17:43:11 +10:00
+									if numMisses != 0 {
 										t.Errorf("Some codes not decoded. numMisses=%d", numMisses)
 										return
 									}
-												Added a test for Type1 FontFile decoding

											
										
										
											2018-07-18 14:30:43 +10:00
+									if actualText != f.expected {
 										t.Errorf("Incorrect decoding. %s\nexpected=%q\n  actual=%q",
 											f, f.expected, actualText)
-												Added a test for CharcodeBytesToUnicode for TrueType fonts with ToUnicode cmaps

											
										
										
											2018-07-17 17:43:11 +10:00
+									}
-												Added a test for CharcodeBytesToUnicode for Type0 ToUnicode cmaps

											
										
										
											2018-07-19 10:28:23 +10:00
+									if numChars != len([]rune(actualText)) {
-												Added a test for Type1 FontFile decoding

											
										
										
											2018-07-18 14:30:43 +10:00
+										t.Errorf("Incorrect numChars. %s numChars=%d expected=%d",
 											f, numChars, len(actualText))
-												Added a test for CharcodeBytesToUnicode for TrueType fonts with ToUnicode cmaps

											
										
										
											2018-07-17 17:43:11 +10:00
+									}
 								}
-												Major changes to font code
- Added Type1 font parsing.
- Added Standard 14 font parsing.
- Fixed some bugs in cmap code.
- Started re-structuring of font code. Moved common font fields to `fontSkeleton`

											
										
										
											2018-06-27 12:25:59 +10:00
+								// objFontObj parses `fontDict` to a make a Font, creates a PDF object from the Font and checks that
 								// the new PDF object is the same as the input object
 								func objFontObj(t *testing.T, fontDict string) error {
-												Don't import core anonymously

											
										
										
											2018-07-15 17:29:27 +10:00
+									parser := core.NewParserFromString(fontDict)
-												Major changes to font code
- Added Type1 font parsing.
- Added Standard 14 font parsing.
- Fixed some bugs in cmap code.
- Started re-structuring of font code. Moved common font fields to `fontSkeleton`

											
										
										
											2018-06-27 12:25:59 +10:00
+									obj, err := parser.ParseDict()
 									if err != nil {
 										t.Errorf("objFontObj: Failed to parse dict obj. fontDict=%q err=%v", fontDict, err)
 										return err
 									}
-												Add basic test cases

											
										
										
											2018-07-09 18:01:22 +10:00
+									font, err := model.NewPdfFontFromPdfObject(obj)
-												Major changes to font code
- Added Type1 font parsing.
- Added Standard 14 font parsing.
- Fixed some bugs in cmap code.
- Started re-structuring of font code. Moved common font fields to `fontSkeleton`

											
										
										
											2018-06-27 12:25:59 +10:00
+									if err != nil {
 										t.Errorf("Failed to parse font object. obj=%s err=%v", obj, err)
 										return err
 									}
 									// Resolve all the indirect references in the font objects so we can compare their contents.
-												Don't import core anonymously

											
										
										
											2018-07-15 17:29:27 +10:00
+									obj1 := core.FlattenObject(obj)
 									obj2 := core.FlattenObject(font.ToPdfObject())
-												Major changes to font code
- Added Type1 font parsing.
- Added Standard 14 font parsing.
- Fixed some bugs in cmap code.
- Started re-structuring of font code. Moved common font fields to `fontSkeleton`

											
										
										
											2018-06-27 12:25:59 +10:00
-												Simplified font.go. Made ToUnicode cmap private. Removed duplicate ToUnicode from Type0 font

											
										
										
											2018-06-28 11:06:23 +10:00
+									// Check that the reconstituted font is the same as the original.
-												Don't import core anonymously

											
										
										
											2018-07-15 17:29:27 +10:00
+									if !core.EqualObjects(obj1, obj2) {
-												Major changes to font code
- Added Type1 font parsing.
- Added Standard 14 font parsing.
- Fixed some bugs in cmap code.
- Started re-structuring of font code. Moved common font fields to `fontSkeleton`

											
										
										
											2018-06-27 12:25:59 +10:00
+										t.Errorf("Different objects.\nobj1=%s\nobj2=%s\nfont=%s", obj1, obj2, font)
 										return errors.New("different objects")
 									}
-												Simplified font.go. Made ToUnicode cmap private. Removed duplicate ToUnicode from Type0 font

											
										
										
											2018-06-28 11:06:23 +10:00
-												Major changes to font code
- Added Type1 font parsing.
- Added Standard 14 font parsing.
- Fixed some bugs in cmap code.
- Started re-structuring of font code. Moved common font fields to `fontSkeleton`

											
										
										
											2018-06-27 12:25:59 +10:00
+									return nil
 								}
-												Added a test for CharcodeBytesToUnicode for TrueType fonts with ToUnicode cmaps

											
										
										
											2018-07-17 17:43:11 +10:00
-												fixed comments

											
										
										
											2018-07-18 14:50:52 +10:00
+								// parsePdfFragment parses a file containing fragments of a PDF `filename` (see
 								// charcodeBytesToUnicodeTest) and returns a map of {object number: object} with indirect objects
 								// replaced by their values if they are in `filename`.
-												Added a test for Type1 FontFile decoding

											
										
										
											2018-07-18 14:30:43 +10:00
+								func parsePdfFragment(filename string) (map[int]core.PdfObject, error) {
 									data, err := ioutil.ReadFile(filename)
 									if err != nil {
 										return nil, err
 									}
 									return parsePdfObjects(string(data))
 								}
-												fixed comments

											
										
										
											2018-07-18 14:50:52 +10:00
+								// parsePdfObjects parses a fragment of a PDF `text` and returns a map of {object number: object}
 								// with indirect objects replaced by their values if they are in `text`.
-												Added a test for Type1 FontFile decoding

											
										
										
											2018-07-18 14:30:43 +10:00
+								func parsePdfObjects(text string) (map[int]core.PdfObject, error) {
 									numObj := map[int]core.PdfObject{}
-												Added a test for CharcodeBytesToUnicode for TrueType fonts with ToUnicode cmaps

											
										
										
											2018-07-17 17:43:11 +10:00
+									parser := core.NewParserFromString(text)
-												Added a test for Type1 FontFile decoding

											
										
										
											2018-07-18 14:30:43 +10:00
 									// Build the numObj {object number: object} map
-												Added a test for cmap beginbfchar and beginbfrange entries

											
										
										
											2018-07-20 11:39:41 +10:00
+									nums := []int{}
-												Added a test for CharcodeBytesToUnicode for TrueType fonts with ToUnicode cmaps

											
										
										
											2018-07-17 17:43:11 +10:00
+									for {
 										obj, err := parser.ParseIndirectObject()
 										if err != nil {
 											if err == io.EOF {
 												break
 											}
 											return numObj, err
 										}
 										switch t := obj.(type) {
 										case *core.PdfIndirectObject:
-												Added a test for Type1 FontFile decoding

											
										
										
											2018-07-18 14:30:43 +10:00
+											numObj[int(t.ObjectNumber)] = obj
-												Added a test for cmap beginbfchar and beginbfrange entries

											
										
										
											2018-07-20 11:39:41 +10:00
+											nums = append(nums, int(t.ObjectNumber))
-												Added a test for CharcodeBytesToUnicode for TrueType fonts with ToUnicode cmaps

											
										
										
											2018-07-17 17:43:11 +10:00
+										case *core.PdfObjectStream:
-												Added a test for Type1 FontFile decoding

											
										
										
											2018-07-18 14:30:43 +10:00
+											numObj[int(t.ObjectNumber)] = obj
-												Added a test for cmap beginbfchar and beginbfrange entries

											
										
										
											2018-07-20 11:39:41 +10:00
+											nums = append(nums, int(t.ObjectNumber))
-												Added a test for CharcodeBytesToUnicode for TrueType fonts with ToUnicode cmaps

											
										
										
											2018-07-17 17:43:11 +10:00
+										}
 									}
-												Added a test for cmap beginbfchar and beginbfrange entries

											
										
										
											2018-07-20 11:39:41 +10:00
+									common.Log.Debug("parsePdfObjects: Parsed %d objects %+v", len(numObj), nums)
-												Added a test for CharcodeBytesToUnicode for Type0 ToUnicode cmaps

											
										
										
											2018-07-19 10:28:23 +10:00
-												Added a test for cmap beginbfchar and beginbfrange entries

											
										
										
											2018-07-20 11:39:41 +10:00
+									// Replace the indirect objects in all dicts and arrays with their values, if they are in numObj.
 									for n, obj := range numObj {
 										common.Log.Debug("-- 0 %d obj %T", n, obj)
-												Added a test for CharcodeBytesToUnicode for TrueType fonts with ToUnicode cmaps

											
										
										
											2018-07-17 17:43:11 +10:00
+										iobj, ok := obj.(*core.PdfIndirectObject)
 										if !ok {
 											continue
 										}
-												Added a test for cmap beginbfchar and beginbfrange entries

											
										
										
											2018-07-20 11:39:41 +10:00
+										common.Log.Debug("   -- %T", iobj.PdfObject)
 										iobj.PdfObject, ok = replaceReferences(numObj, iobj.PdfObject)
 										if !ok {
 											common.Log.Debug("ERROR: unresolved reference")
 										}
 									}
 									return numObj, nil
 								}
 								// replaceReferences replaces the object references in all dicts and arrays with their values, if
 								// they are in numObj. The boolean return is true if all object references were successfuly
 								// replaced.
 								func replaceReferences(numObj map[int]core.PdfObject, obj core.PdfObject) (core.PdfObject, bool) {
 									var ok bool
 									switch t := obj.(type) {
 									case *core.PdfObjectReference:
 										o, ok := numObj[int(t.ObjectNumber)]
 										common.Log.Debug("    %d 0 R  %t ", t.ObjectNumber, ok)
 										return o, ok
 									case *core.PdfObjectDictionary:
 										for _, k := range t.Keys() {
 											o := t.Get(k)
 											o, ok = replaceReferences(numObj, o)
 											if !ok {
 												return o, ok
-												Added a test for CharcodeBytesToUnicode for Type0 ToUnicode cmaps

											
										
										
											2018-07-19 10:28:23 +10:00
+											}
-												Added a test for cmap beginbfchar and beginbfrange entries

											
										
										
											2018-07-20 11:39:41 +10:00
+											t.Set(k, o)
 										}
 									case *core.PdfObjectArray:
 										for i, o := range *t {
 											o, ok = replaceReferences(numObj, o)
 											if !ok {
 												return o, ok
-												Added a test for CharcodeBytesToUnicode for TrueType fonts with ToUnicode cmaps

											
										
										
											2018-07-17 17:43:11 +10:00
+											}
-												Added a test for cmap beginbfchar and beginbfrange entries

											
										
										
											2018-07-20 11:39:41 +10:00
+											(*t)[i] = o
-												Added a test for CharcodeBytesToUnicode for TrueType fonts with ToUnicode cmaps

											
										
										
											2018-07-17 17:43:11 +10:00
+										}
 									}
-												Added a test for cmap beginbfchar and beginbfrange entries

											
										
										
											2018-07-20 11:39:41 +10:00
+									return obj, true
-												Added a test for CharcodeBytesToUnicode for TrueType fonts with ToUnicode cmaps

											
										
										
											2018-07-17 17:43:11 +10:00
+								}