unipdf/internal/jbig2/tests/encode_test.go

204 lines
5.0 KiB
Go
Raw Normal View History

JBIG2 Generic Encoder (#264) * Prepared skeleton and basic component implementations for the jbig2 encoding. * Added Bitset. Implemented Bitmap. * Decoder with old Arithmetic Decoder * Partly working arithmetic * Working arithmetic decoder. * MMR patched. * rebuild to apache. * Working generic * Working generic * Decoded full document * Update Jenkinsfile go version [master] (#398) * Update Jenkinsfile go version * Decoded AnnexH document * Minor issues fixed. * Update README.md * Fixed generic region errors. Added benchmark. Added bitmap unpadder. Added Bitmap toImage method. * Fixed endofpage error * Added integration test. * Decoded all test files without errors. Implemented JBIG2Global. * Merged with v3 version * Fixed the EOF in the globals issue * Fixed the JBIG2 ChocolateData Decode * JBIG2 Added license information * Minor fix in jbig2 encoding. * Applied the logging convention * Cleaned unnecessary imports * Go modules clear unused imports * checked out the README.md * Moved trace to Debug. Fixed the build integrate tag in the document_decode_test.go * Initial encoder skeleton * Applied UniPDF Developer Guide. Fixed lint issues. * Cleared documentation, fixed style issues. * Added jbig2 doc.go files. Applied unipdf guide style. * Minor code style changes. * Minor naming and style issues fixes. * Minor naming changes. Style issues fixed. * Review r11 fixes. * Added JBIG2 Encoder skeleton. * Moved Document and Page to jbig2/document package. Created decoder package responsible for decoding jbig2 stream. * Implemented raster functions. * Added raster uni low test funcitons. * Added raster low test functions * untracked files on jbig2-encoder: c869089 Added raster low test functions * index on jbig2-encoder: c869089 Added raster low test functions * Added morph files. 
* implemented jbig2 encoder basics * JBIG2 Encoder - Generic method * Added jbig2 image encode ttests, black/white image tests * cleaned and tested jbig2 package * unfinished jbig2 classified encoder * jbig2 minor style changes * minor jbig2 encoder changes * prepared JBIG2 Encoder * Style and lint fixes * Minor changes and lints * Fixed shift unsinged value build errors * Minor naming change * Added jbig2 encode, image gondels. Fixed jbig2 decode bug. * Provided jbig2 core.DecodeGlobals function. * Fixed JBIG2Encoder `r6` revision issues. * Removed public JBIG2Encoder document. * Minor style changes * added NewJBIG2Encoder function. * fixed JBIG2Encoder 'r9' revision issues. * Cleared 'r9' commented code. * Updated ACKNOWLEDGEMENETS. Fixed JBIG2Encoder 'r10' revision issues. Co-authored-by: Gunnsteinn Hall <gunnsteinn.hall@gmail.com>
2020-03-27 12:47:41 +01:00
/*
* This file is subject to the terms and conditions defined in
* file 'LICENSE.md', which is part of this source code package.
*/
package tests
import (
"archive/zip"
"bytes"
"crypto/md5"
"fmt"
"image"
"image/jpeg"
"os"
"path/filepath"
"strings"
"testing"
"time"
"github.com/stretchr/testify/assert"
"github.com/stretchr/testify/require"
"github.com/unidoc/unipdf/v3/common"
"github.com/unidoc/unipdf/v3/core"
)
// TestImageEncodeDecodeJBIG2 tests the encode and decode process for the JBIG2 encoder.
//
// The input images are looked up in the directory named by the EnvImageDirectory
// environment variable; the test is skipped when that variable is empty or when
// readFileNames returns no "jpg" entries for it.
//
// For every input that image.Decode accepts, a subtest:
//   - converts the image with core.GoImageToJBIG2 and encodes it with core.JBIG2Encoder,
//   - decodes the encoded data back with JBIG2Encoder.DecodeImages,
//   - JPEG-encodes both the converted image and the decoded image and asserts that
//     the MD5 sums of the two JPEG streams are equal.
//
// The hashes of the decoded images are finally handed to checkGoldenValuePairs.
// Intermediate artifacts are written to per-image zip files in a temporary directory,
// depending on the keepEncodedFile and keepImageFiles flags.
func TestImageEncodeDecodeJBIG2(t *testing.T) {
	dirName := os.Getenv(EnvImageDirectory)
	if dirName == "" {
		t.Skipf("no environment variable: '%s' provided", EnvImageDirectory)
	}

	// get the file names within given directory
	fileNames, err := readFileNames(dirName, "jpg")
	require.NoError(t, err)
	if len(fileNames) == 0 {
		t.Skipf("no files found in the '%s' directory", dirName)
	}

	// prepare temporary directory where the jbig2 files would be stored
	tempDir := filepath.Join(os.TempDir(), "unipdf", "jbig2", "encoded-decoded")
	err = os.MkdirAll(tempDir, 0700)
	require.NoError(t, err)

	// logFile stays nil unless logging to a file was requested.
	var logFile *os.File
	switch {
	case logToFile:
		logName := filepath.Join(tempDir, fmt.Sprintf("log_%s.txt", time.Now().Format("20060102")))
		logFile, err = os.Create(logName)
		require.NoError(t, err)
		common.SetLogger(common.NewWriterLogger(common.LogLevelTrace, logFile))
	case testing.Verbose():
		common.SetLogger(common.NewConsoleLogger(common.LogLevelDebug))
	}

	// clear all the temporary files
	//
	// This is the only cleanup step on purpose: an additional unconditional
	// os.RemoveAll(tempDir) would also delete the log file that the logToFile
	// branch below is meant to preserve.
	defer func() {
		if logFile != nil {
			logFile.Close()
		}
		if keepImageFiles {
			return
		}

		// A local error is used so that the cleanup never touches the test's 'err'.
		var cleanupErr error
		if logToFile {
			// keep the log file, remove only the zip archives.
			cleanupErr = filepath.Walk(tempDir, func(path string, info os.FileInfo, walkErr error) error {
				if walkErr != nil {
					return walkErr
				}
				if strings.HasSuffix(info.Name(), "zip") {
					return os.Remove(path)
				}
				return nil
			})
		} else {
			cleanupErr = os.RemoveAll(tempDir)
		}
		if cleanupErr != nil {
			// the error text is passed as an argument so that a '%' inside of it
			// is not interpreted as a formatting verb.
			common.Log.Error("%v", cleanupErr)
		}
	}()

	buf := &bytes.Buffer{}
	h := md5.New()
	edp := make([]goldenValuePair, 0, len(fileNames))

	for _, fileName := range fileNames {
		// read the file
		imgFile, err := getFile(dirName, fileName)
		require.NoError(t, err)

		// try to read the file as image.
		img, _, err := image.Decode(imgFile)
		// The file is not needed once it was decoded - close it right away instead of
		// deferring, so that the descriptors don't pile up until the test returns.
		// The file was only read from, thus the result of Close is not checked.
		imgFile.Close()
		if err != nil {
			// if the image is of unknown decoding or is not an image skip the test.
			common.Log.Debug("File: '%s' couldn't be read as an image: %v", fileName, err)
			continue
		}

		rawName := rawFileName(fileName)
		t.Run(rawName, func(t *testing.T) {
			zipFileName := filepath.Join(tempDir, rawName+".zip")

			// create zip file containing encoded images
			zf, err := os.Create(zipFileName)
			require.NoError(t, err)
			defer zf.Close()

			// wrap zip writer over the file writer.
			// Deferred after zf.Close, thus it is closed before the underlying file.
			zw := zip.NewWriter(zf)
			defer zw.Close()

			// convert the input image into jbig2 1bpp acceptable binary image.
			jimg, err := core.GoImageToJBIG2(img, core.JB2ImageAutoThreshold)
			require.NoError(t, err)

			// create the encoder
			e := &core.JBIG2Encoder{}
			err = e.AddPageImage(jimg, &core.JBIG2EncoderSettings{DuplicatedLinesRemoval: true, FileMode: true})
			require.NoError(t, err)

			data, err := e.Encode()
			require.NoError(t, err)

			if keepEncodedFile {
				// create .jbig2 file within the zip file
				jbf, err := zw.Create(rawName + ".jbig2")
				require.NoError(t, err)

				// write encoded data into jb2 file
				_, err = jbf.Write(data)
				require.NoError(t, err)
			}

			// create golang image and store it within zip file
			bwImage, err := jimg.ToGoImage()
			require.NoError(t, err)

			// store the binary image in the 'jpeg' format.
			buf.Reset()
			err = jpeg.Encode(buf, bwImage, &jpeg.Options{Quality: jpeg.DefaultQuality})
			require.NoError(t, err)

			// hash the jpeg stream before it is used anywhere else.
			h.Reset()
			_, err = h.Write(buf.Bytes())
			require.NoError(t, err)
			hashOrig := h.Sum(nil)

			// write images if the flag is set to true
			if keepImageFiles {
				// create a jpeg file to show the black white image.
				df, err := zw.Create(rawName + ".jpg")
				require.NoError(t, err)

				// buf.Bytes() is written directly - buf.WriteTo would drain the buffer.
				_, err = df.Write(buf.Bytes())
				require.NoError(t, err)
			}

			// decode the encoded data and store it's results in the zipped file.
			d := &core.JBIG2Encoder{}
			decoded, err := d.DecodeImages(data)
			require.NoError(t, err)
			require.Len(t, decoded, 1)

			// write the decoded image
			buf.Reset()
			err = jpeg.Encode(buf, decoded[0], &jpeg.Options{Quality: jpeg.DefaultQuality})
			require.NoError(t, err)

			h.Reset()
			_, err = h.Write(buf.Bytes())
			require.NoError(t, err)
			hashEncoded := h.Sum(nil)

			if keepImageFiles {
				// create decoded image file within the zip file.
				dimg, err := zw.Create(rawName + "_encdec.jpg")
				require.NoError(t, err)

				_, err = dimg.Write(buf.Bytes())
				require.NoError(t, err)
			}

			assert.True(t, bytes.Equal(hashOrig, hashEncoded),
				"decoded image differs from the encoded one for the file: '%s'", fileName)

			edp = append(edp, goldenValuePair{
				Filename: fileName,
				Hash:     hashEncoded,
			})
		})
	}

	const goldenFileName = "encoded-decoded"
	checkGoldenValuePairs(t, dirName, goldenFileName, edp...)
}