mirror of
https://github.com/unidoc/unipdf.git
synced 2025-04-27 13:48:51 +08:00

* Prepared skeleton and basic component implementations for the jbig2 encoding. * Added Bitset. Implemented Bitmap. * Decoder with old Arithmetic Decoder * Partly working arithmetic * Working arithmetic decoder. * MMR patched. * rebuild to apache. * Working generic * Working generic * Decoded full document * Update Jenkinsfile go version [master] (#398) * Update Jenkinsfile go version * Decoded AnnexH document * Minor issues fixed. * Update README.md * Fixed generic region errors. Added benchmark. Added bitmap unpadder. Added Bitmap toImage method. * Fixed endofpage error * Added integration test. * Decoded all test files without errors. Implemented JBIG2Global. * Merged with v3 version * Fixed the EOF in the globals issue * Fixed the JBIG2 ChocolateData Decode * JBIG2 Added license information * Minor fix in jbig2 encoding. * Applied the logging convention * Cleaned unnecessary imports * Go modules clear unused imports * checked out the README.md * Moved trace to Debug. Fixed the build integrate tag in the document_decode_test.go * Initial encoder skeleton * Applied UniPDF Developer Guide. Fixed lint issues. * Cleared documentation, fixed style issues. * Added jbig2 doc.go files. Applied unipdf guide style. * Minor code style changes. * Minor naming and style issues fixes. * Minor naming changes. Style issues fixed. * Review r11 fixes. * Added JBIG2 Encoder skeleton. * Moved Document and Page to jbig2/document package. Created decoder package responsible for decoding jbig2 stream. * Implemented raster functions. * Added raster uni low test funcitons. * Added raster low test functions * untracked files on jbig2-encoder: c869089 Added raster low test functions * index on jbig2-encoder: c869089 Added raster low test functions * Added morph files. * implemented jbig2 encoder basics * JBIG2 Encoder - Generic method * Added jbig2 image encode ttests, black/white image tests * cleaned and tested jbig2 package * unfinished jbig2 classified encoder * jbig2 minor style changes * minor jbig2 encoder changes * prepared JBIG2 Encoder * Style and lint fixes * Minor changes and lints * Fixed shift unsinged value build errors * Minor naming change * Added jbig2 encode, image gondels. Fixed jbig2 decode bug. * Provided jbig2 core.DecodeGlobals function. * Fixed JBIG2Encoder `r6` revision issues. * Removed public JBIG2Encoder document. * Minor style changes * added NewJBIG2Encoder function. * fixed JBIG2Encoder 'r9' revision issues. * Cleared 'r9' commented code. * Updated ACKNOWLEDGEMENETS. Fixed JBIG2Encoder 'r10' revision issues. Co-authored-by: Gunnsteinn Hall <gunnsteinn.hall@gmail.com>
204 lines
5.0 KiB
Go
204 lines
5.0 KiB
Go
/*
|
|
* This file is subject to the terms and conditions defined in
|
|
* file 'LICENSE.md', which is part of this source code package.
|
|
*/
|
|
|
|
package tests
|
|
|
|
import (
|
|
"archive/zip"
|
|
"bytes"
|
|
"crypto/md5"
|
|
"fmt"
|
|
"image"
|
|
"image/jpeg"
|
|
"os"
|
|
"path/filepath"
|
|
"strings"
|
|
"testing"
|
|
"time"
|
|
|
|
"github.com/stretchr/testify/assert"
|
|
"github.com/stretchr/testify/require"
|
|
|
|
"github.com/unidoc/unipdf/v3/common"
|
|
"github.com/unidoc/unipdf/v3/core"
|
|
)
|
|
|
|
// TestImageEncodeDecodeJBIG2 tests the encode and decode process for the JBIG2 encoder.
|
|
func TestImageEncodeDecodeJBIG2(t *testing.T) {
|
|
dirName := os.Getenv(EnvImageDirectory)
|
|
if dirName == "" {
|
|
t.Skipf("no environment variable: '%s' provided", EnvImageDirectory)
|
|
}
|
|
|
|
// get the file names within given directory
|
|
fileNames, err := readFileNames(dirName, "jpg")
|
|
require.NoError(t, err)
|
|
|
|
if len(fileNames) == 0 {
|
|
t.Skipf("no files found in the '%s' directory", dirName)
|
|
}
|
|
|
|
// prepare temporary directory where the jbig2 files would be stored
|
|
tempDir := filepath.Join(os.TempDir(), "unipdf", "jbig2", "encoded-decoded")
|
|
err = os.MkdirAll(tempDir, 0700)
|
|
require.NoError(t, err)
|
|
|
|
var f *os.File
|
|
switch {
|
|
case logToFile:
|
|
fileName := filepath.Join(tempDir, fmt.Sprintf("log_%s.txt", time.Now().Format("20060102")))
|
|
f, err = os.Create(fileName)
|
|
require.NoError(t, err)
|
|
common.SetLogger(common.NewWriterLogger(common.LogLevelTrace, f))
|
|
case testing.Verbose():
|
|
common.SetLogger(common.NewConsoleLogger(common.LogLevelDebug))
|
|
}
|
|
|
|
// clear all the temporary files
|
|
defer func() {
|
|
if f != nil {
|
|
f.Close()
|
|
}
|
|
|
|
switch {
|
|
case !keepImageFiles && !logToFile:
|
|
err = os.RemoveAll(filepath.Join(tempDir))
|
|
case !keepImageFiles:
|
|
err = filepath.Walk(tempDir, func(path string, info os.FileInfo, err error) error {
|
|
if err != nil {
|
|
return err
|
|
}
|
|
if strings.HasSuffix(info.Name(), "zip") {
|
|
return os.Remove(path)
|
|
}
|
|
return nil
|
|
})
|
|
}
|
|
if err != nil {
|
|
common.Log.Error(err.Error())
|
|
}
|
|
}()
|
|
|
|
defer func() {
|
|
if !keepImageFiles {
|
|
os.RemoveAll(tempDir)
|
|
}
|
|
}()
|
|
|
|
buf := &bytes.Buffer{}
|
|
h := md5.New()
|
|
edp := []goldenValuePair{}
|
|
for _, fileName := range fileNames {
|
|
// read the file
|
|
f, err := getFile(dirName, fileName)
|
|
require.NoError(t, err)
|
|
defer f.Close()
|
|
|
|
// try to read the file as image.
|
|
img, _, err := image.Decode(f)
|
|
if err != nil {
|
|
// if the image is of unknown decoding or is not an image skip the test.
|
|
common.Log.Debug("File: '%s' couldn't be read as an image")
|
|
continue
|
|
}
|
|
rawName := rawFileName(fileName)
|
|
|
|
t.Run(rawName, func(t *testing.T) {
|
|
zipFileName := filepath.Join(tempDir, rawName+".zip")
|
|
// create zip file containing encoded images
|
|
zf, err := os.Create(zipFileName)
|
|
require.NoError(t, err)
|
|
defer zf.Close()
|
|
|
|
// wrap zip writer over the file writer.
|
|
zw := zip.NewWriter(zf)
|
|
defer zw.Close()
|
|
|
|
// convert the input image into jbig2 1bpp acceptable binary image.
|
|
jimg, err := core.GoImageToJBIG2(img, core.JB2ImageAutoThreshold)
|
|
require.NoError(t, err)
|
|
|
|
// create the encoder
|
|
e := &core.JBIG2Encoder{}
|
|
err = e.AddPageImage(jimg, &core.JBIG2EncoderSettings{DuplicatedLinesRemoval: true, FileMode: true})
|
|
require.NoError(t, err)
|
|
|
|
data, err := e.Encode()
|
|
require.NoError(t, err)
|
|
|
|
if keepEncodedFile {
|
|
// create .jbig2 file within the zip file
|
|
jbf, err := zw.Create(rawName + ".jbig2")
|
|
require.NoError(t, err)
|
|
|
|
// write encoded data into jb2 file
|
|
_, err = jbf.Write(data)
|
|
require.NoError(t, err)
|
|
}
|
|
|
|
// create golang image and store it within zip file
|
|
bwImage, err := jimg.ToGoImage()
|
|
require.NoError(t, err)
|
|
|
|
buf.Reset()
|
|
|
|
// store the binary image in the 'jpeg' format.
|
|
err = jpeg.Encode(buf, bwImage, &jpeg.Options{Quality: jpeg.DefaultQuality})
|
|
require.NoError(t, err)
|
|
|
|
// write images if the flag is set to true
|
|
if keepImageFiles {
|
|
// create a jpeg file to show the black white image.
|
|
df, err := zw.Create(rawName + ".jpg")
|
|
require.NoError(t, err)
|
|
|
|
_, err = buf.WriteTo(df)
|
|
require.NoError(t, err)
|
|
}
|
|
h.Reset()
|
|
_, err = h.Write(buf.Bytes())
|
|
require.NoError(t, err)
|
|
|
|
hashOrig := h.Sum(nil)
|
|
|
|
// decode the encoded data and store it's results in the zipped file.
|
|
d := &core.JBIG2Encoder{}
|
|
decoded, err := d.DecodeImages(data)
|
|
require.NoError(t, err)
|
|
require.Len(t, decoded, 1)
|
|
|
|
// reset buffer
|
|
buf.Reset()
|
|
h.Reset()
|
|
|
|
// write the decoded image
|
|
err = jpeg.Encode(buf, decoded[0], &jpeg.Options{Quality: jpeg.DefaultQuality})
|
|
require.NoError(t, err)
|
|
|
|
_, err = h.Write(buf.Bytes())
|
|
require.NoError(t, err)
|
|
|
|
if keepImageFiles {
|
|
// create decoded image file within the zip file.
|
|
dimg, err := zw.Create(rawName + "_encdec.jpg")
|
|
require.NoError(t, err)
|
|
|
|
_, err = buf.WriteTo(dimg)
|
|
require.NoError(t, err)
|
|
}
|
|
|
|
hashEncoded := h.Sum(nil)
|
|
assert.True(t, bytes.Equal(hashOrig, hashEncoded))
|
|
|
|
edp = append(edp, goldenValuePair{
|
|
Filename: fileName,
|
|
Hash: hashEncoded,
|
|
})
|
|
})
|
|
}
|
|
const goldenFileName = "encoded-decoded"
|
|
checkGoldenValuePairs(t, dirName, goldenFileName, edp...)
|
|
}
|