Files
caire/process.go

397 lines
11 KiB
Go

package caire
import (
"embed"
"fmt"
"image"
"image/color"
"image/color/palette"
"image/draw"
"image/gif"
"image/jpeg"
"image/png"
"io"
"math"
"os"
"path/filepath"
"github.com/disintegration/imaging"
pigo "github.com/esimov/pigo/core"
"github.com/pkg/errors"
"golang.org/x/image/bmp"
)
// classifier holds the embedded cascade file; Process reads it back under the
// name "data/facefinder" when the FaceDetect option is enabled.
//
//go:embed data/facefinder
var classifier embed.FS
// Package-level state shared by Process, Resize and the GIF helpers.
var (
	// g collects the frames of the GIF currently being generated.
	g *gif.GIF

	// xCount and yCount are incremented by Resize after horizontal and
	// vertical seam removals; encodeImageToGif subtracts them from the frame
	// size.
	xCount, yCount int

	// isGif reports whether the current output is a GIF, in which case every
	// removed seam produces an additional frame.
	isGif bool
)
// SeamCarver is satisfied by every type that exposes a Resize method with the
// signature below. The package-level Resize function accepts any SeamCarver
// and delegates the work to it.
type SeamCarver interface {
	// Resize rescales img and returns the resulting image, or an error when
	// the operation cannot be completed.
	Resize(img *image.NRGBA) (image.Image, error)
}
// Processor bundles the options that drive a resize operation.
type Processor struct {
	// SobelThreshold and BlurRadius are not read in this file; they are
	// handed to the carver together with the rest of the Processor.
	// NOTE(review): presumably edge-detection and blur settings — confirm
	// against the carver implementation.
	SobelThreshold, BlurRadius int

	// NewWidth and NewHeight are the requested dimensions. A value of zero
	// leaves the corresponding axis untouched. When Percentage is set they
	// are interpreted as percentages of the original size.
	NewWidth, NewHeight int

	// Percentage switches NewWidth and NewHeight from absolute to relative
	// (percentage) values.
	Percentage bool

	// Square resizes the image to a square based on its shortest edge.
	Square bool

	// Debug is forwarded to the seam removal and insertion routines.
	Debug bool

	// FaceDetect makes Process load the embedded cascade classifier.
	FaceDetect bool

	// FaceAngle is not referenced in this file.
	// NOTE(review): presumably the rotation angle used during face
	// detection — confirm against the carver implementation.
	FaceAngle float64

	// PigoFaceDetector is the face detector instance; Process replaces it on
	// every call.
	PigoFaceDetector *pigo.Pigo
}
// Resize is a thin convenience wrapper: it invokes the Resize method of the
// supplied SeamCarver on img and hands the outcome back unchanged.
func Resize(s SeamCarver, img *image.NRGBA) (image.Image, error) {
	resized, err := s.Resize(img)
	return resized, err
}
// Resize rescales img using the seam carving algorithm and the options
// stored in p, and returns the resulting image.
//
// Two modes are supported:
//   - When Percentage or Square is set, seams are removed first along the
//     width and then along the height (the image is rotated by 90 degrees for
//     the vertical pass and rotated back afterwards).
//   - Otherwise, when a non-zero NewWidth and/or NewHeight is requested, the
//     image is first rescaled proportionally and only the remaining
//     difference is carved away (reduced) or filled in (enlarged).
//
// When none of the options asks for a change, img is returned untouched.
// An error is returned when computing the seams fails, or when the size
// requested in percentage mode is rejected.
//
// Resize resets the package-level seam counters and, while GIF output is
// active, appends one frame per removed seam to the package-level GIF.
func (p *Processor) Resize(img *image.NRGBA) (image.Image, error) {
	c := NewCarver(img.Bounds().Dx(), img.Bounds().Dy())

	// seamCount returns how many seams separate the current size from the
	// target size along one axis. A target of zero means "leave this axis
	// alone" and therefore yields zero.
	seamCount := func(target, current int) int {
		switch {
		case target == 0:
			return 0
		case target > current:
			return target - current
		default:
			return current - target
		}
	}

	var (
		newImg image.Image
		pw, ph int
	)
	newWidth := seamCount(p.NewWidth, c.Width)
	newHeight := seamCount(p.NewHeight, c.Height)

	xCount, yCount = 0, 0

	// reduce removes a single lowest-energy seam from img. The carver is
	// recreated on every call because the image shrinks with each seam.
	reduce := func() error {
		width, height := img.Bounds().Max.X, img.Bounds().Max.Y
		c = NewCarver(width, height)
		if err := c.ComputeSeams(img, p); err != nil {
			return err
		}
		seams := c.FindLowestEnergySeams()
		img = c.RemoveSeam(img, seams, p.Debug)

		if isGif {
			g = encodeImageToGif(img)
		}
		return nil
	}

	// enlarge inserts a single seam into img along the lowest-energy path.
	enlarge := func() error {
		width, height := img.Bounds().Max.X, img.Bounds().Max.Y
		c = NewCarver(width, height)
		if err := c.ComputeSeams(img, p); err != nil {
			return err
		}
		seams := c.FindLowestEnergySeams()
		img = c.AddSeam(img, seams, p.Debug)
		return nil
	}

	if p.Percentage || p.Square {
		// When square option is used the image will be resized to a square based on the shortest edge.
		pw = c.Width - c.Height
		ph = c.Height - c.Width

		// In case pw and ph is zero, it means that the target image is square.
		// In this case we don't have to apply the seam carving algorithm, we can simply resize the image.
		// NOTE(review): this shortcut is also taken in percentage mode, where
		// NewWidth holds a percentage rather than a pixel size — confirm.
		if pw == 0 && ph == 0 {
			return imaging.Resize(img, p.NewWidth, 0, imaging.Lanczos), nil
		}

		if p.Square {
			// Scale the image down to the smaller of the two requested sizes
			// before carving the longer edge.
			if p.NewWidth < p.NewHeight {
				newImg = imaging.Resize(img, p.NewWidth, 0, imaging.Lanczos)
			} else {
				newImg = imaging.Resize(img, p.NewHeight, 0, imaging.Lanczos)
			}

			dst := image.NewNRGBA(newImg.Bounds())
			draw.Draw(dst, newImg.Bounds(), newImg, image.Point{}, draw.Src)
			img = dst

			// Only the longer edge needs to be carved to obtain a square.
			nw, nh := img.Bounds().Dx(), img.Bounds().Dy()
			if nw > nh {
				pw = nw - nh
				ph = 0
			} else {
				ph = nh - nw
				pw = 0
			}
		}

		if p.Percentage {
			// Calculate new sizes based on provided percentage.
			pw = c.Width - int(float64(c.Width)-(float64(p.NewWidth)/100*float64(c.Width)))
			ph = c.Height - int(float64(c.Height)-(float64(p.NewHeight)/100*float64(c.Height)))

			if pw > newWidth || ph > newHeight {
				return nil, errors.New("the generated image size should be less than the original image size")
			}
		}

		// Reduce image size horizontally
		for x := 0; x < pw; x++ {
			if err := reduce(); err != nil {
				return nil, err
			}
			xCount++
		}

		// Reduce image size vertically
		img = c.RotateImage90(img)
		for y := 0; y < ph; y++ {
			if err := reduce(); err != nil {
				return nil, err
			}
			yCount++
		}
		img = c.RotateImage270(img)
	} else if newWidth > 0 || newHeight > 0 {
		// We are trying to rescale the image proportionally prior resizing.
		// First the image is scaled down or up by preserving the image aspect ratio,
		// then the seam carving algorithm is applied only to the remaining pixels.

		// Scale the width and height by the smaller factor (i.e Min(wScaleFactor, hScaleFactor))
		// Example: input: 5000x2500, scale: 2160x1080, final target: 1920x1080
		// A zero target produces an infinite factor here, which math.Min
		// discards in favour of the other axis.
		wScaleFactor := float64(c.Width) / float64(p.NewWidth)
		hScaleFactor := float64(c.Height) / float64(p.NewHeight)
		scaleWidth := math.Round(float64(c.Width) / math.Min(wScaleFactor, hScaleFactor))
		scaleHeight := math.Round(float64(c.Height) / math.Min(wScaleFactor, hScaleFactor))

		newImg = imaging.Resize(img, int(scaleWidth), int(scaleHeight), imaging.Lanczos)

		// NOTE(review): dy0 is read from newImg rather than img, so dy0 == dy1
		// always holds and the NewHeight == 0 clause below is always true.
		// Left as is because changing it alters which images get prescaled —
		// confirm the intent before touching it.
		dx0, dy0 := img.Bounds().Max.X, newImg.Bounds().Max.Y
		dx1, dy1 := newImg.Bounds().Max.X, newImg.Bounds().Max.Y

		// Rescale the image only when it's resized both horizontally and vertically
		// and the new image width or height are preserved, otherwise it might happen, that
		// the generated image size does not match with the requested image size.
		if !((p.NewWidth == 0 && dx0 == dx1) || (p.NewHeight == 0 && dy0 == dy1)) {
			// The amount needed to remove by carving. One or both of these will be 0.
			newWidth = int(scaleWidth) - p.NewWidth
			newHeight = int(scaleHeight) - p.NewHeight

			dst := image.NewNRGBA(newImg.Bounds())
			draw.Draw(dst, newImg.Bounds(), newImg, image.Point{}, draw.Src)
			img = dst
		}

		// Run the carver function if the desired image width is not identical with the rescaled image width.
		if newWidth > 0 && newWidth != img.Bounds().Max.X {
			// Because of scaling horizontally and vertically at the same time it might happen
			// that the scaled image exceeds the desired image size, we need to make sure
			// that the new width and|or height is reduced and not enlarged.
			if p.NewWidth > c.Width && img.Bounds().Max.X < p.NewWidth {
				for x := 0; x < newWidth; x++ {
					if err := enlarge(); err != nil {
						return nil, err
					}
				}
			} else {
				for x := 0; x < newWidth; x++ {
					if err := reduce(); err != nil {
						return nil, err
					}
					xCount++
				}
			}
		}

		// Run the carver function if the desired image height is not identical with the rescaled image height.
		if newHeight > 0 && newHeight != img.Bounds().Max.Y {
			img = c.RotateImage90(img)

			// Check new height against the width of the image because the image is rotated 90deg.
			if p.NewHeight > c.Height && img.Bounds().Max.X < p.NewHeight {
				for y := 0; y < newHeight; y++ {
					if err := enlarge(); err != nil {
						return nil, err
					}
				}
			} else {
				// NOTE(review): unlike the horizontal pass above, yCount is not
				// incremented here — confirm whether that is intentional.
				for y := 0; y < newHeight; y++ {
					if err := reduce(); err != nil {
						return nil, err
					}
				}
			}
			img = c.RotateImage270(img)
		}
	}
	return img, nil
}
// Process decodes an image from r, resizes it according to the options in p
// and encodes the result into w.
//
// The output format is derived from w: when w is an *os.File, the file
// extension selects JPEG ("", ".jpg", ".jpeg"), PNG (".png"), BMP (".bmp") or
// GIF (".gif"); any other extension is rejected with an error. Every other
// kind of writer receives a JPEG. Extensions are matched case-sensitively.
//
// For GIF output the frames collected during the resize are written to the
// file by name through writeGifToFile instead of through w.
//
// Process replaces p.PigoFaceDetector and resets the package-level GIF state
// on every call.
func (p *Processor) Process(r io.Reader, w io.Writer) error {
	// Instantiate a new Pigo object in case the face detection option is used.
	p.PigoFaceDetector = pigo.NewPigo()

	if p.FaceDetect {
		cascadeFile, err := classifier.ReadFile("data/facefinder")
		if err != nil {
			return fmt.Errorf("error reading the cascade file: %w", err)
		}

		// Unpack the binary file. This will return the number of cascade trees,
		// the tree depth, the threshold and the prediction from tree's leaf nodes.
		p.PigoFaceDetector, err = p.PigoFaceDetector.Unpack(cascadeFile)
		if err != nil {
			return fmt.Errorf("error unpacking the cascade file: %w", err)
		}
	}

	g = new(gif.GIF)

	src, _, err := image.Decode(r)
	if err != nil {
		return err
	}
	img := imgToNRGBA(src)

	// Only files carry an extension hint; every other writer is treated like
	// a file without extension and therefore gets a JPEG.
	var ext string
	file, isFile := w.(*os.File)
	if isFile {
		ext = filepath.Ext(file.Name())
	}

	// Validate the format before resizing so that unsupported outputs fail
	// fast, and reset the GIF flag so an earlier GIF run cannot leak into
	// this one.
	switch ext {
	case "", ".jpg", ".jpeg", ".png", ".bmp":
		isGif = false
	case ".gif":
		isGif = true
	default:
		return errors.New("unsupported image format")
	}

	res, err := Resize(p, img)
	if err != nil {
		return err
	}

	switch ext {
	case ".png":
		return png.Encode(w, res)
	case ".bmp":
		return bmp.Encode(w, res)
	case ".gif":
		// The resized image itself is not used: the GIF is assembled from
		// the frames gathered while the seams were removed.
		return writeGifToFile(file.Name())
	default:
		return jpeg.Encode(w, res, &jpeg.Options{Quality: 100})
	}
}
// imgToNRGBA converts any image type to *image.NRGBA with min-point at (0, 0).
//
// An *image.NRGBA that already starts at the origin is returned as is, without
// copying. Every other image is copied into a newly allocated NRGBA image of
// the same size, with dedicated fast paths for *image.NRGBA and *image.YCbCr
// sources and a generic per-pixel conversion for everything else.
func imgToNRGBA(img image.Image) *image.NRGBA {
	srcBounds := img.Bounds()
	if srcBounds.Min.X == 0 && srcBounds.Min.Y == 0 {
		if src0, ok := img.(*image.NRGBA); ok {
			return src0
		}
	}

	srcMinX := srcBounds.Min.X
	srcMinY := srcBounds.Min.Y

	dstBounds := srcBounds.Sub(srcBounds.Min)
	dstW := dstBounds.Dx()
	dstH := dstBounds.Dy()
	dst := image.NewNRGBA(dstBounds)

	switch src := img.(type) {
	case *image.NRGBA:
		// Same pixel layout on both sides: copy each row exactly once.
		rowSize := dstW * 4
		for dstY := 0; dstY < dstH; dstY++ {
			di := dst.PixOffset(0, dstY)
			si := src.PixOffset(srcMinX, srcMinY+dstY)
			copy(dst.Pix[di:di+rowSize], src.Pix[si:si+rowSize])
		}

	case *image.YCbCr:
		for dstY := 0; dstY < dstH; dstY++ {
			di := dst.PixOffset(0, dstY)
			for dstX := 0; dstX < dstW; dstX++ {
				srcX := srcMinX + dstX
				srcY := srcMinY + dstY
				siy := src.YOffset(srcX, srcY)
				sic := src.COffset(srcX, srcY)
				// Named red/green/blue so the package-level g is not shadowed.
				red, green, blue := color.YCbCrToRGB(src.Y[siy], src.Cb[sic], src.Cr[sic])
				dst.Pix[di+0] = red
				dst.Pix[di+1] = green
				dst.Pix[di+2] = blue
				dst.Pix[di+3] = 0xff // YCbCr images carry no alpha channel.
				di += 4
			}
		}

	default:
		for dstY := 0; dstY < dstH; dstY++ {
			di := dst.PixOffset(0, dstY)
			for dstX := 0; dstX < dstW; dstX++ {
				c := color.NRGBAModel.Convert(img.At(srcMinX+dstX, srcMinY+dstY)).(color.NRGBA)
				dst.Pix[di+0] = c.R
				dst.Pix[di+1] = c.G
				dst.Pix[di+2] = c.B
				dst.Pix[di+3] = c.A
				di += 4
			}
		}
	}

	return dst
}
// encodeImageToGif converts src into a paletted frame (Plan9 palette), appends
// it with a zero delay to the package-level GIF and returns that GIF.
// The frame is smaller than src by the current xCount and yCount values.
func encodeImageToGif(src image.Image) *gif.GIF {
	size := src.Bounds().Size()
	frame := image.NewPaletted(
		image.Rect(0, 0, size.X-xCount, size.Y-yCount),
		palette.Plan9,
	)
	// Drawing is clipped to the frame, so pixels of src that fall outside of
	// it are dropped.
	draw.Draw(frame, src.Bounds(), src, image.Point{}, draw.Src)

	g.Delay = append(g.Delay, 0)
	g.Image = append(g.Image, frame)
	return g
}
// writeGifToFile encodes the package-level GIF into the file at path, creating
// the file or truncating it when it already exists.
//
// It returns the first error hit while creating, encoding or closing the
// file. The close error is reported as well, because a failed close on a
// written file can mean the data never reached the disk.
func writeGifToFile(path string) (err error) {
	f, err := os.Create(path)
	if err != nil {
		return err
	}
	defer func() {
		// Keep an earlier encoding error; otherwise surface the close error.
		if cerr := f.Close(); err == nil {
			err = cerr
		}
	}()
	return gif.EncodeAll(f, g)
}