mirror of
https://github.com/esimov/caire.git
synced 2025-09-26 20:41:14 +08:00
465 lines
12 KiB
Go
465 lines
12 KiB
Go
package caire
|
|
|
|
import (
|
|
"image"
|
|
"image/color"
|
|
"image/draw"
|
|
"math"
|
|
|
|
pigo "github.com/esimov/pigo/core"
|
|
)
|
|
|
|
// maxFaceDetAttempts defines the maximum number of attempts of face detections,
|
|
const maxFaceDetAttempts = 20
|
|
|
|
var (
|
|
usedSeams []UsedSeams
|
|
detAttempts int
|
|
)
|
|
|
|
// Carver is the main entry struct having as parameters the newly generated image width, height and seam points.
|
|
type Carver struct {
|
|
Width int
|
|
Height int
|
|
Points []float64
|
|
Seams []Seam
|
|
}
|
|
|
|
// Seam struct contains the seam pixel coordinates.
|
|
type Seam struct {
|
|
X int
|
|
Y int
|
|
}
|
|
|
|
// UsedSeams contains the already generated seams.
|
|
type UsedSeams struct {
|
|
ActiveSeam []ActiveSeam
|
|
}
|
|
|
|
// ActiveSeam contains the current seam position and color.
|
|
type ActiveSeam struct {
|
|
Seam
|
|
Pix color.Color
|
|
}
|
|
|
|
// NewCarver returns an initialized Carver structure.
|
|
func NewCarver(width, height int) *Carver {
|
|
return &Carver{
|
|
width,
|
|
height,
|
|
make([]float64, width*height),
|
|
nil,
|
|
}
|
|
}
|
|
|
|
// Get energy pixel value.
|
|
func (c *Carver) get(x, y int) float64 {
|
|
px := x + y*c.Width
|
|
return c.Points[px]
|
|
}
|
|
|
|
// Set energy pixel value.
|
|
func (c *Carver) set(x, y int, px float64) {
|
|
idx := x + y*c.Width
|
|
c.Points[idx] = px
|
|
}
|
|
|
|
// ComputeSeams compute the minimum energy level based on the following logic:
|
|
// - traverse the image from the second row to the last row
|
|
// and compute the cumulative minimum energy M for all possible
|
|
// connected seams for each entry (i, j).
|
|
//
|
|
// - the minimum energy level is calculated by summing up the current pixel value
|
|
// with the minimum pixel value of the neighboring pixels from the previous row.
|
|
func (c *Carver) ComputeSeams(p *Processor, img *image.NRGBA) error {
|
|
var srcImg *image.NRGBA
|
|
|
|
width, height := img.Bounds().Dx(), img.Bounds().Dy()
|
|
sobel := c.SobelDetector(img, float64(p.SobelThreshold))
|
|
|
|
if p.FaceDetect && detAttempts < maxFaceDetAttempts {
|
|
var ratio float64
|
|
|
|
if width < height {
|
|
ratio = float64(width) / float64(height)
|
|
} else {
|
|
ratio = float64(height) / float64(width)
|
|
}
|
|
minSize := float64(min(width, height)) * ratio / 3
|
|
|
|
// Transform the image to pixel array.
|
|
pixels := c.rgbToGrayscale(img)
|
|
|
|
cParams := pigo.CascadeParams{
|
|
MinSize: int(minSize),
|
|
MaxSize: min(width, height),
|
|
ShiftFactor: 0.1,
|
|
ScaleFactor: 1.1,
|
|
|
|
ImageParams: pigo.ImageParams{
|
|
Pixels: pixels,
|
|
Rows: height,
|
|
Cols: width,
|
|
Dim: width,
|
|
},
|
|
}
|
|
if p.vRes {
|
|
p.FaceAngle = 0.5
|
|
}
|
|
// Run the classifier over the obtained leaf nodes and return the detection results.
|
|
// The result contains quadruplets representing the row, column, scale and detection score.
|
|
faces := p.PigoFaceDetector.RunCascade(cParams, p.FaceAngle)
|
|
|
|
// Calculate the intersection over union (IoU) of two clusters.
|
|
faces = p.PigoFaceDetector.ClusterDetections(faces, 0.1)
|
|
|
|
if len(faces) == 0 {
|
|
// Retry detecting faces for a certain amount of time.
|
|
if detAttempts < maxFaceDetAttempts {
|
|
detAttempts++
|
|
}
|
|
} else {
|
|
detAttempts = 0
|
|
}
|
|
|
|
// Range over all the detected faces and draw a white rectangle mask over each of them.
|
|
// We need to trick the sobel detector to consider them as important image parts.
|
|
for _, face := range faces {
|
|
if face.Q > 5.0 {
|
|
rect := image.Rect(
|
|
face.Col-face.Scale/2,
|
|
face.Row-face.Scale/2,
|
|
face.Col+face.Scale/2,
|
|
face.Row+face.Scale/2,
|
|
)
|
|
draw.Draw(sobel, rect, &image.Uniform{color.RGBA{255, 255, 255, 255}}, image.ZP, draw.Src)
|
|
}
|
|
}
|
|
}
|
|
|
|
// Traverse the pixel data of the binary file used for protecting the regions
|
|
// which we do not want to be altered by the seam carver,
|
|
// obtain the white patches and apply it to the sobel image.
|
|
if len(p.MaskPath) > 0 && p.Mask != nil {
|
|
for x := 0; x < width; x++ {
|
|
for y := 0; y < height; y++ {
|
|
r, g, b, a := p.Mask.At(x, y).RGBA()
|
|
if r>>8 == 0xff && g>>8 == 0xff && b>>8 == 0xff {
|
|
sobel.Set(x, y, color.RGBA{
|
|
R: uint8(r >> 8),
|
|
G: uint8(g >> 8),
|
|
B: uint8(b >> 8),
|
|
A: uint8(a >> 8),
|
|
})
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
// Traverse the pixel data of the binary file used for protecting the regions
|
|
// we do not want to be altered by the seam carver, obtain the white patches,
|
|
// but this time inverse the colors to black and merge it back to the sobel image.
|
|
if len(p.RMaskPath) > 0 && p.RMask != nil {
|
|
dx, dy := p.RMask.Bounds().Max.X, p.RMask.Bounds().Max.Y
|
|
for x := 0; x < dx; x++ {
|
|
for y := 0; y < dy; y++ {
|
|
r, g, b, a := p.RMask.At(x, y).RGBA()
|
|
if r>>8 == 0xff && g>>8 == 0xff && b>>8 == 0xff {
|
|
sobel.Set(x, y, color.RGBA{
|
|
R: uint8(0x0 & r >> 8),
|
|
G: uint8(0x0 & g >> 8),
|
|
B: uint8(0x0 & b >> 8),
|
|
A: uint8(a >> 8),
|
|
})
|
|
} else {
|
|
sr, sg, sb, _ := sobel.At(x, y).RGBA()
|
|
r = uint32(min(int(sr>>8+sr>>8/2), 0xff))
|
|
g = uint32(min(int(sg>>8+sg>>8/2), 0xff))
|
|
b = uint32(min(int(sb>>8+sb>>8/2), 0xff))
|
|
|
|
sobel.Set(x, y, color.RGBA{
|
|
R: uint8(r),
|
|
G: uint8(g),
|
|
B: uint8(b),
|
|
A: uint8(a >> 8),
|
|
})
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
if p.BlurRadius > 0 {
|
|
srcImg = c.StackBlur(sobel, uint32(p.BlurRadius))
|
|
} else {
|
|
srcImg = sobel
|
|
}
|
|
|
|
for x := 0; x < c.Width; x++ {
|
|
for y := 0; y < c.Height; y++ {
|
|
r, _, _, a := srcImg.At(x, y).RGBA()
|
|
c.set(x, y, float64(r)/float64(a))
|
|
}
|
|
}
|
|
|
|
var left, middle, right float64
|
|
|
|
// Traverse the image from top to bottom and compute the minimum energy level.
|
|
// For each pixel in a row we compute the energy of the current pixel
|
|
// plus the energy of one of the three possible pixels above it.
|
|
for y := 1; y < c.Height; y++ {
|
|
for x := 1; x < c.Width-1; x++ {
|
|
left = c.get(x-1, y-1)
|
|
middle = c.get(x, y-1)
|
|
right = c.get(x+1, y-1)
|
|
min := math.Min(math.Min(left, middle), right)
|
|
// Set the minimum energy level.
|
|
c.set(x, y, c.get(x, y)+min)
|
|
}
|
|
// Special cases: pixels are far left or far right
|
|
left := c.get(0, y) + math.Min(c.get(0, y-1), c.get(1, y-1))
|
|
c.set(0, y, left)
|
|
right := c.get(0, y) + math.Min(c.get(c.Width-1, y-1), c.get(c.Width-2, y-1))
|
|
c.set(c.Width-1, y, right)
|
|
}
|
|
return nil
|
|
}
|
|
|
|
// FindLowestEnergySeams find the lowest vertical energy seam.
|
|
func (c *Carver) FindLowestEnergySeams() []Seam {
|
|
// Find the lowest cost seam from the energy matrix starting from the last row.
|
|
var (
|
|
min = math.MaxFloat64
|
|
px int
|
|
)
|
|
seams := make([]Seam, 0)
|
|
|
|
// Find the pixel on the last row with the minimum cumulative energy and use this as the starting pixel
|
|
for x := 0; x < c.Width; x++ {
|
|
seam := c.get(x, c.Height-1)
|
|
if seam < min {
|
|
min = seam
|
|
px = x
|
|
}
|
|
}
|
|
|
|
seams = append(seams, Seam{X: px, Y: c.Height - 1})
|
|
var left, middle, right float64
|
|
|
|
// Walk up in the matrix table, check the immediate three top pixel seam level
|
|
// and add the one which has the lowest cumulative energy.
|
|
for y := c.Height - 2; y >= 0; y-- {
|
|
middle = c.get(px, y)
|
|
// Leftmost seam, no child to the left
|
|
if px == 0 {
|
|
right = c.get(px+1, y)
|
|
if right < middle {
|
|
px++
|
|
}
|
|
// Rightmost seam, no child to the right
|
|
} else if px == c.Width-1 {
|
|
left = c.get(px-1, y)
|
|
if left < middle {
|
|
px--
|
|
}
|
|
} else {
|
|
left = c.get(px-1, y)
|
|
right = c.get(px+1, y)
|
|
min := math.Min(math.Min(left, middle), right)
|
|
|
|
if min == left {
|
|
px--
|
|
} else if min == right {
|
|
px++
|
|
}
|
|
}
|
|
seams = append(seams, Seam{X: px, Y: y})
|
|
}
|
|
return seams
|
|
}
|
|
|
|
// RemoveSeam remove the least important columns based on the stored energy (seams) level.
|
|
func (c *Carver) RemoveSeam(img *image.NRGBA, seams []Seam, debug bool) *image.NRGBA {
|
|
bounds := img.Bounds()
|
|
// Reduce the image width with one pixel on each iteration.
|
|
dst := image.NewNRGBA(image.Rect(0, 0, bounds.Dx()-1, bounds.Dy()))
|
|
|
|
for _, seam := range seams {
|
|
y := seam.Y
|
|
for x := 0; x < bounds.Max.X; x++ {
|
|
if seam.X == x {
|
|
if debug {
|
|
c.Seams = append(c.Seams, Seam{X: x, Y: y})
|
|
}
|
|
} else if seam.X < x {
|
|
dst.Set(x-1, y, img.At(x, y))
|
|
} else {
|
|
dst.Set(x, y, img.At(x, y))
|
|
}
|
|
}
|
|
}
|
|
return dst
|
|
}
|
|
|
|
// AddSeam add a new seam.
|
|
func (c *Carver) AddSeam(img *image.NRGBA, seams []Seam, debug bool) *image.NRGBA {
|
|
var (
|
|
currentSeam []ActiveSeam
|
|
lr, lg, lb uint32
|
|
rr, rg, rb uint32
|
|
py int
|
|
)
|
|
|
|
bounds := img.Bounds()
|
|
dst := image.NewNRGBA(image.Rect(0, 0, bounds.Dx()+1, bounds.Dy()))
|
|
|
|
for _, seam := range seams {
|
|
y := seam.Y
|
|
for x := 0; x < bounds.Max.X; x++ {
|
|
if seam.X == x {
|
|
if debug {
|
|
c.Seams = append(c.Seams, Seam{X: x, Y: y})
|
|
}
|
|
// Calculate the current seam pixel color by averaging the neighboring pixels color.
|
|
if y > 0 {
|
|
py = y - 1
|
|
} else {
|
|
py = y
|
|
}
|
|
|
|
if x > 0 {
|
|
lr, lg, lb, _ = img.At(x-1, py).RGBA()
|
|
} else {
|
|
lr, lg, lb, _ = img.At(x, y).RGBA()
|
|
}
|
|
|
|
if y < bounds.Max.Y-1 {
|
|
py = y + 1
|
|
} else {
|
|
py = y
|
|
}
|
|
|
|
if x < bounds.Max.X-1 {
|
|
rr, rg, rb, _ = img.At(x+1, py).RGBA()
|
|
} else {
|
|
rr, rg, rb, _ = img.At(x, y).RGBA()
|
|
}
|
|
avr, avg, avb := (lr+rr)/2, (lg+rg)/2, (lb+rb)/2
|
|
dst.Set(x, y, color.RGBA{uint8(avr >> 8), uint8(avg >> 8), uint8(avb >> 8), 255})
|
|
|
|
// Append the current seam position and color to the existing seams.
|
|
// To avoid picking the same optimal seam over and over again,
|
|
// each time we detect an optimal seam we assign a large positive value
|
|
// to the corresponding pixels in the energy map.
|
|
// We will increase the seams weight by duplicating the pixel value.
|
|
currentSeam = append(currentSeam,
|
|
ActiveSeam{Seam{x + 1, y},
|
|
color.RGBA{
|
|
R: uint8((avr + avr) >> 8),
|
|
G: uint8((avg + avg) >> 8),
|
|
B: uint8((avb + avb) >> 8),
|
|
A: 255,
|
|
},
|
|
})
|
|
} else if seam.X < x {
|
|
dst.Set(x, y, img.At(x-1, y))
|
|
dst.Set(x+1, y, img.At(x, y))
|
|
} else {
|
|
dst.Set(x, y, img.At(x, y))
|
|
}
|
|
}
|
|
}
|
|
usedSeams = append(usedSeams, UsedSeams{currentSeam})
|
|
return dst
|
|
}
|
|
|
|
// RotateImage90 rotate the image by 90 degree counter clockwise.
|
|
func (c *Carver) RotateImage90(src *image.NRGBA) *image.NRGBA {
|
|
b := src.Bounds()
|
|
dst := image.NewNRGBA(image.Rect(0, 0, b.Max.Y, b.Max.X))
|
|
for dstY := 0; dstY < b.Max.X; dstY++ {
|
|
for dstX := 0; dstX < b.Max.Y; dstX++ {
|
|
srcX := b.Max.X - dstY - 1
|
|
srcY := dstX
|
|
|
|
srcOff := srcY*src.Stride + srcX*4
|
|
dstOff := dstY*dst.Stride + dstX*4
|
|
copy(dst.Pix[dstOff:dstOff+4], src.Pix[srcOff:srcOff+4])
|
|
}
|
|
}
|
|
return dst
|
|
}
|
|
|
|
// RotateImage270 rotate the image by 270 degree counter clockwise.
|
|
func (c *Carver) RotateImage270(src *image.NRGBA) *image.NRGBA {
|
|
b := src.Bounds()
|
|
dst := image.NewNRGBA(image.Rect(0, 0, b.Max.Y, b.Max.X))
|
|
for dstY := 0; dstY < b.Max.X; dstY++ {
|
|
for dstX := 0; dstX < b.Max.Y; dstX++ {
|
|
srcX := dstY
|
|
srcY := b.Max.Y - dstX - 1
|
|
|
|
srcOff := srcY*src.Stride + srcX*4
|
|
dstOff := dstY*dst.Stride + dstX*4
|
|
copy(dst.Pix[dstOff:dstOff+4], src.Pix[srcOff:srcOff+4])
|
|
}
|
|
}
|
|
return dst
|
|
}
|
|
|
|
// imgToPix converts an image to a pixel array.
|
|
func (c *Carver) imgToPix(src *image.NRGBA) []uint8 {
|
|
bounds := src.Bounds()
|
|
pixels := make([]uint8, 0, bounds.Max.X*bounds.Max.Y*4)
|
|
|
|
for x := bounds.Min.X; x < bounds.Max.X; x++ {
|
|
for y := bounds.Min.Y; y < bounds.Max.Y; y++ {
|
|
r, g, b, _ := src.At(y, x).RGBA()
|
|
pixels = append(pixels, uint8(r>>8), uint8(g>>8), uint8(b>>8), 255)
|
|
}
|
|
}
|
|
return pixels
|
|
}
|
|
|
|
// pixToImage converts an array buffer to an image.
|
|
func (c *Carver) pixToImage(pixels []uint8) image.Image {
|
|
dst := image.NewNRGBA(image.Rect(0, 0, c.Width, c.Height))
|
|
bounds := dst.Bounds()
|
|
dx, dy := bounds.Max.X, bounds.Max.Y
|
|
col := color.NRGBA{
|
|
R: uint8(0),
|
|
G: uint8(0),
|
|
B: uint8(0),
|
|
A: uint8(255),
|
|
}
|
|
|
|
for x := bounds.Min.X; x < dx; x++ {
|
|
for y := bounds.Min.Y; y < dy*4; y += 4 {
|
|
col.R = uint8(pixels[y+x*dy*4])
|
|
col.G = uint8(pixels[y+x*dy*4+1])
|
|
col.B = uint8(pixels[y+x*dy*4+2])
|
|
col.A = uint8(pixels[y+x*dy*4+3])
|
|
|
|
dst.SetNRGBA(x, int(y/4), col)
|
|
}
|
|
}
|
|
return dst
|
|
}
|
|
|
|
// rgbToGrayscale converts the rgb pixel values to grayscale.
|
|
func (c *Carver) rgbToGrayscale(src *image.NRGBA) []uint8 {
|
|
width, height := src.Bounds().Dx(), src.Bounds().Dy()
|
|
gray := make([]uint8, width*height)
|
|
|
|
for y := 0; y < height; y++ {
|
|
for x := 0; x < width; x++ {
|
|
r, g, b, _ := src.At(x, y).RGBA()
|
|
gray[y*width+x] = uint8(
|
|
(0.299*float64(r) +
|
|
0.587*float64(g) +
|
|
0.114*float64(b)) / 256,
|
|
)
|
|
}
|
|
}
|
|
return gray
|
|
}
|