935 lines
31 KiB
Nim
935 lines
31 KiB
Nim
import blends, bumpy, chroma, common, masks, pixie/internal, system/memory, vmath
|
|
|
|
when defined(amd64) and not defined(pixieNoSimd):
|
|
import nimsimd/sse2
|
|
|
|
const h = 0.5.float32
|
|
|
|
type
|
|
Image* = ref object
|
|
## Image object that holds bitmap data in RGBA format.
|
|
width*, height*: int
|
|
data*: seq[ColorRGBX]
|
|
|
|
when defined(release):
|
|
{.push checks: off.}
|
|
|
|
proc newImage*(width, height: int): Image {.raises: [PixieError].} =
|
|
## Creates a new image with the parameter dimensions.
|
|
if width <= 0 or height <= 0:
|
|
raise newException(PixieError, "Image width and height must be > 0")
|
|
|
|
result = Image()
|
|
result.width = width
|
|
result.height = height
|
|
result.data = newSeq[ColorRGBX](width * height)
|
|
|
|
proc newImage*(mask: Mask): Image {.raises: [PixieError].} =
|
|
result = newImage(mask.width, mask.height)
|
|
var i: int
|
|
when defined(amd64) and not defined(pixieNoSimd):
|
|
for _ in countup(0, mask.data.len - 16, 4):
|
|
var alphas = unpackAlphaValues(mm_loadu_si128(mask.data[i].addr))
|
|
alphas = mm_or_si128(alphas, mm_srli_epi32(alphas, 8))
|
|
alphas = mm_or_si128(alphas, mm_srli_epi32(alphas, 16))
|
|
mm_storeu_si128(result.data[i].addr, alphas)
|
|
i += 4
|
|
|
|
for i in i ..< mask.data.len:
|
|
let v = mask.data[i]
|
|
result.data[i] = rgbx(v, v, v, v)
|
|
|
|
proc copy*(image: Image): Image {.raises: [PixieError].} =
|
|
## Copies the image data into a new image.
|
|
result = newImage(image.width, image.height)
|
|
result.data = image.data
|
|
|
|
proc `$`*(image: Image): string {.raises: [].} =
|
|
## Prints the image size.
|
|
"<Image " & $image.width & "x" & $image.height & ">"
|
|
|
|
proc inside*(image: Image, x, y: int): bool {.inline, raises: [].} =
|
|
## Returns true if (x, y) is inside the image.
|
|
x >= 0 and x < image.width and y >= 0 and y < image.height
|
|
|
|
proc dataIndex*(image: Image, x, y: int): int {.inline, raises: [].} =
|
|
image.width * y + x
|
|
|
|
proc getRgbaUnsafe*(image: Image, x, y: int): ColorRGBX {.inline, raises: [].} =
|
|
## Gets a color from (x, y) coordinates.
|
|
## * No bounds checking *
|
|
## Make sure that x, y are in bounds.
|
|
## Failure in the assumptions will case unsafe memory reads.
|
|
result = image.data[image.width * y + x]
|
|
|
|
proc `[]`*(image: Image, x, y: int): ColorRGBX {.inline, raises: [].} =
|
|
## Gets a pixel at (x, y) or returns transparent black if outside of bounds.
|
|
if image.inside(x, y):
|
|
return image.getRgbaUnsafe(x, y)
|
|
|
|
proc getColor*(image: Image, x, y: int): Color {.inline, raises: [].} =
|
|
## Gets a color at (x, y) or returns transparent black if outside of bounds.
|
|
image[x, y].color()
|
|
|
|
proc setRgbaUnsafe*(
|
|
image: Image, x, y: int, color: SomeColor
|
|
) {.inline, raises: [].} =
|
|
## Sets a color from (x, y) coordinates.
|
|
## * No bounds checking *
|
|
## Make sure that x, y are in bounds.
|
|
## Failure in the assumptions will case unsafe memory writes.
|
|
image.data[image.dataIndex(x, y)] = color.asRgbx()
|
|
|
|
proc `[]=`*(image: Image, x, y: int, color: SomeColor) {.inline, raises: [].} =
|
|
## Sets a pixel at (x, y) or does nothing if outside of bounds.
|
|
if image.inside(x, y):
|
|
image.setRgbaUnsafe(x, y, color.asRgbx())
|
|
|
|
proc setColor*(image: Image, x, y: int, color: Color) {.inline, raises: [].} =
|
|
## Sets a color at (x, y) or does nothing if outside of bounds.
|
|
image[x, y] = color.rgbx()
|
|
|
|
proc fillUnsafe*(
|
|
data: var seq[ColorRGBX], color: SomeColor, start, len: int
|
|
) {.raises: [].} =
|
|
## Fills the image data with the parameter color starting at index start and
|
|
## continuing for len indices.
|
|
|
|
let rgbx = color.asRgbx()
|
|
|
|
# Use memset when every byte has the same value
|
|
if rgbx.r == rgbx.g and rgbx.r == rgbx.b and rgbx.r == rgbx.a:
|
|
nimSetMem(data[start].addr, rgbx.r.cint, len * 4)
|
|
else:
|
|
var i = start
|
|
when defined(amd64) and not defined(pixieNoSimd):
|
|
# When supported, SIMD fill until we run out of room
|
|
let m = mm_set1_epi32(cast[int32](rgbx))
|
|
for j in countup(i, start + len - 8, 8):
|
|
mm_storeu_si128(data[j].addr, m)
|
|
mm_storeu_si128(data[j + 4].addr, m)
|
|
i += 8
|
|
else:
|
|
when sizeof(int) == 8:
|
|
# Fill 8 bytes at a time when possible
|
|
let
|
|
u32 = cast[uint32](rgbx)
|
|
u64 = cast[uint64]([u32, u32])
|
|
for j in countup(i, start + len - 2, 2):
|
|
cast[ptr uint64](data[j].addr)[] = u64
|
|
i += 2
|
|
# Fill whatever is left the slow way
|
|
for j in i ..< start + len:
|
|
data[j] = rgbx
|
|
|
|
proc fill*(image: Image, color: SomeColor) {.inline, raises: [].} =
|
|
## Fills the image with the parameter color.
|
|
fillUnsafe(image.data, color, 0, image.data.len)
|
|
|
|
proc isOneColor*(image: Image): bool {.raises: [].} =
|
|
## Checks if the entire image is the same color.
|
|
result = true
|
|
|
|
let color = image.getRgbaUnsafe(0, 0)
|
|
|
|
var i: int
|
|
when defined(amd64) and not defined(pixieNoSimd):
|
|
let colorVec = mm_set1_epi32(cast[int32](color))
|
|
for j in countup(0, image.data.len - 8, 8):
|
|
let
|
|
values0 = mm_loadu_si128(image.data[j].addr)
|
|
values1 = mm_loadu_si128(image.data[j + 4].addr)
|
|
mask0 = mm_movemask_epi8(mm_cmpeq_epi8(values0, colorVec))
|
|
mask1 = mm_movemask_epi8(mm_cmpeq_epi8(values1, colorVec))
|
|
if mask0 != uint16.high.int or mask1 != uint16.high.int:
|
|
return false
|
|
i += 8
|
|
|
|
for j in i ..< image.data.len:
|
|
if image.data[j] != color:
|
|
return false
|
|
|
|
proc isTransparent*(image: Image): bool {.raises: [].} =
|
|
## Checks if this image is fully transparent or not.
|
|
result = true
|
|
|
|
var i: int
|
|
when defined(amd64) and not defined(pixieNoSimd):
|
|
let transparent = mm_setzero_si128()
|
|
for j in countup(0, image.data.len - 16, 16):
|
|
let
|
|
values0 = mm_loadu_si128(image.data[j].addr)
|
|
values1 = mm_loadu_si128(image.data[j + 4].addr)
|
|
values2 = mm_loadu_si128(image.data[j + 8].addr)
|
|
values3 = mm_loadu_si128(image.data[j + 12].addr)
|
|
values01 = mm_or_si128(values0, values1)
|
|
values23 = mm_or_si128(values2, values3)
|
|
values = mm_or_si128(values01, values23)
|
|
mask = mm_movemask_epi8(mm_cmpeq_epi8(values, transparent))
|
|
if mask != uint16.high.int:
|
|
return false
|
|
i += 16
|
|
|
|
for j in i ..< image.data.len:
|
|
if image.data[j].a != 0:
|
|
return false
|
|
|
|
proc flipHorizontal*(image: Image) {.raises: [].} =
|
|
## Flips the image around the Y axis.
|
|
let w = image.width div 2
|
|
for y in 0 ..< image.height:
|
|
for x in 0 ..< w:
|
|
let
|
|
rgba1 = image.getRgbaUnsafe(x, y)
|
|
rgba2 = image.getRgbaUnsafe(image.width - x - 1, y)
|
|
image.setRgbaUnsafe(image.width - x - 1, y, rgba1)
|
|
image.setRgbaUnsafe(x, y, rgba2)
|
|
|
|
proc flipVertical*(image: Image) {.raises: [].} =
|
|
## Flips the image around the X axis.
|
|
let h = image.height div 2
|
|
for y in 0 ..< h:
|
|
for x in 0 ..< image.width:
|
|
let
|
|
rgba1 = image.getRgbaUnsafe(x, y)
|
|
rgba2 = image.getRgbaUnsafe(x, image.height - y - 1)
|
|
image.setRgbaUnsafe(x, image.height - y - 1, rgba1)
|
|
image.setRgbaUnsafe(x, y, rgba2)
|
|
|
|
proc subImage*(image: Image, x, y, w, h: int): Image {.raises: [PixieError].} =
|
|
## Gets a sub image from this image.
|
|
if x < 0 or x + w > image.width:
|
|
raise newException(
|
|
PixieError,
|
|
"Params x: " & $x & " w: " & $w & " invalid, image width is " & $image.width
|
|
)
|
|
if y < 0 or y + h > image.height:
|
|
raise newException(
|
|
PixieError,
|
|
"Params y: " & $y & " h: " & $h & " invalid, image height is " & $image.height
|
|
)
|
|
|
|
result = newImage(w, h)
|
|
for y2 in 0 ..< h:
|
|
copyMem(
|
|
result.data[result.dataIndex(0, y2)].addr,
|
|
image.data[image.dataIndex(x, y + y2)].addr,
|
|
w * 4
|
|
)
|
|
|
|
proc diff*(master, image: Image): (float32, Image) {.raises: [PixieError].} =
|
|
## Compares the parameters and returns a score and image of the difference.
|
|
let
|
|
w = max(master.width, image.width)
|
|
h = max(master.height, image.height)
|
|
diffImage = newImage(w, h)
|
|
|
|
var
|
|
diffScore = 0
|
|
diffTotal = 0
|
|
for x in 0 ..< w:
|
|
for y in 0 ..< h:
|
|
let
|
|
m = master[x, y]
|
|
u = image[x, y]
|
|
diff = (m.r.int - u.r.int) + (m.g.int - u.g.int) + (m.b.int - u.b.int)
|
|
var c: ColorRGBX
|
|
c.r = abs(m.a.int - u.a.int).clamp(0, 255).uint8
|
|
c.g = diff.clamp(0, 255).uint8
|
|
c.b = (-diff).clamp(0, 255).uint8
|
|
c.a = 255
|
|
diffImage.setRgbaUnsafe(x, y, c)
|
|
diffScore += abs(m.r.int - u.r.int) +
|
|
abs(m.g.int - u.g.int) +
|
|
abs(m.b.int - u.b.int) +
|
|
abs(m.a.int - u.a.int)
|
|
diffTotal += 255 * 4
|
|
|
|
(100 * diffScore.float32 / diffTotal.float32, diffImage)
|
|
|
|
proc minifyBy2*(image: Image, power = 1): Image {.raises: [PixieError].} =
|
|
## Scales the image down by an integer scale.
|
|
if power < 0:
|
|
raise newException(PixieError, "Cannot minifyBy2 with negative power")
|
|
if power == 0:
|
|
return image.copy()
|
|
|
|
var src = image
|
|
for _ in 1 .. power:
|
|
result = newImage(src.width div 2, src.height div 2)
|
|
for y in 0 ..< result.height:
|
|
var x: int
|
|
when defined(amd64) and not defined(pixieNoSimd):
|
|
let
|
|
oddMask = mm_set1_epi16(cast[int16](0xff00))
|
|
first32 = cast[M128i]([uint32.high, 0, 0, 0])
|
|
for _ in countup(0, result.width - 4, 2):
|
|
let
|
|
top = mm_loadu_si128(src.data[src.dataIndex(x * 2, y * 2 + 0)].addr)
|
|
btm = mm_loadu_si128(src.data[src.dataIndex(x * 2, y * 2 + 1)].addr)
|
|
topShifted = mm_srli_si128(top, 4)
|
|
btmShifted = mm_srli_si128(btm, 4)
|
|
|
|
topEven = mm_andnot_si128(oddMask, top)
|
|
topOdd = mm_srli_epi16(mm_and_si128(top, oddMask), 8)
|
|
btmEven = mm_andnot_si128(oddMask, btm)
|
|
btmOdd = mm_srli_epi16(mm_and_si128(btm, oddMask), 8)
|
|
|
|
topShiftedEven = mm_andnot_si128(oddMask, topShifted)
|
|
topShiftedOdd = mm_srli_epi16(mm_and_si128(topShifted, oddMask), 8)
|
|
btmShiftedEven = mm_andnot_si128(oddMask, btmShifted)
|
|
btmShiftedOdd = mm_srli_epi16(mm_and_si128(btmShifted, oddMask), 8)
|
|
|
|
topAddedEven = mm_add_epi16(topEven, topShiftedEven)
|
|
btmAddedEven = mm_add_epi16(btmEven, btmShiftedEven)
|
|
topAddedOdd = mm_add_epi16(topOdd, topShiftedOdd)
|
|
bottomAddedOdd = mm_add_epi16(btmOdd, btmShiftedOdd)
|
|
|
|
addedEven = mm_add_epi16(topAddedEven, btmAddedEven)
|
|
addedOdd = mm_add_epi16(topAddedOdd, bottomAddedOdd)
|
|
|
|
addedEvenDiv4 = mm_srli_epi16(addedEven, 2)
|
|
addedOddDiv4 = mm_srli_epi16(addedOdd, 2)
|
|
|
|
merged = mm_or_si128(addedEvenDiv4, mm_slli_epi16(addedOddDiv4, 8))
|
|
|
|
# merged [0, 1, 2, 3] has the correct values for the next two pixels
|
|
# at index 0 and 2 so shift those into position and store
|
|
|
|
zero = mm_and_si128(merged, first32)
|
|
two = mm_and_si128(mm_srli_si128(merged, 8), first32)
|
|
zeroTwo = mm_or_si128(zero, mm_slli_si128(two, 4))
|
|
|
|
mm_storeu_si128(result.data[result.dataIndex(x, y)].addr, zeroTwo)
|
|
x += 2
|
|
|
|
for x in x ..< result.width:
|
|
let
|
|
a = src.getRgbaUnsafe(x * 2 + 0, y * 2 + 0)
|
|
b = src.getRgbaUnsafe(x * 2 + 1, y * 2 + 0)
|
|
c = src.getRgbaUnsafe(x * 2 + 1, y * 2 + 1)
|
|
d = src.getRgbaUnsafe(x * 2 + 0, y * 2 + 1)
|
|
rgba = rgbx(
|
|
((a.r.uint32 + b.r + c.r + d.r) div 4).uint8,
|
|
((a.g.uint32 + b.g + c.g + d.g) div 4).uint8,
|
|
((a.b.uint32 + b.b + c.b + d.b) div 4).uint8,
|
|
((a.a.uint32 + b.a + c.a + d.a) div 4).uint8
|
|
)
|
|
|
|
result.setRgbaUnsafe(x, y, rgba)
|
|
|
|
# Set src as this result for if we do another power
|
|
src = result
|
|
|
|
proc magnifyBy2*(image: Image, power = 1): Image {.raises: [PixieError].} =
|
|
## Scales image up by 2 ^ power.
|
|
if power < 0:
|
|
raise newException(PixieError, "Cannot magnifyBy2 with negative power")
|
|
|
|
let scale = 2 ^ power
|
|
result = newImage(image.width * scale, image.height * scale)
|
|
for y in 0 ..< result.height:
|
|
for x in 0 ..< image.width:
|
|
let
|
|
rgba = image.getRgbaUnsafe(x, y div scale)
|
|
idx = result.dataIndex(x * scale, y)
|
|
for i in 0 ..< scale div 2:
|
|
result.data[idx + i * 2 + 0] = rgba
|
|
result.data[idx + i * 2 + 1] = rgba
|
|
|
|
proc applyOpacity*(target: Image | Mask, opacity: float32) {.raises: [].} =
|
|
## Multiplies alpha of the image by opacity.
|
|
let opacity = round(255 * opacity).uint16
|
|
|
|
if opacity == 0:
|
|
when type(target) is Image:
|
|
target.fill(rgbx(0, 0, 0, 0))
|
|
else:
|
|
target.fill(0)
|
|
return
|
|
|
|
var i: int
|
|
when defined(amd64) and not defined(pixieNoSimd):
|
|
when type(target) is Image:
|
|
let byteLen = target.data.len * 4
|
|
else:
|
|
let byteLen = target.data.len
|
|
|
|
let
|
|
oddMask = mm_set1_epi16(cast[int16](0xff00))
|
|
div255 = mm_set1_epi16(cast[int16](0x8081))
|
|
vOpacity = mm_slli_epi16(mm_set1_epi16(cast[int16](opacity)), 8)
|
|
|
|
for _ in countup(0, byteLen - 16, 16):
|
|
when type(target) is Image:
|
|
let index = i div 4
|
|
else:
|
|
let index = i
|
|
|
|
let values = mm_loadu_si128(target.data[index].addr)
|
|
|
|
let eqZero = mm_cmpeq_epi16(values, mm_setzero_si128())
|
|
if mm_movemask_epi8(eqZero) != 0xffff:
|
|
var
|
|
valuesEven = mm_slli_epi16(mm_andnot_si128(oddMask, values), 8)
|
|
valuesOdd = mm_and_si128(values, oddMask)
|
|
|
|
# values * opacity
|
|
valuesEven = mm_mulhi_epu16(valuesEven, vOpacity)
|
|
valuesOdd = mm_mulhi_epu16(valuesOdd, vOpacity)
|
|
|
|
# div 255
|
|
valuesEven = mm_srli_epi16(mm_mulhi_epu16(valuesEven, div255), 7)
|
|
valuesOdd = mm_srli_epi16(mm_mulhi_epu16(valuesOdd, div255), 7)
|
|
|
|
valuesOdd = mm_slli_epi16(valuesOdd, 8)
|
|
|
|
mm_storeu_si128(
|
|
target.data[index].addr,
|
|
mm_or_si128(valuesEven, valuesOdd)
|
|
)
|
|
|
|
i += 16
|
|
|
|
when type(target) is Image:
|
|
for j in i div 4 ..< target.data.len:
|
|
var rgba = target.data[j]
|
|
rgba.r = ((rgba.r * opacity) div 255).uint8
|
|
rgba.g = ((rgba.g * opacity) div 255).uint8
|
|
rgba.b = ((rgba.b * opacity) div 255).uint8
|
|
rgba.a = ((rgba.a * opacity) div 255).uint8
|
|
target.data[j] = rgba
|
|
else:
|
|
for j in i ..< target.data.len:
|
|
target.data[j] = ((target.data[j] * opacity) div 255).uint8
|
|
|
|
proc invert*(target: Image | Mask) {.raises: [].} =
|
|
## Inverts all of the colors and alpha.
|
|
var i: int
|
|
when defined(amd64) and not defined(pixieNoSimd):
|
|
let v255 = mm_set1_epi8(cast[int8](255))
|
|
|
|
when type(target) is Image:
|
|
let byteLen = target.data.len * 4
|
|
else:
|
|
let byteLen = target.data.len
|
|
|
|
for _ in countup(0, byteLen - 16, 16):
|
|
when type(target) is Image:
|
|
let index = i div 4
|
|
else:
|
|
let index = i
|
|
|
|
var values = mm_loadu_si128(target.data[index].addr)
|
|
values = mm_sub_epi8(v255, values)
|
|
mm_storeu_si128(target.data[index].addr, values)
|
|
|
|
i += 16
|
|
|
|
when type(target) is Image:
|
|
for j in i div 4 ..< target.data.len:
|
|
var rgba = target.data[j]
|
|
rgba.r = 255 - rgba.r
|
|
rgba.g = 255 - rgba.g
|
|
rgba.b = 255 - rgba.b
|
|
rgba.a = 255 - rgba.a
|
|
target.data[j] = rgba
|
|
|
|
# Inverting rgbx(50, 100, 150, 200) becomes rgbx(205, 155, 105, 55). This
|
|
# is not a valid premultiplied alpha color.
|
|
# We need to convert back to premultiplied alpha after inverting.
|
|
target.data.toPremultipliedAlpha()
|
|
else:
|
|
for j in i ..< target.data.len:
|
|
target.data[j] = (255 - target.data[j]).uint8
|
|
|
|
proc blur*(
|
|
image: Image, radius: float32, outOfBounds: SomeColor = color(0, 0, 0, 0)
|
|
) {.raises: [PixieError].} =
|
|
## Applies Gaussian blur to the image given a radius.
|
|
let radius = round(radius).int
|
|
if radius == 0:
|
|
return
|
|
if radius < 0:
|
|
raise newException(PixieError, "Cannot apply negative blur")
|
|
|
|
let
|
|
kernel = gaussianKernel(radius)
|
|
outOfBounds = outOfBounds.asRgbx()
|
|
|
|
proc `*`(sample: ColorRGBX, a: uint32): array[4, uint32] {.inline.} =
|
|
[
|
|
sample.r * a,
|
|
sample.g * a,
|
|
sample.b * a,
|
|
sample.a * a
|
|
]
|
|
|
|
template `+=`(values: var array[4, uint32], sample: array[4, uint32]) =
|
|
values[0] += sample[0]
|
|
values[1] += sample[1]
|
|
values[2] += sample[2]
|
|
values[3] += sample[3]
|
|
|
|
template rgbx(values: array[4, uint32]): ColorRGBX =
|
|
rgbx(
|
|
(values[0] div 256 div 255).uint8,
|
|
(values[1] div 256 div 255).uint8,
|
|
(values[2] div 256 div 255).uint8,
|
|
(values[3] div 256 div 255).uint8
|
|
)
|
|
|
|
# Blur in the X direction. Store with dimensions swapped for reading later.
|
|
let blurX = newImage(image.height, image.width)
|
|
for y in 0 ..< image.height:
|
|
for x in 0 ..< image.width:
|
|
var values: array[4, uint32]
|
|
for xx in x - radius ..< min(x + radius, 0):
|
|
values += outOfBounds * kernel[xx - x + radius]
|
|
for xx in max(x - radius, 0) .. min(x + radius, image.width - 1):
|
|
values += image.getRgbaUnsafe(xx, y) * kernel[xx - x + radius]
|
|
for xx in max(x - radius, image.width) .. x + radius:
|
|
values += outOfBounds * kernel[xx - x + radius]
|
|
blurX.setRgbaUnsafe(y, x, rgbx(values))
|
|
|
|
# Blur in the Y direction.
|
|
for y in 0 ..< image.height:
|
|
for x in 0 ..< image.width:
|
|
var values: array[4, uint32]
|
|
for yy in y - radius ..< min(y + radius, 0):
|
|
values += outOfBounds * kernel[yy - y + radius]
|
|
for yy in max(y - radius, 0) .. min(y + radius, image.height - 1):
|
|
values += blurX.getRgbaUnsafe(yy, x) * kernel[yy - y + radius]
|
|
for yy in max(y - radius, image.height) .. y + radius:
|
|
values += outOfBounds * kernel[yy - y + radius]
|
|
image.setRgbaUnsafe(x, y, rgbx(values))
|
|
|
|
proc newMask*(image: Image): Mask {.raises: [PixieError].} =
|
|
## Returns a new mask using the alpha values of the parameter image.
|
|
result = newMask(image.width, image.height)
|
|
|
|
var i: int
|
|
when defined(amd64) and not defined(pixieNoSimd):
|
|
for _ in countup(0, image.data.len - 16, 16):
|
|
var
|
|
a = mm_loadu_si128(image.data[i + 0].addr)
|
|
b = mm_loadu_si128(image.data[i + 4].addr)
|
|
c = mm_loadu_si128(image.data[i + 8].addr)
|
|
d = mm_loadu_si128(image.data[i + 12].addr)
|
|
|
|
a = packAlphaValues(a)
|
|
b = packAlphaValues(b)
|
|
c = packAlphaValues(c)
|
|
d = packAlphaValues(d)
|
|
|
|
b = mm_slli_si128(b, 4)
|
|
c = mm_slli_si128(c, 8)
|
|
d = mm_slli_si128(d, 12)
|
|
|
|
mm_storeu_si128(
|
|
result.data[i].addr,
|
|
mm_or_si128(mm_or_si128(a, b), mm_or_si128(c, d))
|
|
)
|
|
|
|
i += 16
|
|
|
|
for j in i ..< image.data.len:
|
|
result.data[j] = image.data[j].a
|
|
|
|
proc getRgbaSmooth*(
|
|
image: Image, x, y: float32, wrapped = false
|
|
): ColorRGBX {.raises: [].} =
|
|
## Gets a interpolated color with float point coordinates.
|
|
## Pixes outside the image are transparent.
|
|
let
|
|
x0 = x.floor.int
|
|
y0 = y.floor.int
|
|
x1 = x0 + 1
|
|
y1 = y0 + 1
|
|
xFractional = x - x.floor
|
|
yFractional = y - y.floor
|
|
|
|
var x0y0, x1y0, x0y1, x1y1: ColorRGBX
|
|
if wrapped:
|
|
x0y0 = image.getRgbaUnsafe(x0 mod image.width, y0 mod image.height)
|
|
x1y0 = image.getRgbaUnsafe(x1 mod image.width, y0 mod image.height)
|
|
x0y1 = image.getRgbaUnsafe(x0 mod image.width, y1 mod image.height)
|
|
x1y1 = image.getRgbaUnsafe(x1 mod image.width, y1 mod image.height)
|
|
else:
|
|
x0y0 = image[x0, y0]
|
|
x1y0 = image[x1, y0]
|
|
x0y1 = image[x0, y1]
|
|
x1y1 = image[x1, y1]
|
|
|
|
var topMix = x0y0
|
|
if xFractional > 0 and x0y0 != x1y0:
|
|
topMix = mix(x0y0, x1y0, xFractional)
|
|
|
|
var bottomMix = x0y1
|
|
if xFractional > 0 and x0y1 != x1y1:
|
|
bottomMix = mix(x0y1, x1y1, xFractional)
|
|
|
|
if yFractional != 0 and topMix != bottomMix:
|
|
mix(topMix, bottomMix, yFractional)
|
|
else:
|
|
topMix
|
|
|
|
proc drawCorrect(
|
|
a, b: Image | Mask, mat = mat3(), tiled = false, blendMode = bmNormal
|
|
) {.raises: [PixieError].} =
|
|
## Draws one image onto another using matrix with color blending.
|
|
|
|
when type(a) is Image:
|
|
let blender = blendMode.blender()
|
|
else: # a is a Mask
|
|
let masker = blendMode.masker()
|
|
|
|
var
|
|
matInv = mat.inverse()
|
|
# Compute movement vectors
|
|
p = matInv * vec2(0 + h, 0 + h)
|
|
dx = matInv * vec2(1 + h, 0 + h) - p
|
|
dy = matInv * vec2(0 + h, 1 + h) - p
|
|
filterBy2 = max(dx.length, dy.length)
|
|
b = b
|
|
|
|
while filterBy2 >= 2.0:
|
|
b = b.minifyBy2()
|
|
p /= 2
|
|
dx /= 2
|
|
dy /= 2
|
|
filterBy2 /= 2
|
|
matInv = scale(vec2(1/2, 1/2)) * matInv
|
|
|
|
while filterBy2 <= 0.5:
|
|
b = b.magnifyBy2()
|
|
p *= 2
|
|
dx *= 2
|
|
dy *= 2
|
|
filterBy2 *= 2
|
|
matInv = scale(vec2(2, 2)) * matInv
|
|
|
|
for y in 0 ..< a.height:
|
|
for x in 0 ..< a.width:
|
|
let
|
|
samplePos = matInv * vec2(x.float32 + h, y.float32 + h)
|
|
xFloat = samplePos.x - h
|
|
yFloat = samplePos.y - h
|
|
|
|
when type(a) is Image:
|
|
let backdrop = a.getRgbaUnsafe(x, y)
|
|
when type(b) is Image:
|
|
let
|
|
sample = b.getRgbaSmooth(xFloat, yFloat, tiled)
|
|
blended = blender(backdrop, sample)
|
|
else: # b is a Mask
|
|
let
|
|
sample = b.getValueSmooth(xFloat, yFloat)
|
|
blended = blender(backdrop, rgbx(0, 0, 0, sample))
|
|
a.setRgbaUnsafe(x, y, blended)
|
|
else: # a is a Mask
|
|
let backdrop = a.getValueUnsafe(x, y)
|
|
when type(b) is Image:
|
|
let sample = b.getRgbaSmooth(xFloat, yFloat, tiled).a
|
|
else: # b is a Mask
|
|
let sample = b.getValueSmooth(xFloat, yFloat)
|
|
a.setValueUnsafe(x, y, masker(backdrop, sample))
|
|
|
|
proc drawUber(
|
|
a, b: Image | Mask, mat = mat3(), blendMode = bmNormal
|
|
) {.raises: [PixieError].} =
|
|
let
|
|
corners = [
|
|
mat * vec2(0, 0),
|
|
mat * vec2(b.width.float32, 0),
|
|
mat * vec2(b.width.float32, b.height.float32),
|
|
mat * vec2(0, b.height.float32)
|
|
]
|
|
perimeter = [
|
|
segment(corners[0], corners[1]),
|
|
segment(corners[1], corners[2]),
|
|
segment(corners[2], corners[3]),
|
|
segment(corners[3], corners[0])
|
|
]
|
|
|
|
var
|
|
matInv = mat.inverse()
|
|
# Compute movement vectors
|
|
p = matInv * vec2(0 + h, 0 + h)
|
|
dx = matInv * vec2(1 + h, 0 + h) - p
|
|
dy = matInv * vec2(0 + h, 1 + h) - p
|
|
filterBy2 = max(dx.length, dy.length)
|
|
b = b
|
|
|
|
while filterBy2 >= 2.0:
|
|
b = b.minifyBy2()
|
|
p /= 2
|
|
dx /= 2
|
|
dy /= 2
|
|
filterBy2 /= 2
|
|
|
|
while filterBy2 <= 0.5:
|
|
b = b.magnifyBy2()
|
|
p *= 2
|
|
dx *= 2
|
|
dy *= 2
|
|
filterBy2 *= 2
|
|
|
|
let smooth = not(
|
|
dx.length == 1.0 and
|
|
dy.length == 1.0 and
|
|
mat[2, 0].fractional == 0.0 and
|
|
mat[2, 1].fractional == 0.0
|
|
)
|
|
|
|
when type(a) is Image:
|
|
let blender = blendMode.blender()
|
|
else: # a is a Mask
|
|
let masker = blendMode.masker()
|
|
|
|
# Determine where we should start and stop drawing in the y dimension
|
|
var yMin, yMax: int
|
|
if blendMode == bmMask:
|
|
yMin = 0
|
|
yMax = a.height
|
|
else:
|
|
yMin = a.height
|
|
yMax = 0
|
|
for segment in perimeter:
|
|
yMin = min(yMin, segment.at.y.floor.int)
|
|
yMax = max(yMax, segment.at.y.ceil.int)
|
|
|
|
yMin = yMin.clamp(0, a.height)
|
|
yMax = yMax.clamp(0, a.height)
|
|
|
|
for y in yMin ..< yMax:
|
|
# Determine where we should start and stop drawing in the x dimension
|
|
var
|
|
xMin = a.width
|
|
xMax = 0
|
|
for yOffset in [0.float32, 1]:
|
|
let scanLine = Line(
|
|
a: vec2(-1000, y.float32 + yOffset),
|
|
b: vec2(1000, y.float32 + yOffset)
|
|
)
|
|
for segment in perimeter:
|
|
var at: Vec2
|
|
if scanline.intersects(segment, at) and segment.to != at:
|
|
xMin = min(xMin, at.x.floor.int)
|
|
xMax = max(xMax, at.x.ceil.int)
|
|
|
|
xMin = xMin.clamp(0, a.width)
|
|
xMax = xMax.clamp(0, a.width)
|
|
|
|
if blendMode == bmMask:
|
|
if xMin > 0:
|
|
zeroMem(a.data[a.dataIndex(0, y)].addr, 4 * xMin)
|
|
|
|
if smooth:
|
|
var srcPos = p + dx * xMin.float32 + dy * y.float32
|
|
srcPos = vec2(srcPos.x - h, srcPos.y - h)
|
|
|
|
for x in xMin ..< xMax:
|
|
when type(a) is Image:
|
|
let backdrop = a.getRgbaUnsafe(x, y)
|
|
when type(b) is Image:
|
|
let
|
|
sample = b.getRgbaSmooth(srcPos.x, srcPos.y)
|
|
blended = blender(backdrop, sample)
|
|
else: # b is a Mask
|
|
let
|
|
sample = b.getValueSmooth(srcPos.x, srcPos.y)
|
|
blended = blender(backdrop, rgbx(0, 0, 0, sample))
|
|
a.setRgbaUnsafe(x, y, blended)
|
|
else: # a is a Mask
|
|
let backdrop = a.getValueUnsafe(x, y)
|
|
when type(b) is Image:
|
|
let sample = b.getRgbaSmooth(srcPos.x, srcPos.y).a
|
|
else: # b is a Mask
|
|
let sample = b.getValueSmooth(srcPos.x, srcPos.y)
|
|
a.setValueUnsafe(x, y, masker(backdrop, sample))
|
|
|
|
srcPos += dx
|
|
|
|
else:
|
|
var x = xMin
|
|
when defined(amd64) and not defined(pixieNoSimd):
|
|
if dx == vec2(1, 0) and dy == vec2(0, 1):
|
|
# Check we are not rotated before using SIMD blends
|
|
when type(a) is Image:
|
|
if blendMode.hasSimdBlender():
|
|
let blenderSimd = blendMode.blenderSimd()
|
|
for _ in countup(x, xMax - 16, 16):
|
|
let
|
|
srcPos = p + dx * x.float32 + dy * y.float32
|
|
sx = srcPos.x.int
|
|
sy = srcPos.y.int
|
|
when type(b) is Image:
|
|
for q in [0, 4, 8, 12]:
|
|
let
|
|
backdrop = mm_loadu_si128(a.data[a.dataIndex(x + q, y)].addr)
|
|
source = mm_loadu_si128(b.data[b.dataIndex(sx + q, sy)].addr)
|
|
mm_storeu_si128(
|
|
a.data[a.dataIndex(x + q, y)].addr,
|
|
blenderSimd(backdrop, source)
|
|
)
|
|
else: # b is a Mask
|
|
var values = mm_loadu_si128(b.data[b.dataIndex(sx, sy)].addr)
|
|
for q in [0, 4, 8, 12]:
|
|
let
|
|
backdrop = mm_loadu_si128(a.data[a.dataIndex(x + q, y)].addr)
|
|
source = unpackAlphaValues(values)
|
|
mm_storeu_si128(
|
|
a.data[a.dataIndex(x + q, y)].addr,
|
|
blenderSimd(backdrop, source)
|
|
)
|
|
# Shuffle 32 bits off for the next iteration
|
|
values = mm_srli_si128(values, 4)
|
|
x += 16
|
|
else: # is a Mask
|
|
if blendMode.hasSimdMasker():
|
|
let maskerSimd = blendMode.maskerSimd()
|
|
for _ in countup(x, xMax - 16, 16):
|
|
let
|
|
srcPos = p + dx * x.float32 + dy * y.float32
|
|
sx = srcPos.x.int
|
|
sy = srcPos.y.int
|
|
backdrop = mm_loadu_si128(a.data[a.dataIndex(x, y)].addr)
|
|
when type(b) is Image:
|
|
# Need to read 16 colors and pack their alpha values
|
|
var
|
|
i = mm_loadu_si128(b.data[b.dataIndex(sx + 0, sy)].addr)
|
|
j = mm_loadu_si128(b.data[b.dataIndex(sx + 4, sy)].addr)
|
|
k = mm_loadu_si128(b.data[b.dataIndex(sx + 8, sy)].addr)
|
|
l = mm_loadu_si128(b.data[b.dataIndex(sx + 12, sy)].addr)
|
|
|
|
i = packAlphaValues(i)
|
|
j = packAlphaValues(j)
|
|
k = packAlphaValues(k)
|
|
l = packAlphaValues(l)
|
|
|
|
j = mm_slli_si128(j, 4)
|
|
k = mm_slli_si128(k, 8)
|
|
l = mm_slli_si128(l, 12)
|
|
|
|
let source = mm_or_si128(mm_or_si128(i, j), mm_or_si128(k, l))
|
|
else: # b is a Mask
|
|
let source = mm_loadu_si128(b.data[b.dataIndex(sx, sy)].addr)
|
|
|
|
mm_storeu_si128(
|
|
a.data[a.dataIndex(x, y)].addr,
|
|
maskerSimd(backdrop, source)
|
|
)
|
|
x += 16
|
|
|
|
var srcPos = p + dx * x.float32 + dy * y.float32
|
|
srcPos = vec2(max(0, srcPos.x), max(0, srcPos.y))
|
|
|
|
for x in x ..< xMax:
|
|
let samplePos = ivec2((srcPos.x - h).int32, (srcPos.y - h).int32)
|
|
|
|
when type(a) is Image:
|
|
let backdrop = a.getRgbaUnsafe(x, y)
|
|
when type(b) is Image:
|
|
let
|
|
sample = b.getRgbaUnsafe(samplePos.x, samplePos.y)
|
|
blended = blender(backdrop, sample)
|
|
else: # b is a Mask
|
|
let
|
|
sample = b.getValueUnsafe(samplePos.x, samplePos.y)
|
|
blended = blender(backdrop, rgbx(0, 0, 0, sample))
|
|
a.setRgbaUnsafe(x, y, blended)
|
|
else: # a is a Mask
|
|
let backdrop = a.getValueUnsafe(x, y)
|
|
when type(b) is Image:
|
|
let sample = b.getRgbaUnsafe(samplePos.x, samplePos.y).a
|
|
else: # b is a Mask
|
|
let sample = b.getValueUnsafe(samplePos.x, samplePos.y)
|
|
a.setValueUnsafe(x, y, masker(backdrop, sample))
|
|
|
|
srcPos += dx
|
|
|
|
if blendMode == bmMask:
|
|
if a.width - xMax > 0:
|
|
zeroMem(a.data[a.dataIndex(xMax, y)].addr, 4 * (a.width - xMax))
|
|
|
|
proc draw*(
|
|
a, b: Image, transform = mat3(), blendMode = bmNormal
|
|
) {.inline, raises: [PixieError].} =
|
|
## Draws one image onto another using matrix with color blending.
|
|
when type(transform) is Vec2:
|
|
a.drawUber(b, translate(transform), blendMode)
|
|
else:
|
|
a.drawUber(b, transform, blendMode)
|
|
|
|
proc draw*(
|
|
a, b: Mask, transform = mat3(), blendMode = bmMask
|
|
) {.inline, raises: [PixieError].} =
|
|
## Draws a mask onto a mask using a matrix with color blending.
|
|
when type(transform) is Vec2:
|
|
a.drawUber(b, translate(transform), blendMode)
|
|
else:
|
|
a.drawUber(b, transform, blendMode)
|
|
|
|
proc draw*(
|
|
image: Image, mask: Mask, transform = mat3(), blendMode = bmMask
|
|
) {.inline, raises: [PixieError].} =
|
|
## Draws a mask onto an image using a matrix with color blending.
|
|
when type(transform) is Vec2:
|
|
image.drawUber(mask, translate(transform), blendMode)
|
|
else:
|
|
image.drawUber(mask, transform, blendMode)
|
|
|
|
proc draw*(
|
|
mask: Mask, image: Image, transform = mat3(), blendMode = bmMask
|
|
) {.inline, raises: [PixieError].} =
|
|
## Draws a image onto a mask using a matrix with color blending.
|
|
when type(transform) is Vec2:
|
|
mask.drawUber(image, translate(transform), blendMode)
|
|
else:
|
|
mask.drawUber(image, transform, blendMode)
|
|
|
|
proc drawTiled*(
|
|
dst, src: Image, mat: Mat3, blendMode = bmNormal
|
|
) {.raises: [PixieError].} =
|
|
dst.drawCorrect(src, mat, true, blendMode)
|
|
|
|
proc resize*(srcImage: Image, width, height: int): Image {.raises: [PixieError].} =
|
|
## Resize an image to a given height and width.
|
|
if width == srcImage.width and height == srcImage.height:
|
|
result = srcImage.copy()
|
|
else:
|
|
result = newImage(width, height)
|
|
result.draw(
|
|
srcImage,
|
|
scale(vec2(
|
|
width.float32 / srcImage.width.float32,
|
|
height.float32 / srcImage.height.float32
|
|
)),
|
|
bmOverwrite
|
|
)
|
|
|
|
proc shadow*(
|
|
image: Image, offset: Vec2, spread, blur: float32, color: SomeColor
|
|
): Image {.raises: [PixieError].} =
|
|
## Create a shadow of the image with the offset, spread and blur.
|
|
let
|
|
mask = image.newMask()
|
|
shifted = newMask(mask.width, mask.height)
|
|
shifted.draw(mask, translate(offset), bmOverwrite)
|
|
shifted.spread(spread)
|
|
shifted.blur(blur)
|
|
result = newImage(shifted.width, shifted.height)
|
|
result.fill(color)
|
|
result.draw(shifted, blendMode = bmMask)
|
|
|
|
proc superImage*(image: Image, x, y, w, h: int): Image {.raises: [PixieError].} =
|
|
## Either cuts a sub image or returns a super image with padded transparency.
|
|
if x >= 0 and x + w <= image.width and y >= 0 and y + h <= image.height:
|
|
result = image.subImage(x, y, w, h)
|
|
else:
|
|
result = newImage(w, h)
|
|
result.draw(image, translate(vec2(-x.float32, -y.float32)), bmOverwrite)
|
|
|
|
when defined(release):
|
|
{.pop.}
|