all int blends, simd alphafix + softlight, benchmarks

This commit is contained in:
Ryan Oldenburg 2020-12-09 07:47:58 -06:00
parent 8ef4b3ecc8
commit b895030088
2 changed files with 276 additions and 72 deletions

View file

@ -111,6 +111,10 @@ proc SetSat(C: Color, s: float32): Color {.inline.} =
result = (C - min([C.r, C.g, C.b])) * s / satC
proc alphaFix(backdrop, source, mixed: Color): Color =
result.a = (source.a + backdrop.a * (1.0 - source.a))
if result.a == 0:
return
let
t0 = source.a * (1 - backdrop.a)
t1 = source.a * backdrop.a
@ -120,7 +124,6 @@ proc alphaFix(backdrop, source, mixed: Color): Color =
result.g = t0 * source.g + t1 * mixed.g + t2 * backdrop.g
result.b = t0 * source.b + t1 * mixed.b + t2 * backdrop.b
result.a = (source.a + backdrop.a * (1.0 - source.a))
result.r /= result.a
result.g /= result.a
result.b /= result.a
@ -258,25 +261,22 @@ proc blendExcludeMaskFloats(backdrop, source: Color): Color {.inline.} =
proc blendOverwriteFloats(backdrop, source: Color): Color {.inline.} =
source
proc alphaFix(backdrop, source, mixed: ColorRGBA): ColorRGBA {.inline.} =
proc alphaFix(backdrop, source: ColorRGBA, vb, vs, vm: M128): ColorRGBA =
let
sa = source.a.float32
ba = backdrop.a.float32
a = sa + ba * (255 - sa) / 255
if a < 1:
if a == 0:
return
let
vb = mm_setr_ps(backdrop.r.float32, backdrop.g.float32, backdrop.b.float32, 0)
vs = mm_setr_ps(source.r.float32, source.g.float32, source.b.float32, 0)
vm = mm_setr_ps(mixed.r.float32, mixed.g.float32, mixed.b.float32, 0)
vt0 = mm_set1_ps(sa * (255 - ba))
vt1 = mm_set1_ps(sa * ba)
vt2 = mm_set1_ps((255 - sa) * ba)
t0 = mm_set1_ps(sa * (255 - ba))
t1 = mm_set1_ps(sa * ba)
t2 = mm_set1_ps((255 - sa) * ba)
va = mm_set1_ps(a)
v255 = mm_set1_ps(255)
values = cast[array[4, int32]](
mm_cvtps_epi32((vt0 * vs + vt1 * vm + vt2 * vb) / va / v255)
values = cast[array[4, uint32]](
mm_cvtps_epi32((t0 * vs + t1 * vm + t2 * vb) / va / v255)
)
result.r = values[0].uint8
@ -284,48 +284,140 @@ proc alphaFix(backdrop, source, mixed: ColorRGBA): ColorRGBA {.inline.} =
result.b = values[2].uint8
result.a = a.uint8
proc alphaFix(backdrop, source, mixed: ColorRGBA): ColorRGBA {.inline.} =
if backdrop.a == 0 and source.a == 0:
return
let
vb = mm_setr_ps(backdrop.r.float32, backdrop.g.float32, backdrop.b.float32, 0)
vs = mm_setr_ps(source.r.float32, source.g.float32, source.b.float32, 0)
vm = mm_setr_ps(mixed.r.float32, mixed.g.float32, mixed.b.float32, 0)
alphaFix(backdrop, source, vb, vs, vm)
proc min(a, b: uint32): uint32 {.inline.} =
if a < b: a else: b
proc screen(backdrop, source: uint32): uint8 {.inline.} =
(255 - ((255 - backdrop) * (255 - source)) div 255).uint8
proc hardLight(backdrop, source: uint32): uint8 {.inline.} =
if source <= 127:
((backdrop * 2 * source) div 255).uint8
else:
screen(backdrop, 2 * source - 255)
proc blendNormal(backdrop, source: ColorRGBA): ColorRGBA =
result = source
result = alphaFix(backdrop, source, result)
proc blendDarken(backdrop, source: ColorRGBA): ColorRGBA =
blendDarkenFloats(backdrop.color, source.color).rgba
result.r = min(backdrop.r, source.r)
result.g = min(backdrop.g, source.g)
result.b = min(backdrop.b, source.b)
result = alphaFix(backdrop, source, result)
proc blendMultiply(backdrop, source: ColorRGBA): ColorRGBA =
blendMultiplyFloats(backdrop.color, source.color).rgba
result.r = ((backdrop.r.uint32 * source.r) div 255).uint8
result.g = ((backdrop.g.uint32 * source.g) div 255).uint8
result.b = ((backdrop.b.uint32 * source.b) div 255).uint8
result = alphaFix(backdrop, source, result)
proc blendLinearBurn(backdrop, source: ColorRGBA): ColorRGBA =
blendLinearBurnFloats(backdrop.color, source.color).rgba
result.r = min(0, backdrop.r.int16 + source.r.int16 - 255).uint8
result.g = min(0, backdrop.g.int16 + source.g.int16 - 255).uint8
result.b = min(0, backdrop.b.int16 + source.b.int16 - 255).uint8
result = alphaFix(backdrop, source, result)
proc blendColorBurn(backdrop, source: ColorRGBA): ColorRGBA =
blendColorBurnFloats(backdrop.color, source.color).rgba
proc blend(backdrop, source: uint32): uint8 {.inline.} =
if backdrop == 255:
255.uint8
elif source == 0:
0
else:
255 - min(255, (255 * (255 - backdrop)) div source).uint8
result.r = blend(backdrop.r, source.r)
result.g = blend(backdrop.g, source.g)
result.b = blend(backdrop.b, source.b)
result = alphaFix(backdrop, source, result)
proc blendLighten(backdrop, source: ColorRGBA): ColorRGBA =
blendLightenFloats(backdrop.color, source.color).rgba
result.r = max(backdrop.r, source.r)
result.g = max(backdrop.g, source.g)
result.b = max(backdrop.b, source.b)
result = alphaFix(backdrop, source, result)
proc blendScreen(backdrop, source: ColorRGBA): ColorRGBA =
blendScreenFloats(backdrop.color, source.color).rgba
result.r = screen(backdrop.r, source.r)
result.g = screen(backdrop.g, source.g)
result.b = screen(backdrop.b, source.b)
result = alphaFix(backdrop, source, result)
proc blendLinearDodge(backdrop, source: ColorRGBA): ColorRGBA =
blendLinearDodgeFloats(backdrop.color, source.color).rgba
result.r = min(backdrop.r.uint32 + source.r, 255).uint8
result.g = min(backdrop.g.uint32 + source.g, 255).uint8
result.b = min(backdrop.b.uint32 + source.b, 255).uint8
result = alphaFix(backdrop, source, result)
proc blendColorDodge(backdrop, source: ColorRGBA): ColorRGBA =
blendColorDodgeFloats(backdrop.color, source.color).rgba
proc blend(backdrop, source: uint32): uint8 {.inline.} =
if backdrop == 0:
0.uint8
elif source == 255:
255
else:
min(255, (255 * backdrop) div (255 - source)).uint8
result.r = blend(backdrop.r, source.r)
result.g = blend(backdrop.g, source.g)
result.b = blend(backdrop.b, source.b)
result = alphaFix(backdrop, source, result)
proc blendOverlay(backdrop, source: ColorRGBA): ColorRGBA =
blendOverlayFloats(backdrop.color, source.color).rgba
result.r = hardLight(source.r, backdrop.r)
result.g = hardLight(source.g, backdrop.g)
result.b = hardLight(source.b, backdrop.b)
result = alphaFix(backdrop, source, result)
proc blendHardLight(backdrop, source: ColorRGBA): ColorRGBA =
blendHardLightFloats(backdrop.color, source.color).rgba
result.r = hardLight(backdrop.r, source.r)
result.g = hardLight(backdrop.g, source.g)
result.b = hardLight(backdrop.b, source.b)
result = alphaFix(backdrop, source, result)
proc blendSoftLight(backdrop, source: ColorRGBA): ColorRGBA =
blendSoftLightFloats(backdrop.color, source.color).rgba
# proc softLight(backdrop, source: int32): uint8 {.inline.} =
# ## Pegtop
# (
# ((255 - 2 * source) * backdrop ^ 2) div 255 ^ 2 +
# (2 * source * backdrop) div 255
# ).uint8
let
vb = mm_setr_ps(backdrop.r.float32, backdrop.g.float32, backdrop.b.float32, 0)
vs = mm_setr_ps(source.r.float32, source.g.float32, source.b.float32, 0)
v2 = mm_set1_ps(2)
v255 = mm_set1_ps(255)
v255sq = mm_set1_ps(255 * 255)
vm = ((v255 - v2 * vs) * vb * vb) / v255sq + (v2 * vs * vb) / v255
values = cast[array[4, uint32]](mm_cvtps_epi32(vm))
result.r = values[0].uint8
result.g = values[1].uint8
result.b = values[2].uint8
result = alphaFix(backdrop, source, vb, vs, vm)
proc blendDifference(backdrop, source: ColorRGBA): ColorRGBA =
blendDifferenceFloats(backdrop.color, source.color).rgba
result.r = max(backdrop.r, source.r) - min(backdrop.r, source.r)
result.g = max(backdrop.g, source.g) - min(backdrop.g, source.g)
result.b = max(backdrop.b, source.b) - min(backdrop.b, source.b)
result = alphaFix(backdrop, source, result)
proc blendExclusion(backdrop, source: ColorRGBA): ColorRGBA =
blendExclusionFloats(backdrop.color, source.color).rgba
proc blend(backdrop, source: int32): uint8 {.inline.} =
max(0, backdrop + source - (2 * backdrop * source) div 255).uint8
result.r = blend(backdrop.r.int32, source.r.int32)
result.g = blend(backdrop.g.int32, source.g.int32)
result.b = blend(backdrop.b.int32, source.b.int32)
result = alphaFix(backdrop, source, result)
proc blendColor(backdrop, source: ColorRGBA): ColorRGBA =
blendColorFloats(backdrop.color, source.color).rgba

View file

@ -1,73 +1,185 @@
import benchy, chroma, pixie, vmath
import benchy, chroma, vmath
include pixie/blends
const iterations = 1_000_000
let
a = newImage(1000, 1000)
b = newImage(1000, 1000)
a = rgba(100, 200, 100, 255)
b = rgba(25, 33, 100, 127)
b.fill(rgba(127, 127, 127, 255))
timeIt "blendNormal":
for i in 0 ..< iterations:
keep blendNormal(a, b)
timeIt "bmNormal":
a.draw(b, vec2(0, 0), bmNormal)
timeIt "blendNormalFloats":
for i in 0 ..< iterations:
keep blendNormalFloats(a.color, b.color).rgba
timeIt "bmDarken":
a.draw(b, vec2(0, 0), bmDarken)
timeIt "blendDarken":
for i in 0 ..< iterations:
keep blendDarken(a, b)
timeIt "bmMultiply":
a.draw(b, vec2(0, 0), bmMultiply)
timeIt "blendDarkenFloats":
for i in 0 ..< iterations:
keep blendDarkenFloats(a.color, b.color).rgba
timeIt "bmLinearBurn":
a.draw(b, vec2(0, 0), bmLinearBurn)
timeIt "blendMultiply":
for i in 0 ..< iterations:
keep blendMultiply(a, b)
timeIt "bmColorBurn":
a.draw(b, vec2(0, 0), bmColorBurn)
timeIt "blendMultiplyFloats":
for i in 0 ..< iterations:
keep blendMultiplyFloats(a.color, b.color).rgba
timeIt "bmLighten":
a.draw(b, vec2(0, 0), bmLighten)
timeIt "blendLinearBurn":
for i in 0 ..< iterations:
keep blendLinearBurn(a, b)
timeIt "bmScreen":
a.draw(b, vec2(0, 0), bmScreen)
timeIt "blendLinearBurnFloats":
for i in 0 ..< iterations:
keep blendLinearBurnFloats(a.color, b.color).rgba
timeIt "bmLinearDodge":
a.draw(b, vec2(0, 0), bmLinearDodge)
timeIt "blendColorBurn":
for i in 0 ..< iterations:
keep blendColorBurn(a, b)
timeIt "bmColorDodge":
a.draw(b, vec2(0, 0), bmColorDodge)
timeIt "blendColorBurnFloats":
for i in 0 ..< iterations:
keep blendColorBurnFloats(a.color, b.color).rgba
timeIt "bmOverlay":
a.draw(b, vec2(0, 0), bmOverlay)
timeIt "blendLighten":
for i in 0 ..< iterations:
keep blendLighten(a, b)
timeIt "bmSoftLight":
a.draw(b, vec2(0, 0), bmSoftLight)
timeIt "blendLightenFloats":
for i in 0 ..< iterations:
keep blendLightenFloats(a.color, b.color).rgba
timeIt "bmHardLight":
a.draw(b, vec2(0, 0), bmHardLight)
timeIt "blendScreen":
for i in 0 ..< iterations:
keep blendScreen(a, b)
timeIt "bmDifference":
a.draw(b, vec2(0, 0), bmDifference)
timeIt "blendScreenFloats":
for i in 0 ..< iterations:
keep blendScreenFloats(a.color, b.color).rgba
timeIt "bmExclusion":
a.draw(b, vec2(0, 0), bmExclusion)
timeIt "blendLinearDodge":
for i in 0 ..< iterations:
keep blendLinearDodge(a, b)
timeIt "bmHue":
a.draw(b, vec2(0, 0), bmHue)
timeIt "blendLinearDodgeFloats":
for i in 0 ..< iterations:
keep blendLinearDodgeFloats(a.color, b.color).rgba
timeIt "bmSaturation":
a.draw(b, vec2(0, 0), bmSaturation)
timeIt "blendColorDodge":
for i in 0 ..< iterations:
keep blendColorDodge(a, b)
timeIt "bmColor":
a.draw(b, vec2(0, 0), bmColor)
timeIt "blendColorDodgeFloats":
for i in 0 ..< iterations:
keep blendColorDodgeFloats(a.color, b.color).rgba
timeIt "bmLuminosity":
a.draw(b, vec2(0, 0), bmLuminosity)
timeIt "blendOverlay":
for i in 0 ..< iterations:
keep blendOverlay(a, b)
timeIt "bmMask":
a.draw(b, vec2(0, 0), bmMask)
timeIt "blendOverlayFloats":
for i in 0 ..< iterations:
keep blendOverlayFloats(a.color, b.color).rgba
timeIt "bmSubtractMask":
a.draw(b, vec2(0, 0), bmSubtractMask)
timeIt "blendSoftLight":
for i in 0 ..< iterations:
keep blendSoftLight(a, b)
timeIt "bmIntersectMask":
a.draw(b, vec2(0, 0), bmIntersectMask)
timeIt "blendSoftLightFloats":
for i in 0 ..< iterations:
keep blendSoftLightFloats(a.color, b.color).rgba
timeIt "bmExcludeMask":
a.draw(b, vec2(0, 0), bmExcludeMask)
timeIt "blendHardLight":
for i in 0 ..< iterations:
keep blendHardLight(a, b)
timeIt "blendHardLightFloats":
for i in 0 ..< iterations:
keep blendHardLightFloats(a.color, b.color).rgba
timeIt "blendDifference":
for i in 0 ..< iterations:
keep blendDifference(a, b)
timeIt "blendDifferenceFloats":
for i in 0 ..< iterations:
keep blendDifferenceFloats(a.color, b.color).rgba
timeIt "blendExclusion":
for i in 0 ..< iterations:
keep blendExclusion(a, b)
timeIt "blendExclusionFloats":
for i in 0 ..< iterations:
keep blendExclusionFloats(a.color, b.color).rgba
timeIt "blendHue":
for i in 0 ..< iterations:
keep blendHue(a, b)
timeIt "blendHueFloats":
for i in 0 ..< iterations:
keep blendHueFloats(a.color, b.color).rgba
timeIt "blendSaturation":
for i in 0 ..< iterations:
keep blendSaturation(a, b)
timeIt "blendSaturationFloats":
for i in 0 ..< iterations:
keep blendSaturationFloats(a.color, b.color).rgba
timeIt "blendColor":
for i in 0 ..< iterations:
keep blendColor(a, b)
timeIt "blendColorFloats":
for i in 0 ..< iterations:
keep blendColorFloats(a.color, b.color).rgba
timeIt "blendLuminosity":
for i in 0 ..< iterations:
keep blendLuminosity(a, b)
timeIt "blendLuminosityFloats":
for i in 0 ..< iterations:
keep blendLuminosityFloats(a.color, b.color).rgba
timeIt "blendMask":
for i in 0 ..< iterations:
keep blendMask(a, b)
timeIt "blendMaskFloats":
for i in 0 ..< iterations:
keep blendMaskFloats(a.color, b.color).rgba
timeIt "blendSubtractMask":
for i in 0 ..< iterations:
keep blendSubtractMask(a, b)
timeIt "blendSubtractMaskFloats":
for i in 0 ..< iterations:
keep blendSubtractMaskFloats(a.color, b.color).rgba
timeIt "blendIntersectMask":
for i in 0 ..< iterations:
keep blendIntersectMask(a, b)
timeIt "blendIntersectMaskFloats":
for i in 0 ..< iterations:
keep blendIntersectMaskFloats(a.color, b.color).rgba
timeIt "blendExcludeMask":
for i in 0 ..< iterations:
keep blendExcludeMask(a, b)
timeIt "blendExcludeMaskFloats":
for i in 0 ..< iterations:
keep blendExcludeMaskFloats(a.color, b.color).rgba