opaque fast path
This commit is contained in:
parent
a5c2e08000
commit
a6ed55592c
4 changed files with 54 additions and 29 deletions
|
@ -760,7 +760,9 @@ proc drawUber(
|
||||||
dy *= 2
|
dy *= 2
|
||||||
filterBy2 *= 2
|
filterBy2 *= 2
|
||||||
|
|
||||||
let smooth = not(
|
let
|
||||||
|
hasRotation = not(dx == vec2(1, 0) and dy == vec2(0, 1))
|
||||||
|
smooth = not(
|
||||||
dx.length == 1.0 and
|
dx.length == 1.0 and
|
||||||
dy.length == 1.0 and
|
dy.length == 1.0 and
|
||||||
transform[2, 0].fractional == 0.0 and
|
transform[2, 0].fractional == 0.0 and
|
||||||
|
@ -783,14 +785,17 @@ proc drawUber(
|
||||||
let masker = blendMode.masker()
|
let masker = blendMode.masker()
|
||||||
|
|
||||||
if blendMode == bmMask:
|
if blendMode == bmMask:
|
||||||
if yMin > 0:
|
if yMin > 0 and yMin < a.height:
|
||||||
zeroMem(a.data[0].addr, 4 * yMin * a.width)
|
zeroMem(a.data[0].addr, 4 * yMin * a.width)
|
||||||
|
|
||||||
|
when type(a) is Image and type(b) is Image:
|
||||||
|
let opaqueFastPath = blendMode in {bmNormal, bmOverwrite} and b.isOpaque()
|
||||||
|
|
||||||
for y in yMin ..< yMax:
|
for y in yMin ..< yMax:
|
||||||
# Determine where we should start and stop drawing in the x dimension
|
# Determine where we should start and stop drawing in the x dimension
|
||||||
var
|
var
|
||||||
xMin = a.width
|
xMin = a.width.float32
|
||||||
xMax = 0
|
xMax = 0.float32
|
||||||
for yOffset in [0.float32, 1]:
|
for yOffset in [0.float32, 1]:
|
||||||
let scanLine = Line(
|
let scanLine = Line(
|
||||||
a: vec2(-1000, y.float32 + yOffset),
|
a: vec2(-1000, y.float32 + yOffset),
|
||||||
|
@ -799,21 +804,28 @@ proc drawUber(
|
||||||
for segment in perimeter:
|
for segment in perimeter:
|
||||||
var at: Vec2
|
var at: Vec2
|
||||||
if scanline.intersects(segment, at) and segment.to != at:
|
if scanline.intersects(segment, at) and segment.to != at:
|
||||||
xMin = min(xMin, at.x.floor.int)
|
xMin = min(xMin, at.x)
|
||||||
xMax = max(xMax, at.x.ceil.int)
|
xMax = max(xMax, at.x)
|
||||||
|
|
||||||
xMin = xMin.clamp(0, a.width)
|
var xStart, xStop: int
|
||||||
xMax = xMax.clamp(0, a.width)
|
if hasRotation or smooth:
|
||||||
|
xStart = xMin.floor.int
|
||||||
|
xStop = xMax.ceil.int
|
||||||
|
else:
|
||||||
|
xStart = xMin.round().int
|
||||||
|
xStop = xMax.round().int
|
||||||
|
xStart = xStart.clamp(0, a.width)
|
||||||
|
xStop = xStop.clamp(0, a.width)
|
||||||
|
|
||||||
if blendMode == bmMask:
|
if blendMode == bmMask:
|
||||||
if xMin > 0:
|
if xStart > 0 and xStart < a.width:
|
||||||
zeroMem(a.data[a.dataIndex(0, y)].addr, 4 * xMin)
|
zeroMem(a.data[a.dataIndex(0, y)].addr, 4 * xStart)
|
||||||
|
|
||||||
if smooth:
|
if smooth:
|
||||||
var srcPos = p + dx * xMin.float32 + dy * y.float32
|
var srcPos = p + dx * xStart.float32 + dy * y.float32
|
||||||
srcPos = vec2(srcPos.x - h, srcPos.y - h)
|
srcPos = vec2(srcPos.x - h, srcPos.y - h)
|
||||||
|
|
||||||
for x in xMin ..< xMax:
|
for x in xStart ..< xStop:
|
||||||
when type(a) is Image:
|
when type(a) is Image:
|
||||||
let backdrop = a.unsafe[x, y]
|
let backdrop = a.unsafe[x, y]
|
||||||
when type(b) is Image:
|
when type(b) is Image:
|
||||||
|
@ -836,14 +848,27 @@ proc drawUber(
|
||||||
srcPos += dx
|
srcPos += dx
|
||||||
|
|
||||||
else:
|
else:
|
||||||
var x = xMin
|
var x = xStart
|
||||||
|
if not hasRotation:
|
||||||
|
when type(a) is Image and type(b) is Image:
|
||||||
|
if opaqueFastPath:
|
||||||
|
let
|
||||||
|
srcPos = p + dx * x.float32 + dy * y.float32
|
||||||
|
sx = srcPos.x.int
|
||||||
|
sy = srcPos.y.int
|
||||||
|
copyMem(
|
||||||
|
a.data[a.dataIndex(x, y)].addr,
|
||||||
|
b.data[b.dataIndex(sx, sy)].addr,
|
||||||
|
(xStop - xStart) * 4
|
||||||
|
)
|
||||||
|
continue
|
||||||
|
|
||||||
when defined(amd64) and not defined(pixieNoSimd):
|
when defined(amd64) and not defined(pixieNoSimd):
|
||||||
if dx == vec2(1, 0) and dy == vec2(0, 1):
|
# Check we are not rotated
|
||||||
# Check we are not rotated before using SIMD blends
|
|
||||||
when type(a) is Image:
|
when type(a) is Image:
|
||||||
if blendMode.hasSimdBlender():
|
if blendMode.hasSimdBlender():
|
||||||
let blenderSimd = blendMode.blenderSimd()
|
let blenderSimd = blendMode.blenderSimd()
|
||||||
for _ in 0 ..< (xMax - xMin) div 16:
|
for _ in 0 ..< (xStop - xStart) div 16:
|
||||||
let
|
let
|
||||||
srcPos = p + dx * x.float32 + dy * y.float32
|
srcPos = p + dx * x.float32 + dy * y.float32
|
||||||
sx = srcPos.x.int
|
sx = srcPos.x.int
|
||||||
|
@ -873,7 +898,7 @@ proc drawUber(
|
||||||
else: # is a Mask
|
else: # is a Mask
|
||||||
if blendMode.hasSimdMasker():
|
if blendMode.hasSimdMasker():
|
||||||
let maskerSimd = blendMode.maskerSimd()
|
let maskerSimd = blendMode.maskerSimd()
|
||||||
for _ in 0 ..< (xMax - xMin) div 16:
|
for _ in 0 ..< (xStop - xStart) div 16:
|
||||||
let
|
let
|
||||||
srcPos = p + dx * x.float32 + dy * y.float32
|
srcPos = p + dx * x.float32 + dy * y.float32
|
||||||
sx = srcPos.x.int
|
sx = srcPos.x.int
|
||||||
|
@ -914,7 +939,7 @@ proc drawUber(
|
||||||
|
|
||||||
case blendMode:
|
case blendMode:
|
||||||
of bmOverwrite:
|
of bmOverwrite:
|
||||||
for x in x ..< xMax:
|
for x in x ..< xStop:
|
||||||
let samplePos = ivec2((srcPos.x - h).int32, (srcPos.y - h).int32)
|
let samplePos = ivec2((srcPos.x - h).int32, (srcPos.y - h).int32)
|
||||||
when type(a) is Image:
|
when type(a) is Image:
|
||||||
when type(b) is Image:
|
when type(b) is Image:
|
||||||
|
@ -932,7 +957,7 @@ proc drawUber(
|
||||||
a.unsafe[x, y] = source
|
a.unsafe[x, y] = source
|
||||||
srcPos += dx
|
srcPos += dx
|
||||||
of bmNormal:
|
of bmNormal:
|
||||||
for x in x ..< xMax:
|
for x in x ..< xStop:
|
||||||
let samplePos = ivec2((srcPos.x - h).int32, (srcPos.y - h).int32)
|
let samplePos = ivec2((srcPos.x - h).int32, (srcPos.y - h).int32)
|
||||||
when type(a) is Image:
|
when type(a) is Image:
|
||||||
when type(b) is Image:
|
when type(b) is Image:
|
||||||
|
@ -958,7 +983,7 @@ proc drawUber(
|
||||||
a.unsafe[x, y] = blendAlpha(backdrop, source)
|
a.unsafe[x, y] = blendAlpha(backdrop, source)
|
||||||
srcPos += dx
|
srcPos += dx
|
||||||
of bmMask:
|
of bmMask:
|
||||||
for x in x ..< xMax:
|
for x in x ..< xStop:
|
||||||
let samplePos = ivec2((srcPos.x - h).int32, (srcPos.y - h).int32)
|
let samplePos = ivec2((srcPos.x - h).int32, (srcPos.y - h).int32)
|
||||||
when type(a) is Image:
|
when type(a) is Image:
|
||||||
when type(b) is Image:
|
when type(b) is Image:
|
||||||
|
@ -982,7 +1007,7 @@ proc drawUber(
|
||||||
a.unsafe[x, y] = maskMaskInline(backdrop, source)
|
a.unsafe[x, y] = maskMaskInline(backdrop, source)
|
||||||
srcPos += dx
|
srcPos += dx
|
||||||
else:
|
else:
|
||||||
for x in x ..< xMax:
|
for x in x ..< xStop:
|
||||||
let samplePos = ivec2((srcPos.x - h).int32, (srcPos.y - h).int32)
|
let samplePos = ivec2((srcPos.x - h).int32, (srcPos.y - h).int32)
|
||||||
when type(a) is Image:
|
when type(a) is Image:
|
||||||
let backdrop = a.unsafe[x, y]
|
let backdrop = a.unsafe[x, y]
|
||||||
|
@ -1005,8 +1030,8 @@ proc drawUber(
|
||||||
srcPos += dx
|
srcPos += dx
|
||||||
|
|
||||||
if blendMode == bmMask:
|
if blendMode == bmMask:
|
||||||
if a.width - xMax > 0:
|
if a.width - xStop > 0:
|
||||||
zeroMem(a.data[a.dataIndex(xMax, y)].addr, 4 * (a.width - xMax))
|
zeroMem(a.data[a.dataIndex(xStop, y)].addr, 4 * (a.width - xStop))
|
||||||
|
|
||||||
if blendMode == bmMask:
|
if blendMode == bmMask:
|
||||||
if a.height - yMax > 0:
|
if a.height - yMax > 0:
|
||||||
|
|
Binary file not shown.
Before Width: | Height: | Size: 783 KiB After Width: | Height: | Size: 783 KiB |
Binary file not shown.
Before Width: | Height: | Size: 3.3 MiB After Width: | Height: | Size: 3.3 MiB |
Binary file not shown.
Before Width: | Height: | Size: 9.7 KiB After Width: | Height: | Size: 9.8 KiB |
Loading…
Reference in a new issue