opaque fast path

This commit is contained in:
Ryan Oldenburg 2021-12-13 03:55:05 -06:00
parent a5c2e08000
commit a6ed55592c
4 changed files with 54 additions and 29 deletions

View file

@ -760,7 +760,9 @@ proc drawUber(
dy *= 2 dy *= 2
filterBy2 *= 2 filterBy2 *= 2
let smooth = not( let
hasRotation = not(dx == vec2(1, 0) and dy == vec2(0, 1))
smooth = not(
dx.length == 1.0 and dx.length == 1.0 and
dy.length == 1.0 and dy.length == 1.0 and
transform[2, 0].fractional == 0.0 and transform[2, 0].fractional == 0.0 and
@ -783,14 +785,17 @@ proc drawUber(
let masker = blendMode.masker() let masker = blendMode.masker()
if blendMode == bmMask: if blendMode == bmMask:
if yMin > 0: if yMin > 0 and yMin < a.height:
zeroMem(a.data[0].addr, 4 * yMin * a.width) zeroMem(a.data[0].addr, 4 * yMin * a.width)
when type(a) is Image and type(b) is Image:
let opaqueFastPath = blendMode in {bmNormal, bmOverwrite} and b.isOpaque()
for y in yMin ..< yMax: for y in yMin ..< yMax:
# Determine where we should start and stop drawing in the x dimension # Determine where we should start and stop drawing in the x dimension
var var
xMin = a.width xMin = a.width.float32
xMax = 0 xMax = 0.float32
for yOffset in [0.float32, 1]: for yOffset in [0.float32, 1]:
let scanLine = Line( let scanLine = Line(
a: vec2(-1000, y.float32 + yOffset), a: vec2(-1000, y.float32 + yOffset),
@ -799,21 +804,28 @@ proc drawUber(
for segment in perimeter: for segment in perimeter:
var at: Vec2 var at: Vec2
if scanline.intersects(segment, at) and segment.to != at: if scanline.intersects(segment, at) and segment.to != at:
xMin = min(xMin, at.x.floor.int) xMin = min(xMin, at.x)
xMax = max(xMax, at.x.ceil.int) xMax = max(xMax, at.x)
xMin = xMin.clamp(0, a.width) var xStart, xStop: int
xMax = xMax.clamp(0, a.width) if hasRotation or smooth:
xStart = xMin.floor.int
xStop = xMax.ceil.int
else:
xStart = xMin.round().int
xStop = xMax.round().int
xStart = xStart.clamp(0, a.width)
xStop = xStop.clamp(0, a.width)
if blendMode == bmMask: if blendMode == bmMask:
if xMin > 0: if xStart > 0 and xStart < a.width:
zeroMem(a.data[a.dataIndex(0, y)].addr, 4 * xMin) zeroMem(a.data[a.dataIndex(0, y)].addr, 4 * xStart)
if smooth: if smooth:
var srcPos = p + dx * xMin.float32 + dy * y.float32 var srcPos = p + dx * xStart.float32 + dy * y.float32
srcPos = vec2(srcPos.x - h, srcPos.y - h) srcPos = vec2(srcPos.x - h, srcPos.y - h)
for x in xMin ..< xMax: for x in xStart ..< xStop:
when type(a) is Image: when type(a) is Image:
let backdrop = a.unsafe[x, y] let backdrop = a.unsafe[x, y]
when type(b) is Image: when type(b) is Image:
@ -836,14 +848,27 @@ proc drawUber(
srcPos += dx srcPos += dx
else: else:
var x = xMin var x = xStart
if not hasRotation:
when type(a) is Image and type(b) is Image:
if opaqueFastPath:
let
srcPos = p + dx * x.float32 + dy * y.float32
sx = srcPos.x.int
sy = srcPos.y.int
copyMem(
a.data[a.dataIndex(x, y)].addr,
b.data[b.dataIndex(sx, sy)].addr,
(xStop - xStart) * 4
)
continue
when defined(amd64) and not defined(pixieNoSimd): when defined(amd64) and not defined(pixieNoSimd):
if dx == vec2(1, 0) and dy == vec2(0, 1): # Check we are not rotated
# Check we are not rotated before using SIMD blends
when type(a) is Image: when type(a) is Image:
if blendMode.hasSimdBlender(): if blendMode.hasSimdBlender():
let blenderSimd = blendMode.blenderSimd() let blenderSimd = blendMode.blenderSimd()
for _ in 0 ..< (xMax - xMin) div 16: for _ in 0 ..< (xStop - xStart) div 16:
let let
srcPos = p + dx * x.float32 + dy * y.float32 srcPos = p + dx * x.float32 + dy * y.float32
sx = srcPos.x.int sx = srcPos.x.int
@ -873,7 +898,7 @@ proc drawUber(
else: # is a Mask else: # is a Mask
if blendMode.hasSimdMasker(): if blendMode.hasSimdMasker():
let maskerSimd = blendMode.maskerSimd() let maskerSimd = blendMode.maskerSimd()
for _ in 0 ..< (xMax - xMin) div 16: for _ in 0 ..< (xStop - xStart) div 16:
let let
srcPos = p + dx * x.float32 + dy * y.float32 srcPos = p + dx * x.float32 + dy * y.float32
sx = srcPos.x.int sx = srcPos.x.int
@ -914,7 +939,7 @@ proc drawUber(
case blendMode: case blendMode:
of bmOverwrite: of bmOverwrite:
for x in x ..< xMax: for x in x ..< xStop:
let samplePos = ivec2((srcPos.x - h).int32, (srcPos.y - h).int32) let samplePos = ivec2((srcPos.x - h).int32, (srcPos.y - h).int32)
when type(a) is Image: when type(a) is Image:
when type(b) is Image: when type(b) is Image:
@ -932,7 +957,7 @@ proc drawUber(
a.unsafe[x, y] = source a.unsafe[x, y] = source
srcPos += dx srcPos += dx
of bmNormal: of bmNormal:
for x in x ..< xMax: for x in x ..< xStop:
let samplePos = ivec2((srcPos.x - h).int32, (srcPos.y - h).int32) let samplePos = ivec2((srcPos.x - h).int32, (srcPos.y - h).int32)
when type(a) is Image: when type(a) is Image:
when type(b) is Image: when type(b) is Image:
@ -958,7 +983,7 @@ proc drawUber(
a.unsafe[x, y] = blendAlpha(backdrop, source) a.unsafe[x, y] = blendAlpha(backdrop, source)
srcPos += dx srcPos += dx
of bmMask: of bmMask:
for x in x ..< xMax: for x in x ..< xStop:
let samplePos = ivec2((srcPos.x - h).int32, (srcPos.y - h).int32) let samplePos = ivec2((srcPos.x - h).int32, (srcPos.y - h).int32)
when type(a) is Image: when type(a) is Image:
when type(b) is Image: when type(b) is Image:
@ -982,7 +1007,7 @@ proc drawUber(
a.unsafe[x, y] = maskMaskInline(backdrop, source) a.unsafe[x, y] = maskMaskInline(backdrop, source)
srcPos += dx srcPos += dx
else: else:
for x in x ..< xMax: for x in x ..< xStop:
let samplePos = ivec2((srcPos.x - h).int32, (srcPos.y - h).int32) let samplePos = ivec2((srcPos.x - h).int32, (srcPos.y - h).int32)
when type(a) is Image: when type(a) is Image:
let backdrop = a.unsafe[x, y] let backdrop = a.unsafe[x, y]
@ -1005,8 +1030,8 @@ proc drawUber(
srcPos += dx srcPos += dx
if blendMode == bmMask: if blendMode == bmMask:
if a.width - xMax > 0: if a.width - xStop > 0:
zeroMem(a.data[a.dataIndex(xMax, y)].addr, 4 * (a.width - xMax)) zeroMem(a.data[a.dataIndex(xStop, y)].addr, 4 * (a.width - xStop))
if blendMode == bmMask: if blendMode == bmMask:
if a.height - yMax > 0: if a.height - yMax > 0:

Binary file not shown.

Before

Width:  |  Height:  |  Size: 783 KiB

After

Width:  |  Height:  |  Size: 783 KiB

Binary file not shown.

Before

Width:  |  Height:  |  Size: 3.3 MiB

After

Width:  |  Height:  |  Size: 3.3 MiB

Binary file not shown.

Before

Width:  |  Height:  |  Size: 9.7 KiB

After

Width:  |  Height:  |  Size: 9.8 KiB