move mask ceil simd out
This commit is contained in:
parent
8a07e3cf9b
commit
b706f93ee5
2 changed files with 25 additions and 14 deletions
|
@ -286,21 +286,16 @@ proc spread*(mask: Mask, spread: float32) {.raises: [PixieError].} =
|
||||||
|
|
||||||
proc ceil*(mask: Mask) {.raises: [].} =
  ## A value of 0 stays 0. Anything else turns into 255.
  ##
  ## The mask is modified in place. When SIMD is allowed and `ceilMaskSimd`
  ## is available for the target, the work is delegated to it; otherwise a
  ## plain byte-by-byte loop is used.
  if mask.data.len == 0:
    # Nothing to convert. This also keeps the SIMD path below from taking
    # the address of `mask.data[0]` on an empty buffer.
    return

  # The guard must probe the proc that is actually called: checking a
  # different SIMD helper could select this branch on a target where
  # `ceilMaskSimd` itself does not exist.
  when allowSimd and compiles(ceilMaskSimd):
    ceilMaskSimd(
      cast[ptr UncheckedArray[uint8]](mask.data[0].addr),
      mask.data.len
    )
  else:
    for i in 0 ..< mask.data.len:
      if mask.data[i] != 0:
        mask.data[i] = 255
|
||||||
|
|
||||||
proc blur*(mask: Mask, radius: float32, outOfBounds: uint8 = 0) {.raises: [PixieError].} =
|
proc blur*(mask: Mask, radius: float32, outOfBounds: uint8 = 0) {.raises: [PixieError].} =
|
||||||
## Applies Gaussian blur to the image given a radius.
|
## Applies Gaussian blur to the image given a radius.
|
||||||
|
|
|
@ -267,3 +267,19 @@ when defined(amd64):
|
||||||
|
|
||||||
for j in i ..< len:
|
for j in i ..< len:
|
||||||
data[j] = 255 - data[j]
|
data[j] = 255 - data[j]
|
||||||
|
|
||||||
|
proc ceilMaskSimd*(data: ptr UncheckedArray[uint8], len: int) =
  ## Rewrites the first `len` bytes of `data` in place: a byte equal to 0
  ## stays 0 and every other byte becomes 255.
  ##
  ## Whole groups of 16 bytes are handled with 128-bit vector operations;
  ## the remaining `len mod 16` bytes are handled one at a time.
  let
    allZero = mm_setzero_si128()
    allOnes = mm_set1_epi8(255)
    vectorCount = len div 16

  # Vector pass: 16 bytes per iteration, using unaligned loads and stores.
  var offset: int
  for _ in 0 ..< vectorCount:
    let
      chunk = mm_loadu_si128(data[offset].addr)
      # Lanes holding 0 compare equal and become 0xFF; all others become 0.
      isZero = mm_cmpeq_epi8(chunk, allZero)
    # (not isZero) and 0xFF: zero lanes stay 0, every other lane becomes 255.
    mm_storeu_si128(data[offset].addr, mm_andnot_si128(isZero, allOnes))
    offset += 16

  # Scalar pass over whatever did not fill a whole 16-byte group.
  for tail in offset ..< len:
    if data[tail] != 0:
      data[tail] = 255
|
||||||
|
|
Loading…
Reference in a new issue