aligned rgba fill
This commit is contained in:
parent
acd5a13763
commit
cdc52f31ab
1 changed files with 10 additions and 4 deletions
|
@ -71,11 +71,17 @@ proc fillUnsafe*(
|
||||||
else:
|
else:
|
||||||
var i = start
|
var i = start
|
||||||
when defined(amd64) and allowSimd:
|
when defined(amd64) and allowSimd:
|
||||||
|
# Align to 16 bytes
|
||||||
|
while i < (start + len) and (cast[uint](data[i].addr) and 15) != 0:
|
||||||
|
data[i] = rgbx
|
||||||
|
inc i
|
||||||
# When supported, SIMD fill until we run out of room
|
# When supported, SIMD fill until we run out of room
|
||||||
let colorVec = mm_set1_epi32(cast[int32](rgbx))
|
let
|
||||||
for _ in 0 ..< len div 8:
|
colorVec = mm_set1_epi32(cast[int32](rgbx))
|
||||||
mm_storeu_si128(data[i + 0].addr, colorVec)
|
remaining = start + len - i
|
||||||
mm_storeu_si128(data[i + 4].addr, colorVec)
|
for _ in 0 ..< remaining div 8:
|
||||||
|
mm_store_si128(data[i + 0].addr, colorVec)
|
||||||
|
mm_store_si128(data[i + 4].addr, colorVec)
|
||||||
i += 8
|
i += 8
|
||||||
else:
|
else:
|
||||||
when sizeof(int) == 8:
|
when sizeof(int) == 8:
|
||||||
|
|
Loading…
Reference in a new issue