Merge pull request #426 from guzba/master

jpeg pass
This commit is contained in:
treeform 2022-05-25 22:04:18 -07:00 committed by GitHub
commit b6b2a27782
No known key found for this signature in database
GPG key ID: 4AEE18F83AFDEB23
5 changed files with 122 additions and 106 deletions

View file

@ -1,6 +1,9 @@
import pixie/common, pixie/images, pixie/masks, sequtils, strutils, chroma, import pixie/common, pixie/images, pixie/masks, sequtils, strutils, chroma,
std/decls, flatty/binny std/decls, flatty/binny
when defined(amd64) and not defined(pixieNoSimd):
import nimsimd/sse2
# This JPEG decoder is loosely based on stb_image which is public domain. # This JPEG decoder is loosely based on stb_image which is public domain.
# JPEG is a complex format, this decoder only supports the most common features: # JPEG is a complex format, this decoder only supports the most common features:
@ -38,10 +41,6 @@ const
0.uint32, 1, 3, 7, 15, 31, 63, 127, 255, 511, 0.uint32, 1, 3, 7, 15, 31, 63, 127, 255, 511,
1023, 2047, 4095, 8191, 16383, 32767, 65535 1023, 2047, 4095, 8191, 16383, 32767, 65535
] ]
biases = [ # (-1 shl n) + 1
0.int32, -1, -3, -7, -15, -31, -63, -127, -255,
-511, -1023, -2047, -4095, -8191, -16383, -32767
]
type type
Huffman = object Huffman = object
@ -65,25 +64,26 @@ type
channel: Mask channel: Mask
DecoderState = object DecoderState = object
buffer: string buffer: ptr UncheckedArray[uint8]
pos, bitsBuffered: int len, pos: int
bitsBuffered: int
bitBuffer: uint32 bitBuffer: uint32
hitEnd: bool
imageHeight, imageWidth: int imageHeight, imageWidth: int
progressive: bool
quantizationTables: array[4, array[64, uint8]] quantizationTables: array[4, array[64, uint8]]
huffmanTables: array[2, array[4, Huffman]] # 0 = DC, 1 = AC huffmanTables: array[2, array[4, Huffman]] # 0 = DC, 1 = AC
components: seq[Component] components: seq[Component]
maxYScale, maxXScale: int
mcuWidth, mcuHeight, numMcuWide, numMcuHigh: int
orientation: int
scanComponents: int scanComponents: int
spectralStart, spectralEnd: int spectralStart, spectralEnd: int
successiveApproxLow, successiveApproxHigh: int successiveApproxLow, successiveApproxHigh: int
maxYScale, maxXScale: int
mcuWidth, mcuHeight, numMcuWide, numMcuHigh: int
componentOrder: seq[int] componentOrder: seq[int]
progressive: bool
restartInterval: int restartInterval: int
todoBeforeRestart: int todoBeforeRestart: int
eobRun: int eobRun: int
orientation: int hitEnd: bool
when defined(release): when defined(release):
{.push checks: off.} {.push checks: off.}
@ -92,7 +92,7 @@ template failInvalid(reason = "unable to load") =
## Throw exception with a reason. ## Throw exception with a reason.
raise newException(PixieError, "Invalid JPEG, " & reason) raise newException(PixieError, "Invalid JPEG, " & reason)
template clampByte(x: int32): uint8 = proc clampByte(x: int32): uint8 {.inline.} =
## Clamp integer into byte range. ## Clamp integer into byte range.
# clamp(x, 0, 0xFF).uint8 # clamp(x, 0, 0xFF).uint8
let let
@ -102,33 +102,42 @@ template clampByte(x: int32): uint8 =
proc readUint8(state: var DecoderState): uint8 = proc readUint8(state: var DecoderState): uint8 =
## Reads a byte from the input stream. ## Reads a byte from the input stream.
if state.pos >= state.buffer.len: if state.pos >= state.len:
failInvalid() failInvalid()
result = cast[uint8](state.buffer[state.pos]) result = state.buffer[state.pos]
inc state.pos inc state.pos
proc readUint16be(state: var DecoderState): uint16 = proc readUint16be(state: var DecoderState): uint16 =
## Reads uint16 big-endian from the input stream. ## Reads uint16 big-endian from the input stream.
(state.readUint8().uint16 shl 8) or state.readUint8() if state.pos + 2 > state.len:
failInvalid()
result =
(state.buffer[state.pos].uint16 shl 8) or
state.buffer[state.pos + 1]
state.pos += 2
proc readUint32be(state: var DecoderState): uint32 = proc readUint32be(state: var DecoderState): uint32 =
## Reads uint32 big-endian from the input stream. ## Reads uint32 big-endian from the input stream.
return if state.pos + 4 > state.len:
(state.readUint8().uint32 shl 24) or failInvalid()
(state.readUint8().uint32 shl 16) or result =
(state.readUint8().uint32 shl 8) or (state.buffer[state.pos + 0].uint32 shl 24) or
state.readUint8().uint32 (state.buffer[state.pos + 1].uint32 shl 16) or
(state.buffer[state.pos + 2].uint32 shl 8) or
state.buffer[state.pos + 3]
state.pos += 4
proc readStr(state: var DecoderState, n: int): string = proc readStr(state: var DecoderState, n: int): string =
## Reads n number of bytes as a string. ## Reads n number of bytes as a string.
if state.pos + n > state.buffer.len: if state.pos + n > state.len:
failInvalid() failInvalid()
result = state.buffer[state.pos ..< state.pos + n] result.setLen(n)
copyMem(result[0].addr, state.buffer[state.pos].addr, n)
state.pos += n state.pos += n
proc skipBytes(state: var DecoderState, n: int) = proc skipBytes(state: var DecoderState, n: int) =
## Skips a number of bytes. ## Skips a number of bytes.
if state.pos + n > state.buffer.len: if state.pos + n > state.len:
failInvalid() failInvalid()
state.pos += n state.pos += n
@ -266,7 +275,7 @@ proc decodeSOF0(state: var DecoderState) =
if quantizationTableId > 3: if quantizationTableId > 3:
failInvalid("invalid quantization table id") failInvalid("invalid quantization table id")
if vertical == 0 or vertical > 4 or horizontal == 0 or horizontal > 4: if vertical notin {1, 2, 4} or horizontal notin {1, 2, 4}:
failInvalid("invalid component scaling factor") failInvalid("invalid component scaling factor")
component.xScale = vertical.int component.xScale = vertical.int
@ -301,9 +310,9 @@ proc decodeSOF0(state: var DecoderState) =
# Allocate block data structures. # Allocate block data structures.
component.blocks = newSeqWith( component.blocks = newSeqWith(
component.width, state.numMcuWide * component.yScale,
newSeq[array[64, int16]]( newSeq[array[64, int16]](
component.height state.numMcuHigh * component.xScale
) )
) )
@ -314,9 +323,7 @@ proc decodeSOF0(state: var DecoderState) =
if state.progressive: if state.progressive:
component.widthCoeff = component.widthStride div 8 component.widthCoeff = component.widthStride div 8
component.heightCoeff = component.heightStride div 8 component.heightCoeff = component.heightStride div 8
component.coeff.setLen( component.coeff.setLen(component.widthStride * component.heightStride)
component.widthStride * component.heightStride
)
if len != 0: if len != 0:
failInvalid() failInvalid()
@ -384,9 +391,9 @@ proc reset(state: var DecoderState) =
## Rests the decoder state need for restart markers. ## Rests the decoder state need for restart markers.
state.bitBuffer = 0 state.bitBuffer = 0
state.bitsBuffered = 0 state.bitsBuffered = 0
state.hitEnd = false
for component in 0 ..< state.components.len: for component in 0 ..< state.components.len:
state.components[component].dcPred = 0 state.components[component].dcPred = 0
state.hitEnd = false
if state.restartInterval != 0: if state.restartInterval != 0:
state.todoBeforeRestart = state.restartInterval state.todoBeforeRestart = state.restartInterval
else: else:
@ -402,7 +409,7 @@ proc decodeSOS(state: var DecoderState) =
if state.scanComponents > state.components.len: if state.scanComponents > state.components.len:
failInvalid("extra components") failInvalid("extra components")
if state.scanComponents notin [1, 3]: if state.scanComponents notin {1, 3}:
failInvalid("unsupported scan component count") failInvalid("unsupported scan component count")
state.componentOrder.setLen(0) state.componentOrder.setLen(0)
@ -418,11 +425,11 @@ proc decodeSOS(state: var DecoderState) =
failInvalid() failInvalid()
var component: int var component: int
while component < 3: while component < state.components.len:
if state.components[component].id == id: if state.components[component].id == id:
break break
inc component inc component
if component == 3: if component == state.components.len:
failInvalid() # Not found failInvalid() # Not found
state.components[component].huffmanAC = huffmanAC.int state.components[component].huffmanAC = huffmanAC.int
@ -436,8 +443,6 @@ proc decodeSOS(state: var DecoderState) =
state.successiveApproxLow = aa and 15 state.successiveApproxLow = aa and 15
state.successiveApproxHigh = aa shr 4 state.successiveApproxHigh = aa shr 4
state.reset()
if state.progressive: if state.progressive:
if state.spectralStart > 63 or state.spectralEnd > 63: if state.spectralStart > 63 or state.spectralEnd > 63:
failInvalid() failInvalid()
@ -457,9 +462,11 @@ proc decodeSOS(state: var DecoderState) =
if len != 0: if len != 0:
failInvalid() failInvalid()
state.reset()
proc fillBitBuffer(state: var DecoderState) = proc fillBitBuffer(state: var DecoderState) =
## When we are low on bits, we need to call this to populate some more. ## When we are low on bits, we need to call this to populate some more.
while state.bitsBuffered < 24: while state.bitsBuffered <= 24:
let b = let b =
if state.hitEnd: if state.hitEnd:
0.uint32 0.uint32
@ -511,43 +518,38 @@ proc huffmanDecode(state: var DecoderState, tableCurrent, table: int): uint8 =
return huffman.symbols[symbolId] return huffman.symbols[symbolId]
template lrot(value: uint32, shift: int): uint32 = template lrot(value: uint32, shift: int): uint32 =
## Left rotate - used for huffman decoding. ## Left rotate
(value shl shift) or (value shr (32 - shift)) (value shl shift) or (value shr (32 - shift))
proc getBit(state: var DecoderState): int = proc readBit(state: var DecoderState): int =
## Get a single bit. ## Get a single bit.
if state.bitsBuffered < 1: if state.bitsBuffered < 1:
state.fillBitBuffer() state.fillBitBuffer()
let k = state.bitBuffer result = ((state.bitBuffer and cast[uint32](0x80000000)) shr 31).int
state.bitBuffer = state.bitBuffer shl 1 state.bitBuffer = state.bitBuffer shl 1
dec state.bitsBuffered dec state.bitsBuffered
return (k.int and 0x80000000.int)
proc getBitsAsSignedInt(state: var DecoderState, n: int): int = proc readBits(state: var DecoderState, n: int): int =
## Get n number of bits as a signed integer.
# TODO: Investigate why 15 not 16?
if n notin 0 .. 15:
failInvalid()
if state.bitsBuffered < n:
state.fillBitBuffer()
let sign = cast[int32](state.bitBuffer) shr 31
var k = lrot(state.bitBuffer, n)
state.bitBuffer = k and (not bitMasks[n])
k = k and bitMasks[n]
state.bitsBuffered -= n
result = k.int + (biases[n] and (not sign))
proc getBitsAsUnsignedInt(state: var DecoderState, n: int): int =
## Get n number of bits as a unsigned integer. ## Get n number of bits as a unsigned integer.
if n notin 0 .. 16: if n notin 0 .. 16:
failInvalid() failInvalid()
if state.bitsBuffered < n: if state.bitsBuffered < n:
state.fillBitBuffer() state.fillBitBuffer()
var k = lrot(state.bitBuffer, n) let k = lrot(state.bitBuffer, n)
result = (k and bitMasks[n]).int
state.bitBuffer = k and (not bitMasks[n]) state.bitBuffer = k and (not bitMasks[n])
k = k and bitMasks[n]
state.bitsBuffered -= n state.bitsBuffered -= n
return k.int
proc receiveExtend(state: var DecoderState, n: int): int =
## Get n number of bits as a signed integer. See Jpeg spec pages 109 and 114
## for EXTEND and RECEIVE.
var
v = state.readBits(n)
vt = (1 shl (n - 1))
if v < vt:
vt = (-1 shl n) + 1
v = v + vt
return v
proc decodeRegularBlock( proc decodeRegularBlock(
state: var DecoderState, component: int, data: var array[64, int16] state: var DecoderState, component: int, data: var array[64, int16]
@ -561,7 +563,7 @@ proc decodeRegularBlock(
if t == 0: if t == 0:
0 0
else: else:
state.getBitsAsSignedInt(t) state.receiveExtend(t)
dc = state.components[component].dcPred + diff dc = state.components[component].dcPred + diff
state.components[component].dcPred = dc state.components[component].dcPred = dc
data[0] = cast[int16](dc) data[0] = cast[int16](dc)
@ -581,7 +583,7 @@ proc decodeRegularBlock(
if i >= 64: if i >= 64:
failInvalid() failInvalid()
let zig = deZigZag[i] let zig = deZigZag[i]
data[zig] = cast[int16](state.getBitsAsSignedInt(s.int)) data[zig] = cast[int16](state.receiveExtend(s.int))
inc i inc i
proc decodeProgressiveBlock( proc decodeProgressiveBlock(
@ -598,14 +600,14 @@ proc decodeProgressiveBlock(
let let
diff = diff =
if t > 0: if t > 0:
state.getBitsAsSignedInt(t) state.receiveExtend(t)
else: else:
0 0
dc = state.components[component].dcPred + diff dc = state.components[component].dcPred + diff
state.components[component].dcPred = dc state.components[component].dcPred = dc
data[0] = cast[int16](dc * (1 shl state.successiveApproxLow)) data[0] = cast[int16](dc * (1 shl state.successiveApproxLow))
else: else:
if getBit(state) != 0: if state.readBit() != 0:
data[0] = cast[int16](data[0] + (1 shl state.successiveApproxLow)) data[0] = cast[int16](data[0] + (1 shl state.successiveApproxLow))
proc decodeProgressiveContinuationBlock( proc decodeProgressiveContinuationBlock(
@ -632,7 +634,7 @@ proc decodeProgressiveContinuationBlock(
if r < 15: if r < 15:
state.eobRun = 1 shl r state.eobRun = 1 shl r
if r != 0: if r != 0:
state.eobRun += state.getBitsAsUnsignedInt(r) state.eobRun += state.readBits(r)
dec state.eobRun dec state.eobRun
break break
k += 16 k += 16
@ -644,7 +646,7 @@ proc decodeProgressiveContinuationBlock(
inc k inc k
if s >= 15: if s >= 15:
failInvalid() failInvalid()
data[zig] = cast[int16](state.getBitsAsSignedInt(s.int) * (1 shl shift)) data[zig] = cast[int16](state.receiveExtend(s.int) * (1 shl shift))
else: else:
var bit = 1 shl state.successiveApproxLow var bit = 1 shl state.successiveApproxLow
@ -654,7 +656,7 @@ proc decodeProgressiveContinuationBlock(
for k in state.spectralStart ..< state.spectralEnd: for k in state.spectralStart ..< state.spectralEnd:
let zig = deZigZag[k] let zig = deZigZag[k]
if data[zig] != 0: if data[zig] != 0:
if state.getBit() != 0: if state.readBit() != 0:
if (data[zig] and bit) == 0: if (data[zig] and bit) == 0:
if data[zig] > 0: if data[zig] > 0:
data[zig] = cast[int16](data[zig] + bit) data[zig] = cast[int16](data[zig] + bit)
@ -671,14 +673,14 @@ proc decodeProgressiveContinuationBlock(
if r < 15: if r < 15:
state.eobRun = (1 shl r) - 1 state.eobRun = (1 shl r) - 1
if r != 0: if r != 0:
state.eobRun += state.getBitsAsUnsignedInt(r) state.eobRun += state.readBits(r)
r = 64 # force end of block r = 64 # force end of block
else: else:
discard discard
else: else:
if s != 1: if s != 1:
failInvalid("bad huffman code") failInvalid("bad huffman code")
if getBit(state) != 0: if state.readBit() != 0:
s = bit.int s = bit.int
else: else:
s = -bit.int s = -bit.int
@ -687,7 +689,7 @@ proc decodeProgressiveContinuationBlock(
let zig = deZigZag[k] let zig = deZigZag[k]
inc k inc k
if data[zig] != 0: if data[zig] != 0:
if getBit(state) != 0: if state.readBit() != 0:
if (data[zig] and bit) == 0: if (data[zig] and bit) == 0:
if data[zig] > 0: if data[zig] > 0:
data[zig] = cast[int16](data[zig] + bit) data[zig] = cast[int16](data[zig] + bit)
@ -833,14 +835,12 @@ proc checkRestart(state: var DecoderState) =
## Check if we might have run into a restart marker, then deal with it. ## Check if we might have run into a restart marker, then deal with it.
dec state.todoBeforeRestart dec state.todoBeforeRestart
if state.todoBeforeRestart <= 0: if state.todoBeforeRestart <= 0:
if state.bitsBuffered < 24: if state.pos + 1 > state.len:
state.fillBitBuffer() failInvalid()
if state.buffer[state.pos] != 0xFF or
if state.buffer[state.pos] == 0xFF.char: state.buffer[state.pos + 1] notin {0xD0 .. 0xD7}:
if state.buffer[state.pos + 1] in {0xD0.char .. 0xD7.char}:
state.pos += 2
else:
failInvalid("did not get expected restart marker") failInvalid("did not get expected restart marker")
state.pos += 2
state.reset() state.reset()
proc decodeBlocks(state: var DecoderState) = proc decodeBlocks(state: var DecoderState) =
@ -849,8 +849,8 @@ proc decodeBlocks(state: var DecoderState) =
# Single component pass. # Single component pass.
let let
comp = state.componentOrder[0] comp = state.componentOrder[0]
w = (state.components[comp].width + 7) shr 3 w = (state.components[comp].width + 7) div 8
h = (state.components[comp].height + 7) shr 3 h = (state.components[comp].height + 7) div 8
for column in 0 ..< h: for column in 0 ..< h:
for row in 0 ..< w: for row in 0 ..< w:
state.decodeBlock(comp, row, column) state.decodeBlock(comp, row, column)
@ -872,16 +872,27 @@ proc quantizationAndIDCTPass(state: var DecoderState) =
## Does quantization and IDCT. ## Does quantization and IDCT.
for comp in 0 ..< state.components.len: for comp in 0 ..< state.components.len:
let let
w = (state.components[comp].width + 7) shr 3 w = (state.components[comp].width + 7) div 8
h = (state.components[comp].height + 7) shr 3 h = (state.components[comp].height + 7) div 8
qTableId = state.components[comp].quantizationTableId qTableId = state.components[comp].quantizationTableId
if qTableId.int notin 0 ..< state.quantizationTables.len: if qTableId.int notin 0 ..< state.quantizationTables.len:
failInvalid() failInvalid()
for column in 0 ..< h: for column in 0 ..< h:
for row in 0 ..< w: for row in 0 ..< w:
var data {.byaddr.} = state.components[comp].blocks[row][column] var data {.byaddr.} = state.components[comp].blocks[row][column]
when defined(amd64) and not defined(pixieNoSimd):
for i in 0 ..< 8: # 8 per pass
var q = mm_loadu_si128(state.quantizationTables[qTableId][i * 8].addr)
q = mm_unpacklo_epi8(q, mm_setzero_si128())
var v = mm_loadu_si128(data[i * 8].addr)
mm_storeu_si128(data[i * 8].addr, mm_mullo_epi16(v, q))
else:
for i in 0 ..< 64: for i in 0 ..< 64:
data[i] = cast[int16](data[i] * state.quantizationTables[qTableId][i].int32) data[i] = cast[int16](
data[i] * state.quantizationTables[qTableId][i].int32
)
state.components[comp].idctBlock( state.components[comp].idctBlock(
state.components[comp].widthStride * column * 8 + row * 8, state.components[comp].widthStride * column * 8 + row * 8,
data data
@ -946,7 +957,10 @@ proc grayScaleToRgbx(gray: uint8): ColorRGBX {.inline.} =
proc buildImage(state: var DecoderState): Image = proc buildImage(state: var DecoderState): Image =
## Takes a jpeg image object and builds a pixie Image from it. ## Takes a jpeg image object and builds a pixie Image from it.
if state.components.len == 3: result = newImage(state.imageWidth, state.imageHeight)
case state.components.len:
of 3:
for component in state.components.mitems: for component in state.components.mitems:
while component.yScale < state.maxYScale: while component.yScale < state.maxYScale:
component.channel = component.channel.magnifyXBy2() component.channel = component.channel.magnifyXBy2()
@ -956,9 +970,6 @@ proc buildImage(state: var DecoderState): Image =
component.channel = component.channel.magnifyYBy2() component.channel = component.channel.magnifyYBy2()
component.xScale *= 2 component.xScale *= 2
result = newImage(state.imageWidth, state.imageHeight)
if state.components.len == 3:
let let
cy = state.components[0].channel cy = state.components[0].channel
cb = state.components[1].channel cb = state.components[1].channel
@ -972,13 +983,15 @@ proc buildImage(state: var DecoderState): Image =
cr.data[channelIndex], cr.data[channelIndex],
) )
inc channelIndex inc channelIndex
elif state.components.len == 1:
of 1:
let cy = state.components[0].channel let cy = state.components[0].channel
for y in 0 ..< state.imageHeight: for y in 0 ..< state.imageHeight:
var channelIndex = cy.dataIndex(0, y) var channelIndex = cy.dataIndex(0, y)
for x in 0 ..< state.imageWidth: for x in 0 ..< state.imageWidth:
result.unsafe[x, y] = grayScaleToRgbx(cy.data[channelIndex]) result.unsafe[x, y] = grayScaleToRgbx(cy.data[channelIndex])
inc channelIndex inc channelIndex
else: else:
failInvalid() failInvalid()
@ -1012,7 +1025,8 @@ proc decodeJpeg*(data: string): Image {.raises: [PixieError].} =
## Decodes the JPEG into an Image. ## Decodes the JPEG into an Image.
var state = DecoderState() var state = DecoderState()
state.buffer = data state.buffer = cast[ptr UncheckedArray[uint8]](data.cstring)
state.len = data.len
while true: while true:
if state.readUint8() != 0xFF: if state.readUint8() != 0xFF:

View file

@ -172,14 +172,14 @@ proc flipVertical*(image: Image) {.raises: [].} =
proc rotate90*(image: Image) {.raises: [PixieError].} = proc rotate90*(image: Image) {.raises: [PixieError].} =
## Rotates the image 90 degrees clockwise. ## Rotates the image 90 degrees clockwise.
let copy = newImage(image.height, image.width) let rotated = newImage(image.height, image.width)
for y in 0 ..< copy.height: for y in 0 ..< rotated.height:
for x in 0 ..< copy.width: for x in 0 ..< rotated.width:
copy.data[copy.dataIndex(x, y)] = rotated.data[rotated.dataIndex(x, y)] =
image.data[image.dataIndex(y, image.height - x - 1)] image.data[image.dataIndex(y, image.height - x - 1)]
image.width = copy.width image.width = rotated.width
image.height = copy.height image.height = rotated.height
image.data = copy.data image.data = move rotated.data
proc subImage*(image: Image, x, y, w, h: int): Image {.raises: [PixieError].} = proc subImage*(image: Image, x, y, w, h: int): Image {.raises: [PixieError].} =
## Gets a sub image from this image. ## Gets a sub image from this image.

View file

@ -1143,7 +1143,7 @@ proc partitionSegments(
partition.requiresAntiAliasing = partition.requiresAntiAliasing =
requiresAntiAliasing(partition.entries) requiresAntiAliasing(partition.entries)
proc getIndexForY(partitioning: Partitioning, y: int): uint32 {.inline.} = proc getIndexForY(partitioning: var Partitioning, y: int): uint32 {.inline.} =
if partitioning.partitions.len == 1: if partitioning.partitions.len == 1:
0.uint32 0.uint32
else: else:
@ -1152,7 +1152,7 @@ proc getIndexForY(partitioning: Partitioning, y: int): uint32 {.inline.} =
partitioning.partitions.high.uint32 partitioning.partitions.high.uint32
) )
proc maxEntryCount(partitioning: Partitioning): int = proc maxEntryCount(partitioning: var Partitioning): int =
for i in 0 ..< partitioning.partitions.len: for i in 0 ..< partitioning.partitions.len:
result = max(result, partitioning.partitions[i].entries.len) result = max(result, partitioning.partitions[i].entries.len)
@ -1240,12 +1240,10 @@ proc computeCoverage(
aa: var bool, aa: var bool,
width: float32, width: float32,
y, startX: int, y, startX: int,
partitioning: Partitioning, partitioning: var Partitioning,
windingRule: WindingRule windingRule: WindingRule
) {.inline.} = ) {.inline.} =
let let partitionIndex = partitioning.getIndexForY(y)
partitionIndex = partitioning.getIndexForY(y)
partitionEntryCount = partitioning.partitions[partitionIndex].entries.len
aa = partitioning.partitions[partitionIndex].requiresAntiAliasing aa = partitioning.partitions[partitionIndex].requiresAntiAliasing
@ -1259,8 +1257,7 @@ proc computeCoverage(
for m in 0 ..< quality: for m in 0 ..< quality:
yLine += offset yLine += offset
numHits = 0 numHits = 0
for i in 0 ..< partitionEntryCount: # Perf for entry in partitioning.partitions[partitionIndex].entries.mitems:
let entry = partitioning.partitions[partitionIndex].entries[i].unsafeAddr # Perf
if entry.segment.at.y <= yLine and entry.segment.to.y >= yLine: if entry.segment.at.y <= yLine and entry.segment.to.y >= yLine:
let x = let x =
if entry.m == 0: if entry.m == 0:
@ -1620,7 +1617,6 @@ proc fillShapes(
else: else:
0 0
pathHeight = min(image.height, (bounds.y + bounds.h).int) pathHeight = min(image.height, (bounds.y + bounds.h).int)
partitioning = partitionSegments(segments, startY, pathHeight - startY)
if pathWidth == 0: if pathWidth == 0:
return return
@ -1629,6 +1625,7 @@ proc fillShapes(
raise newException(PixieError, "Path int overflow detected") raise newException(PixieError, "Path int overflow detected")
var var
partitioning = partitionSegments(segments, startY, pathHeight - startY)
coverages = newSeq[uint8](pathWidth) coverages = newSeq[uint8](pathWidth)
hits = newSeq[(float32, int16)](partitioning.maxEntryCount) hits = newSeq[(float32, int16)](partitioning.maxEntryCount)
numHits: int numHits: int
@ -1689,7 +1686,6 @@ proc fillShapes(
else: else:
0 0
pathHeight = min(mask.height, (bounds.y + bounds.h).int) pathHeight = min(mask.height, (bounds.y + bounds.h).int)
partitioning = partitionSegments(segments, startY, pathHeight)
if pathWidth == 0: if pathWidth == 0:
return return
@ -1698,6 +1694,7 @@ proc fillShapes(
raise newException(PixieError, "Path int overflow detected") raise newException(PixieError, "Path int overflow detected")
var var
partitioning = partitionSegments(segments, startY, pathHeight)
coverages = newSeq[uint8](pathWidth) coverages = newSeq[uint8](pathWidth)
hits = newSeq[(float32, int16)](partitioning.maxEntryCount) hits = newSeq[(float32, int16)](partitioning.maxEntryCount)
numHits: int numHits: int

View file

@ -63,6 +63,11 @@ timeIt "flipVertical":
reset() reset()
timeIt "rotate90":
image.rotate90()
reset()
timeIt "invert": timeIt "invert":
image.invert() image.invert()

View file

@ -9,7 +9,7 @@ for file in jpegSuiteFiles:
let genFile = file.replace("masters", "generated").replace(".jpg", ".png") let genFile = file.replace("masters", "generated").replace(".jpg", ".png")
img.writeFile(genFile) img.writeFile(genFile)
if execShellCmd(&"magick {file} {genFile}") != 0: if execShellCmd(&"magick {file} -auto-orient {genFile}") != 0:
echo "fail" echo "fail"
var img2 = readImage(genFile) var img2 = readImage(genFile)