From c7dd442a30bf64388dfeb7aaabf06e62d6b8afb9 Mon Sep 17 00:00:00 2001 From: Ryan Oldenburg Date: Sun, 22 May 2022 19:04:37 -0500 Subject: [PATCH 01/29] f --- src/pixie/paths.nim | 17 +++++++---------- 1 file changed, 7 insertions(+), 10 deletions(-) diff --git a/src/pixie/paths.nim b/src/pixie/paths.nim index ce37c1c..414a619 100644 --- a/src/pixie/paths.nim +++ b/src/pixie/paths.nim @@ -1143,7 +1143,7 @@ proc partitionSegments( partition.requiresAntiAliasing = requiresAntiAliasing(partition.entries) -proc getIndexForY(partitioning: Partitioning, y: int): uint32 {.inline.} = +proc getIndexForY(partitioning: var Partitioning, y: int): uint32 {.inline.} = if partitioning.partitions.len == 1: 0.uint32 else: @@ -1152,7 +1152,7 @@ proc getIndexForY(partitioning: Partitioning, y: int): uint32 {.inline.} = partitioning.partitions.high.uint32 ) -proc maxEntryCount(partitioning: Partitioning): int = +proc maxEntryCount(partitioning: var Partitioning): int = for i in 0 ..< partitioning.partitions.len: result = max(result, partitioning.partitions[i].entries.len) @@ -1240,12 +1240,10 @@ proc computeCoverage( aa: var bool, width: float32, y, startX: int, - partitioning: Partitioning, + partitioning: var Partitioning, windingRule: WindingRule ) {.inline.} = - let - partitionIndex = partitioning.getIndexForY(y) - partitionEntryCount = partitioning.partitions[partitionIndex].entries.len + let partitionIndex = partitioning.getIndexForY(y) aa = partitioning.partitions[partitionIndex].requiresAntiAliasing @@ -1259,8 +1257,7 @@ proc computeCoverage( for m in 0 ..< quality: yLine += offset numHits = 0 - for i in 0 ..< partitionEntryCount: # Perf - let entry = partitioning.partitions[partitionIndex].entries[i].unsafeAddr # Perf + for entry in partitioning.partitions[partitionIndex].entries.mitems: if entry.segment.at.y <= yLine and entry.segment.to.y >= yLine: let x = if entry.m == 0: @@ -1620,7 +1617,6 @@ proc fillShapes( else: 0 pathHeight = min(image.height, (bounds.y + bounds.h).int) - partitioning = partitionSegments(segments, startY, pathHeight - startY) if pathWidth == 0: return @@ -1629,6 +1625,7 @@ proc fillShapes( raise newException(PixieError, "Path int overflow detected") var + partitioning = partitionSegments(segments, startY, pathHeight - startY) coverages = newSeq[uint8](pathWidth) hits = newSeq[(float32, int16)](partitioning.maxEntryCount) numHits: int @@ -1689,7 +1686,6 @@ proc fillShapes( else: 0 pathHeight = min(mask.height, (bounds.y + bounds.h).int) - partitioning = partitionSegments(segments, startY, pathHeight) if pathWidth == 0: return @@ -1698,6 +1694,7 @@ proc fillShapes( raise newException(PixieError, "Path int overflow detected") var + partitioning = partitionSegments(segments, startY, pathHeight) coverages = newSeq[uint8](pathWidth) hits = newSeq[(float32, int16)](partitioning.maxEntryCount) numHits: int From e9f09a14dd5b89e9afd796f2c6219c0c46493663 Mon Sep 17 00:00:00 2001 From: Ryan Oldenburg Date: Wed, 25 May 2022 18:21:55 -0500 Subject: [PATCH 02/29] avoid copying data --- src/pixie/fileformats/jpeg.nim | 23 +++++++++++++---------- 1 file changed, 13 insertions(+), 10 deletions(-) diff --git a/src/pixie/fileformats/jpeg.nim b/src/pixie/fileformats/jpeg.nim index d5c8e65..811ad06 100644 --- a/src/pixie/fileformats/jpeg.nim +++ b/src/pixie/fileformats/jpeg.nim @@ -65,8 +65,9 @@ type channel: Mask DecoderState = object - buffer: string - pos, bitsBuffered: int + buffer: ptr UncheckedArray[uint8] + len, pos: int + bitsBuffered: int bitBuffer: uint32 hitEnd: bool imageHeight, imageWidth: int @@ -102,9 +103,9 @@ template clampByte(x: int32): uint8 = proc readUint8(state: var DecoderState): uint8 = ## Reads a byte from the input stream. - if state.pos >= state.buffer.len: + if state.pos >= state.len: failInvalid() - result = cast[uint8](state.buffer[state.pos]) + result = state.buffer[state.pos] inc state.pos proc readUint16be(state: var DecoderState): uint16 = @@ -121,14 +122,15 @@ proc readUint32be(state: var DecoderState): uint32 = proc readStr(state: var DecoderState, n: int): string = ## Reads n number of bytes as a string. - if state.pos + n > state.buffer.len: + if state.pos + n > state.len: failInvalid() - result = state.buffer[state.pos ..< state.pos + n] + result.setLen(n) + copyMem(result[0].addr, state.buffer[state.pos].addr, n) state.pos += n proc skipBytes(state: var DecoderState, n: int) = ## Skips a number of bytes. - if state.pos + n > state.buffer.len: + if state.pos + n > state.len: failInvalid() state.pos += n @@ -836,8 +838,8 @@ proc checkRestart(state: var DecoderState) = if state.bitsBuffered < 24: state.fillBitBuffer() - if state.buffer[state.pos] == 0xFF.char: - if state.buffer[state.pos + 1] in {0xD0.char .. 0xD7.char}: + if state.buffer[state.pos] == 0xFF: + if state.buffer[state.pos + 1] in {0xD0 .. 0xD7}: state.pos += 2 else: failInvalid("did not get expected restart marker") @@ -1012,7 +1014,8 @@ proc decodeJpeg*(data: string): Image {.raises: [PixieError].} = ## Decodes the JPEG into an Image. var state = DecoderState() - state.buffer = data + state.buffer = cast[ptr UncheckedArray[uint8]](data[0].unsafeAddr) + state.len = data.len while true: if state.readUint8() != 0xFF: From 268e653b05e01161837c786a00a9a476086ef8c8 Mon Sep 17 00:00:00 2001 From: Ryan Oldenburg Date: Wed, 25 May 2022 18:22:49 -0500 Subject: [PATCH 03/29] no cost --- src/pixie/fileformats/jpeg.nim | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/pixie/fileformats/jpeg.nim b/src/pixie/fileformats/jpeg.nim index 811ad06..e2c1990 100644 --- a/src/pixie/fileformats/jpeg.nim +++ b/src/pixie/fileformats/jpeg.nim @@ -93,7 +93,7 @@ template failInvalid(reason = "unable to load") = ## Throw exception with a reason. raise newException(PixieError, "Invalid JPEG, " & reason) -template clampByte(x: int32): uint8 = +proc clampByte(x: int32): uint8 {.inline.} = ## Clamp integer into byte range. # clamp(x, 0, 0xFF).uint8 let From e67f257479202f5df922089b8418affc7a1a62ab Mon Sep 17 00:00:00 2001 From: Ryan Oldenburg Date: Wed, 25 May 2022 18:30:48 -0500 Subject: [PATCH 04/29] faster --- src/pixie/fileformats/jpeg.nim | 20 ++++++++++++++------ 1 file changed, 14 insertions(+), 6 deletions(-) diff --git a/src/pixie/fileformats/jpeg.nim b/src/pixie/fileformats/jpeg.nim index e2c1990..8d0695a 100644 --- a/src/pixie/fileformats/jpeg.nim +++ b/src/pixie/fileformats/jpeg.nim @@ -110,15 +110,23 @@ proc readUint8(state: var DecoderState): uint8 = proc readUint16be(state: var DecoderState): uint16 = ## Reads uint16 big-endian from the input stream. - (state.readUint8().uint16 shl 8) or state.readUint8() + if state.pos + 2 > state.len: + failInvalid() + result = + (state.buffer[state.pos].uint16 shl 8) or + state.buffer[state.pos + 1] + state.pos += 2 proc readUint32be(state: var DecoderState): uint32 = ## Reads uint32 big-endian from the input stream. - return - (state.readUint8().uint32 shl 24) or - (state.readUint8().uint32 shl 16) or - (state.readUint8().uint32 shl 8) or - state.readUint8().uint32 + if state.pos + 4 > state.len: + failInvalid() + result = + (state.buffer[state.pos + 0].uint32 shl 24) or + (state.buffer[state.pos + 1].uint32 shl 16) or + (state.buffer[state.pos + 2].uint32 shl 8) or + state.buffer[state.pos + 3] + state.pos += 4 proc readStr(state: var DecoderState, n: int): string = ## Reads n number of bytes as a string. From 49acd68ce9c0848145ff7c3aa03235f887d02fad Mon Sep 17 00:00:00 2001 From: Ryan Oldenburg Date: Wed, 25 May 2022 18:54:13 -0500 Subject: [PATCH 05/29] 2x faster --- src/pixie/images.nim | 14 +++++++------- tests/benchmark_images.nim | 5 +++++ 2 files changed, 12 insertions(+), 7 deletions(-) diff --git a/src/pixie/images.nim b/src/pixie/images.nim index a5fb534..ce3b415 100644 --- a/src/pixie/images.nim +++ b/src/pixie/images.nim @@ -172,14 +172,14 @@ proc flipVertical*(image: Image) {.raises: [].} = proc rotate90*(image: Image) {.raises: [PixieError].} = ## Rotates the image 90 degrees clockwise. - let copy = newImage(image.height, image.width) - for y in 0 ..< copy.height: - for x in 0 ..< copy.width: - copy.data[copy.dataIndex(x, y)] = + let rotated = newImage(image.height, image.width) + for y in 0 ..< rotated.height: + for x in 0 ..< rotated.width: + rotated.data[rotated.dataIndex(x, y)] = image.data[image.dataIndex(y, image.height - x - 1)] - image.width = copy.width - image.height = copy.height - image.data = copy.data + image.width = rotated.width + image.height = rotated.height + image.data = move rotated.data proc subImage*(image: Image, x, y, w, h: int): Image {.raises: [PixieError].} = ## Gets a sub image from this image. diff --git a/tests/benchmark_images.nim b/tests/benchmark_images.nim index 7be2761..60cd261 100644 --- a/tests/benchmark_images.nim +++ b/tests/benchmark_images.nim @@ -63,6 +63,11 @@ timeIt "flipVertical": reset() +timeIt "rotate90": + image.rotate90() + +reset() + timeIt "invert": image.invert() From 5c04aacbe2e46d082d14513cf1c7bf19f92c84b7 Mon Sep 17 00:00:00 2001 From: Ryan Oldenburg Date: Wed, 25 May 2022 18:57:33 -0500 Subject: [PATCH 06/29] better check --- src/pixie/fileformats/jpeg.nim | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/pixie/fileformats/jpeg.nim b/src/pixie/fileformats/jpeg.nim index 8d0695a..43a9146 100644 --- a/src/pixie/fileformats/jpeg.nim +++ b/src/pixie/fileformats/jpeg.nim @@ -276,7 +276,7 @@ proc decodeSOF0(state: var DecoderState) = if quantizationTableId > 3: failInvalid("invalid quantization table id") - if vertical == 0 or vertical > 4 or horizontal == 0 or horizontal > 4: + if vertical notin {0, 1, 2, 4} or horizontal notin {0, 1, 2, 4}: failInvalid("invalid component scaling factor") component.xScale = vertical.int From 102215a611e368aa928e5e23e7ca8f0a93d72ba7 Mon Sep 17 00:00:00 2001 From: Ryan Oldenburg Date: Wed, 25 May 2022 18:59:52 -0500 Subject: [PATCH 07/29] f --- src/pixie/fileformats/jpeg.nim | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/pixie/fileformats/jpeg.nim b/src/pixie/fileformats/jpeg.nim index 43a9146..aeba663 100644 --- a/src/pixie/fileformats/jpeg.nim +++ b/src/pixie/fileformats/jpeg.nim @@ -69,7 +69,6 @@ type len, pos: int bitsBuffered: int bitBuffer: uint32 - hitEnd: bool imageHeight, imageWidth: int quantizationTables: array[4, array[64, uint8]] huffmanTables: array[2, array[4, Huffman]] # 0 = DC, 1 = AC @@ -84,6 +83,7 @@ type restartInterval: int todoBeforeRestart: int eobRun: int + hitEnd: bool orientation: int when defined(release): From dd2571d3a6c7a45aea9538f5b2602747f2cfa286 Mon Sep 17 00:00:00 2001 From: Ryan Oldenburg Date: Wed, 25 May 2022 19:10:24 -0500 Subject: [PATCH 08/29] f --- src/pixie/fileformats/jpeg.nim | 12 +++++------- 1 file changed, 5 insertions(+), 7 deletions(-) diff --git a/src/pixie/fileformats/jpeg.nim b/src/pixie/fileformats/jpeg.nim index aeba663..71c60d7 100644 --- a/src/pixie/fileformats/jpeg.nim +++ b/src/pixie/fileformats/jpeg.nim @@ -73,11 +73,11 @@ type quantizationTables: array[4, array[64, uint8]] huffmanTables: array[2, array[4, Huffman]] # 0 = DC, 1 = AC components: seq[Component] + maxYScale, maxXScale: int + mcuWidth, mcuHeight, numMcuWide, numMcuHigh: int scanComponents: int spectralStart, spectralEnd: int successiveApproxLow, successiveApproxHigh: int - maxYScale, maxXScale: int - mcuWidth, mcuHeight, numMcuWide, numMcuHigh: int componentOrder: seq[int] progressive: bool restartInterval: int @@ -324,9 +324,7 @@ proc decodeSOF0(state: var DecoderState) = if state.progressive: component.widthCoeff = component.widthStride div 8 component.heightCoeff = component.heightStride div 8 - component.coeff.setLen( - component.widthStride * component.heightStride - ) + component.coeff.setLen(component.widthStride * component.heightStride) if len != 0: failInvalid() @@ -428,11 +426,11 @@ proc decodeSOS(state: var DecoderState) = failInvalid() var component: int - while component < 3: + while component < state.components.len: if state.components[component].id == id: break inc component - if component == 3: + if component == state.components.len: failInvalid() # Not found state.components[component].huffmanAC = huffmanAC.int From 871740a95e7f2a8e6cc42e8c9eadfd912bfd7121 Mon Sep 17 00:00:00 2001 From: Ryan Oldenburg Date: Wed, 25 May 2022 19:10:38 -0500 Subject: [PATCH 09/29] fuzz fix --- src/pixie/fileformats/jpeg.nim | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/pixie/fileformats/jpeg.nim b/src/pixie/fileformats/jpeg.nim index 71c60d7..29ee736 100644 --- a/src/pixie/fileformats/jpeg.nim +++ b/src/pixie/fileformats/jpeg.nim @@ -1020,7 +1020,7 @@ proc decodeJpeg*(data: string): Image {.raises: [PixieError].} = ## Decodes the JPEG into an Image. var state = DecoderState() - state.buffer = cast[ptr UncheckedArray[uint8]](data[0].unsafeAddr) + state.buffer = cast[ptr UncheckedArray[uint8]](data.cstring) state.len = data.len while true: From 3b67e809c5a8a31c63a2351438b848bab7f3b37a Mon Sep 17 00:00:00 2001 From: Ryan Oldenburg Date: Wed, 25 May 2022 19:13:48 -0500 Subject: [PATCH 10/29] f --- src/pixie/fileformats/jpeg.nim | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/pixie/fileformats/jpeg.nim b/src/pixie/fileformats/jpeg.nim index 29ee736..05cbee1 100644 --- a/src/pixie/fileformats/jpeg.nim +++ b/src/pixie/fileformats/jpeg.nim @@ -410,7 +410,7 @@ proc decodeSOS(state: var DecoderState) = if state.scanComponents > state.components.len: failInvalid("extra components") - if state.scanComponents notin [1, 3]: + if state.scanComponents notin {1, 3}: failInvalid("unsupported scan component count") state.componentOrder.setLen(0) From 07d16c7c8790b6e0f69f1cc8f1c84d75930b56c5 Mon Sep 17 00:00:00 2001 From: Ryan Oldenburg Date: Wed, 25 May 2022 19:20:45 -0500 Subject: [PATCH 11/29] f --- src/pixie/fileformats/jpeg.nim | 10 ++++++---- 1 file changed, 6 insertions(+), 4 deletions(-) diff --git a/src/pixie/fileformats/jpeg.nim b/src/pixie/fileformats/jpeg.nim index 05cbee1..ae41de4 100644 --- a/src/pixie/fileformats/jpeg.nim +++ b/src/pixie/fileformats/jpeg.nim @@ -69,12 +69,14 @@ type len, pos: int bitsBuffered: int bitBuffer: uint32 + imageHeight, imageWidth: int quantizationTables: array[4, array[64, uint8]] huffmanTables: array[2, array[4, Huffman]] # 0 = DC, 1 = AC components: seq[Component] maxYScale, maxXScale: int mcuWidth, mcuHeight, numMcuWide, numMcuHigh: int + scanComponents: int spectralStart, spectralEnd: int successiveApproxLow, successiveApproxHigh: int @@ -857,8 +859,8 @@ proc decodeBlocks(state: var DecoderState) = # Single component pass. let comp = state.componentOrder[0] - w = (state.components[comp].width + 7) shr 3 - h = (state.components[comp].height + 7) shr 3 + w = (state.components[comp].width + 7) div 8 + h = (state.components[comp].height + 7) div 8 for column in 0 ..< h: for row in 0 ..< w: state.decodeBlock(comp, row, column) @@ -880,8 +882,8 @@ proc quantizationAndIDCTPass(state: var DecoderState) = ## Does quantization and IDCT. for comp in 0 ..< state.components.len: let - w = (state.components[comp].width + 7) shr 3 - h = (state.components[comp].height + 7) shr 3 + w = (state.components[comp].width + 7) div 8 + h = (state.components[comp].height + 7) div 8 qTableId = state.components[comp].quantizationTableId if qTableId.int notin 0 ..< state.quantizationTables.len: failInvalid() From 297ddc6c6016b9df6e3cda647b1b4b2b03e293f3 Mon Sep 17 00:00:00 2001 From: Ryan Oldenburg Date: Wed, 25 May 2022 19:22:17 -0500 Subject: [PATCH 12/29] f --- src/pixie/fileformats/jpeg.nim | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/pixie/fileformats/jpeg.nim b/src/pixie/fileformats/jpeg.nim index ae41de4..ea3d4d5 100644 --- a/src/pixie/fileformats/jpeg.nim +++ b/src/pixie/fileformats/jpeg.nim @@ -521,7 +521,7 @@ proc huffmanDecode(state: var DecoderState, tableCurrent, table: int): uint8 = return huffman.symbols[symbolId] template lrot(value: uint32, shift: int): uint32 = - ## Left rotate - used for huffman decoding. + ## Left rotate (value shl shift) or (value shr (32 - shift)) proc getBit(state: var DecoderState): int = From d49ef8be19304456f2822750784690d407114048 Mon Sep 17 00:00:00 2001 From: Ryan Oldenburg Date: Wed, 25 May 2022 19:35:28 -0500 Subject: [PATCH 13/29] f --- src/pixie/fileformats/jpeg.nim | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/src/pixie/fileformats/jpeg.nim b/src/pixie/fileformats/jpeg.nim index ea3d4d5..d734de2 100644 --- a/src/pixie/fileformats/jpeg.nim +++ b/src/pixie/fileformats/jpeg.nim @@ -446,8 +446,6 @@ proc decodeSOS(state: var DecoderState) = state.successiveApproxLow = aa and 15 state.successiveApproxHigh = aa shr 4 - state.reset() - if state.progressive: if state.spectralStart > 63 or state.spectralEnd > 63: failInvalid() @@ -467,6 +465,8 @@ proc decodeSOS(state: var DecoderState) = if len != 0: failInvalid() + state.reset() + proc fillBitBuffer(state: var DecoderState) = ## When we are low on bits, we need to call this to populate some more. while state.bitsBuffered < 24: From 403a2b95a8867b9a8826633b28dbd5a95610d50a Mon Sep 17 00:00:00 2001 From: Ryan Oldenburg Date: Wed, 25 May 2022 19:39:22 -0500 Subject: [PATCH 14/29] f --- src/pixie/fileformats/jpeg.nim | 5 ++--- 1 file changed, 2 insertions(+), 3 deletions(-) diff --git a/src/pixie/fileformats/jpeg.nim b/src/pixie/fileformats/jpeg.nim index d734de2..45f0ec4 100644 --- a/src/pixie/fileformats/jpeg.nim +++ b/src/pixie/fileformats/jpeg.nim @@ -69,24 +69,23 @@ type len, pos: int bitsBuffered: int bitBuffer: uint32 - imageHeight, imageWidth: int + progressive: bool quantizationTables: array[4, array[64, uint8]] huffmanTables: array[2, array[4, Huffman]] # 0 = DC, 1 = AC components: seq[Component] maxYScale, maxXScale: int mcuWidth, mcuHeight, numMcuWide, numMcuHigh: int + orientation: int scanComponents: int spectralStart, spectralEnd: int successiveApproxLow, successiveApproxHigh: int componentOrder: seq[int] - progressive: bool restartInterval: int todoBeforeRestart: int eobRun: int hitEnd: bool - orientation: int when defined(release): {.push checks: off.} From 75f630f824ae4126161a6de37aeafd853277c33f Mon Sep 17 00:00:00 2001 From: Ryan Oldenburg Date: Wed, 25 May 2022 19:41:33 -0500 Subject: [PATCH 15/29] case --- src/pixie/fileformats/jpeg.nim | 12 +++++++----- 1 file changed, 7 insertions(+), 5 deletions(-) diff --git a/src/pixie/fileformats/jpeg.nim b/src/pixie/fileformats/jpeg.nim index 45f0ec4..9ca1375 100644 --- a/src/pixie/fileformats/jpeg.nim +++ b/src/pixie/fileformats/jpeg.nim @@ -955,7 +955,10 @@ proc grayScaleToRgbx(gray: uint8): ColorRGBX {.inline.} = proc buildImage(state: var DecoderState): Image = ## Takes a jpeg image object and builds a pixie Image from it. - if state.components.len == 3: + result = newImage(state.imageWidth, state.imageHeight) + + case state.components.len: + of 3: for component in state.components.mitems: while component.yScale < state.maxYScale: component.channel = component.channel.magnifyXBy2() @@ -965,9 +968,6 @@ proc buildImage(state: var DecoderState): Image = component.channel = component.channel.magnifyYBy2() component.xScale *= 2 - result = newImage(state.imageWidth, state.imageHeight) - - if state.components.len == 3: let cy = state.components[0].channel cb = state.components[1].channel @@ -981,13 +981,15 @@ proc buildImage(state: var DecoderState): Image = cr.data[channelIndex], ) inc channelIndex - elif state.components.len == 1: + + of 1: let cy = state.components[0].channel for y in 0 ..< state.imageHeight: var channelIndex = cy.dataIndex(0, y) for x in 0 ..< state.imageWidth: result.unsafe[x, y] = grayScaleToRgbx(cy.data[channelIndex]) inc channelIndex + else: failInvalid() From b360b68fe8f1ab34b0bebd34df696d595415e11d Mon Sep 17 00:00:00 2001 From: Ryan Oldenburg Date: Wed, 25 May 2022 19:57:47 -0500 Subject: [PATCH 16/29] f --- src/pixie/fileformats/jpeg.nim | 14 ++++++-------- 1 file changed, 6 insertions(+), 8 deletions(-) diff --git a/src/pixie/fileformats/jpeg.nim b/src/pixie/fileformats/jpeg.nim index 9ca1375..0235ad0 100644 --- a/src/pixie/fileformats/jpeg.nim +++ b/src/pixie/fileformats/jpeg.nim @@ -842,14 +842,12 @@ proc checkRestart(state: var DecoderState) = ## Check if we might have run into a restart marker, then deal with it. dec state.todoBeforeRestart if state.todoBeforeRestart <= 0: - if state.bitsBuffered < 24: - state.fillBitBuffer() - - if state.buffer[state.pos] == 0xFF: - if state.buffer[state.pos + 1] in {0xD0 .. 0xD7}: - state.pos += 2 - else: - failInvalid("did not get expected restart marker") + if state.pos + 1 > state.len: + failInvalid() + if state.buffer[state.pos] != 0xFF or + state.buffer[state.pos + 1] notin {0xD0 .. 0xD7}: + failInvalid("did not get expected restart marker") + state.pos += 2 state.reset() proc decodeBlocks(state: var DecoderState) = From 7ca2d51a9b8c2012322dd9c42341239fa1a7a40f Mon Sep 17 00:00:00 2001 From: Ryan Oldenburg Date: Wed, 25 May 2022 20:09:21 -0500 Subject: [PATCH 17/29] f --- src/pixie/fileformats/jpeg.nim | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/src/pixie/fileformats/jpeg.nim b/src/pixie/fileformats/jpeg.nim index 0235ad0..e7c79b4 100644 --- a/src/pixie/fileformats/jpeg.nim +++ b/src/pixie/fileformats/jpeg.nim @@ -393,9 +393,9 @@ proc reset(state: var DecoderState) = ## Rests the decoder state need for restart markers. state.bitBuffer = 0 state.bitsBuffered = 0 + state.hitEnd = false for component in 0 ..< state.components.len: state.components[component].dcPred = 0 - state.hitEnd = false if state.restartInterval != 0: state.todoBeforeRestart = state.restartInterval else: @@ -468,7 +468,7 @@ proc decodeSOS(state: var DecoderState) = proc fillBitBuffer(state: var DecoderState) = ## When we are low on bits, we need to call this to populate some more. - while state.bitsBuffered < 24: + while state.bitsBuffered <= 24: let b = if state.hitEnd: 0.uint32 From 4dc81592f67f9d1f38fedee3ca38266611e8ed31 Mon Sep 17 00:00:00 2001 From: Ryan Oldenburg Date: Wed, 25 May 2022 20:56:54 -0500 Subject: [PATCH 18/29] some simd --- src/pixie/fileformats/jpeg.nim | 18 ++++++++++++++++-- 1 file changed, 16 insertions(+), 2 deletions(-) diff --git a/src/pixie/fileformats/jpeg.nim b/src/pixie/fileformats/jpeg.nim index e7c79b4..fa32e67 100644 --- a/src/pixie/fileformats/jpeg.nim +++ b/src/pixie/fileformats/jpeg.nim @@ -1,6 +1,9 @@ import pixie/common, pixie/images, pixie/masks, sequtils, strutils, chroma, std/decls, flatty/binny +when defined(amd64) and not defined(pixieNoSimd): + import nimsimd/sse2 + # This JPEG decoder is loosely based on stb_image which is public domain. # JPEG is a complex format, this decoder only supports the most common features: @@ -887,8 +890,19 @@ proc quantizationAndIDCTPass(state: var DecoderState) = for column in 0 ..< h: for row in 0 ..< w: var data {.byaddr.} = state.components[comp].blocks[row][column] - for i in 0 ..< 64: - data[i] = cast[int16](data[i] * state.quantizationTables[qTableId][i].int32) + + when defined(amd64) and not defined(pixieNoSimd): + for i in 0 ..< 8: # 8 per pass + var q = mm_loadu_si128(state.quantizationTables[qTableId][i * 8].addr) + q = mm_unpacklo_epi8(q, mm_setzero_si128()) + var v = mm_loadu_si128(data[i * 8].addr) + mm_storeu_si128(data[i * 8].addr, mm_mullo_epi16(v, q)) + else: + for i in 0 ..< 64: + data[i] = cast[int16]( + data[i] * state.quantizationTables[qTableId][i].int32 + ) + state.components[comp].idctBlock( state.components[comp].widthStride * column * 8 + row * 8, data From 18f8d63e203cf9d1d768e2be9b9a09be8ca45df5 Mon Sep 17 00:00:00 2001 From: Ryan Oldenburg Date: Wed, 25 May 2022 21:08:14 -0500 Subject: [PATCH 19/29] fix --- src/pixie/fileformats/jpeg.nim | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/pixie/fileformats/jpeg.nim b/src/pixie/fileformats/jpeg.nim index fa32e67..09100f2 100644 --- a/src/pixie/fileformats/jpeg.nim +++ b/src/pixie/fileformats/jpeg.nim @@ -280,7 +280,7 @@ proc decodeSOF0(state: var DecoderState) = if quantizationTableId > 3: failInvalid("invalid quantization table id") - if vertical notin {0, 1, 2, 4} or horizontal notin {0, 1, 2, 4}: + if vertical notin {1, 2, 4} or horizontal notin {1, 2, 4}: failInvalid("invalid component scaling factor") component.xScale = vertical.int From fc3b30ccd2069dda2711381d7cddb5daaa803019 Mon Sep 17 00:00:00 2001 From: Ryan Oldenburg Date: Wed, 25 May 2022 21:42:55 -0500 Subject: [PATCH 20/29] significant mem savings --- src/pixie/fileformats/jpeg.nim | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/src/pixie/fileformats/jpeg.nim b/src/pixie/fileformats/jpeg.nim index 09100f2..4656ab4 100644 --- a/src/pixie/fileformats/jpeg.nim +++ b/src/pixie/fileformats/jpeg.nim @@ -315,9 +315,9 @@ proc decodeSOF0(state: var DecoderState) = # Allocate block data structures. component.blocks = newSeqWith( - component.width, + state.numMcuWide * component.yScale, newSeq[array[64, int16]]( - component.height + state.numMcuHigh * component.xScale ) ) From 11bd83b49582a88fad605519d0fd97eaa30e939a Mon Sep 17 00:00:00 2001 From: Ryan Oldenburg Date: Wed, 25 May 2022 21:46:32 -0500 Subject: [PATCH 21/29] f --- src/pixie/fileformats/jpeg.nim | 1 - 1 file changed, 1 deletion(-) diff --git a/src/pixie/fileformats/jpeg.nim b/src/pixie/fileformats/jpeg.nim index 4656ab4..bd78aa7 100644 --- a/src/pixie/fileformats/jpeg.nim +++ b/src/pixie/fileformats/jpeg.nim @@ -80,7 +80,6 @@ type maxYScale, maxXScale: int mcuWidth, mcuHeight, numMcuWide, numMcuHigh: int orientation: int - scanComponents: int spectralStart, spectralEnd: int successiveApproxLow, successiveApproxHigh: int From 7b1cd09cd35557bec8f1e0bc02201f9e7cabb5ad Mon Sep 17 00:00:00 2001 From: Ryan Oldenburg Date: Wed, 25 May 2022 22:09:07 -0500 Subject: [PATCH 22/29] getBit endian --- src/pixie/fileformats/jpeg.nim | 9 ++++----- 1 file changed, 4 insertions(+), 5 deletions(-) diff --git a/src/pixie/fileformats/jpeg.nim b/src/pixie/fileformats/jpeg.nim index bd78aa7..d30c619 100644 --- a/src/pixie/fileformats/jpeg.nim +++ b/src/pixie/fileformats/jpeg.nim @@ -529,10 +529,9 @@ proc getBit(state: var DecoderState): int = ## Get a single bit. if state.bitsBuffered < 1: state.fillBitBuffer() - let k = state.bitBuffer + result = ((state.bitBuffer and cast[uint32](0x80000000)) shr 31).int state.bitBuffer = state.bitBuffer shl 1 dec state.bitsBuffered - return (k.int and 0x80000000.int) proc getBitsAsSignedInt(state: var DecoderState, n: int): int = ## Get n number of bits as a signed integer. @@ -616,7 +615,7 @@ proc decodeProgressiveBlock( state.components[component].dcPred = dc data[0] = cast[int16](dc * (1 shl state.successiveApproxLow)) else: - if getBit(state) != 0: + if state.getBit() != 0: data[0] = cast[int16](data[0] + (1 shl state.successiveApproxLow)) proc decodeProgressiveContinuationBlock( @@ -689,7 +688,7 @@ proc decodeProgressiveContinuationBlock( else: if s != 1: failInvalid("bad huffman code") - if getBit(state) != 0: + if state.getBit() != 0: s = bit.int else: s = -bit.int @@ -698,7 +697,7 @@ proc decodeProgressiveContinuationBlock( let zig = deZigZag[k] inc k if data[zig] != 0: - if getBit(state) != 0: + if state.getBit() != 0: if (data[zig] and bit) == 0: if data[zig] > 0: data[zig] = cast[int16](data[zig] + bit) From b1d111d1bf8db042413152d49ba021494894218c Mon Sep 17 00:00:00 2001 From: Ryan Oldenburg Date: Wed, 25 May 2022 22:17:41 -0500 Subject: [PATCH 23/29] getBits --- src/pixie/fileformats/jpeg.nim | 11 +++++------ 1 file changed, 5 insertions(+), 6 deletions(-) diff --git a/src/pixie/fileformats/jpeg.nim b/src/pixie/fileformats/jpeg.nim index d30c619..1f4418c 100644 --- a/src/pixie/fileformats/jpeg.nim +++ b/src/pixie/fileformats/jpeg.nim @@ -547,17 +547,16 @@ proc getBitsAsSignedInt(state: var DecoderState, n: int): int = state.bitsBuffered -= n result = k.int + (biases[n] and (not sign)) -proc getBitsAsUnsignedInt(state: var DecoderState, n: int): int = +proc getBits(state: var DecoderState, n: int): int = ## Get n number of bits as a unsigned integer. if n notin 0 .. 16: failInvalid() if state.bitsBuffered < n: state.fillBitBuffer() - var k = lrot(state.bitBuffer, n) + let k = lrot(state.bitBuffer, n) state.bitBuffer = k and (not bitMasks[n]) - k = k and bitMasks[n] + result = (k and bitMasks[n]).int state.bitsBuffered -= n - return k.int proc decodeRegularBlock( state: var DecoderState, component: int, data: var array[64, int16] @@ -642,7 +641,7 @@ proc decodeProgressiveContinuationBlock( if r < 15: state.eobRun = 1 shl r if r != 0: - state.eobRun += state.getBitsAsUnsignedInt(r) + state.eobRun += state.getBits(r) dec state.eobRun break k += 16 @@ -681,7 +680,7 @@ proc decodeProgressiveContinuationBlock( if r < 15: state.eobRun = (1 shl r) - 1 if r != 0: - state.eobRun += state.getBitsAsUnsignedInt(r) + state.eobRun += state.getBits(r) r = 64 # force end of block else: discard From 583c797b4020b6a37e48b31d72aaa433e45f65b5 Mon Sep 17 00:00:00 2001 From: Ryan Oldenburg Date: Wed, 25 May 2022 22:17:50 -0500 Subject: [PATCH 24/29] move --- src/pixie/fileformats/jpeg.nim | 22 +++++++++++----------- 1 file changed, 11 insertions(+), 11 deletions(-) diff --git a/src/pixie/fileformats/jpeg.nim b/src/pixie/fileformats/jpeg.nim index 1f4418c..450aa9e 100644 --- a/src/pixie/fileformats/jpeg.nim +++ b/src/pixie/fileformats/jpeg.nim @@ -533,6 +533,17 @@ proc getBit(state: var DecoderState): int = state.bitBuffer = state.bitBuffer shl 1 dec state.bitsBuffered +proc getBits(state: var DecoderState, n: int): int = + ## Get n number of bits as a unsigned integer. + if n notin 0 .. 16: + failInvalid() + if state.bitsBuffered < n: + state.fillBitBuffer() + let k = lrot(state.bitBuffer, n) + state.bitBuffer = k and (not bitMasks[n]) + result = (k and bitMasks[n]).int + state.bitsBuffered -= n + proc getBitsAsSignedInt(state: var DecoderState, n: int): int = ## Get n number of bits as a signed integer. # TODO: Investigate why 15 not 16? @@ -547,17 +558,6 @@ proc getBitsAsSignedInt(state: var DecoderState, n: int): int = state.bitsBuffered -= n result = k.int + (biases[n] and (not sign)) -proc getBits(state: var DecoderState, n: int): int = - ## Get n number of bits as a unsigned integer. - if n notin 0 .. 16: - failInvalid() - if state.bitsBuffered < n: - state.fillBitBuffer() - let k = lrot(state.bitBuffer, n) - state.bitBuffer = k and (not bitMasks[n]) - result = (k and bitMasks[n]).int - state.bitsBuffered -= n - proc decodeRegularBlock( state: var DecoderState, component: int, data: var array[64, int16] ) = From 8caaca13c0cb4a4f24154d178e1767e49ee4f08f Mon Sep 17 00:00:00 2001 From: Ryan Oldenburg Date: Wed, 25 May 2022 22:22:42 -0500 Subject: [PATCH 25/29] f --- src/pixie/fileformats/jpeg.nim | 10 +++++----- 1 file changed, 5 insertions(+), 5 deletions(-) diff --git a/src/pixie/fileformats/jpeg.nim b/src/pixie/fileformats/jpeg.nim index 450aa9e..04139bd 100644 --- a/src/pixie/fileformats/jpeg.nim +++ b/src/pixie/fileformats/jpeg.nim @@ -540,8 +540,8 @@ proc getBits(state: var DecoderState, n: int): int = if state.bitsBuffered < n: state.fillBitBuffer() let k = lrot(state.bitBuffer, n) - state.bitBuffer = k and (not bitMasks[n]) result = (k and bitMasks[n]).int + state.bitBuffer = k and (not bitMasks[n]) state.bitsBuffered -= n proc getBitsAsSignedInt(state: var DecoderState, n: int): int = @@ -551,12 +551,12 @@ proc getBitsAsSignedInt(state: var DecoderState, n: int): int = failInvalid() if state.bitsBuffered < n: state.fillBitBuffer() - let sign = cast[int32](state.bitBuffer) shr 31 - var k = lrot(state.bitBuffer, n) + let + sign = cast[int32](state.bitBuffer) shr 31 # Sign is always in MSB + k = lrot(state.bitBuffer, n) + result = (k and bitMasks[n]).int + (biases[n] and (not sign)) state.bitBuffer = k and (not bitMasks[n]) - k = k and bitMasks[n] state.bitsBuffered -= n - result = k.int + (biases[n] and (not sign)) proc decodeRegularBlock( state: var DecoderState, component: int, data: var array[64, int16] From 0c075e6774274016b4a365fbc1c2f79d7833c14c Mon Sep 17 00:00:00 2001 From: Ryan Oldenburg Date: Wed, 25 May 2022 22:23:37 -0500 Subject: [PATCH 26/29] get -> read --- src/pixie/fileformats/jpeg.nim | 16 ++++++++-------- 1 file changed, 8 insertions(+), 8 deletions(-) diff --git a/src/pixie/fileformats/jpeg.nim b/src/pixie/fileformats/jpeg.nim index 04139bd..5eb76b8 100644 --- a/src/pixie/fileformats/jpeg.nim +++ b/src/pixie/fileformats/jpeg.nim @@ -525,7 +525,7 @@ template lrot(value: uint32, shift: int): uint32 = ## Left rotate (value shl shift) or (value shr (32 - shift)) -proc getBit(state: var DecoderState): int = +proc readBit(state: var DecoderState): int = ## Get a single bit. if state.bitsBuffered < 1: state.fillBitBuffer() @@ -533,7 +533,7 @@ proc getBit(state: var DecoderState): int = state.bitBuffer = state.bitBuffer shl 1 dec state.bitsBuffered -proc getBits(state: var DecoderState, n: int): int = +proc readBits(state: var DecoderState, n: int): int = ## Get n number of bits as a unsigned integer. if n notin 0 .. 16: failInvalid() @@ -614,7 +614,7 @@ proc decodeProgressiveBlock( state.components[component].dcPred = dc data[0] = cast[int16](dc * (1 shl state.successiveApproxLow)) else: - if state.getBit() != 0: + if state.readBit() != 0: data[0] = cast[int16](data[0] + (1 shl state.successiveApproxLow)) proc decodeProgressiveContinuationBlock( @@ -641,7 +641,7 @@ proc decodeProgressiveContinuationBlock( if r < 15: state.eobRun = 1 shl r if r != 0: - state.eobRun += state.getBits(r) + state.eobRun += state.readBits(r) dec state.eobRun break k += 16 @@ -663,7 +663,7 @@ proc decodeProgressiveContinuationBlock( for k in state.spectralStart ..< state.spectralEnd: let zig = deZigZag[k] if data[zig] != 0: - if state.getBit() != 0: + if state.readBit() != 0: if (data[zig] and bit) == 0: if data[zig] > 0: data[zig] = cast[int16](data[zig] + bit) @@ -680,14 +680,14 @@ proc decodeProgressiveContinuationBlock( if r < 15: state.eobRun = (1 shl r) - 1 if r != 0: - state.eobRun += state.getBits(r) + state.eobRun += state.readBits(r) r = 64 # force end of block else: discard else: if s != 1: failInvalid("bad huffman code") - if state.getBit() != 0: + if state.readBit() != 0: s = bit.int else: s = -bit.int @@ -696,7 +696,7 @@ proc decodeProgressiveContinuationBlock( let zig = deZigZag[k] inc k if data[zig] != 0: - if state.getBit() != 0: + if state.readBit() != 0: if (data[zig] and bit) == 0: if data[zig] > 0: data[zig] = cast[int16](data[zig] + bit) From 43b776bb94614b830539e569b166086953c444c3 Mon Sep 17 00:00:00 2001 From: Ryan Oldenburg Date: Wed, 25 May 2022 23:18:22 -0500 Subject: [PATCH 27/29] just follow spec --- src/pixie/fileformats/jpeg.nim | 31 ++++++++++++++----------------- 1 file changed, 14 insertions(+), 17 deletions(-) diff --git a/src/pixie/fileformats/jpeg.nim b/src/pixie/fileformats/jpeg.nim index 5eb76b8..a7b2326 100644 --- a/src/pixie/fileformats/jpeg.nim +++ b/src/pixie/fileformats/jpeg.nim @@ -544,19 +544,16 @@ proc readBits(state: var DecoderState, n: int): int = state.bitBuffer = k and (not bitMasks[n]) state.bitsBuffered -= n -proc getBitsAsSignedInt(state: var DecoderState, n: int): int = - ## Get n number of bits as a signed integer. - # TODO: Investigate why 15 not 16? - if n notin 0 .. 15: - failInvalid() - if state.bitsBuffered < n: - state.fillBitBuffer() - let - sign = cast[int32](state.bitBuffer) shr 31 # Sign is always in MSB - k = lrot(state.bitBuffer, n) - result = (k and bitMasks[n]).int + (biases[n] and (not sign)) - state.bitBuffer = k and (not bitMasks[n]) - state.bitsBuffered -= n +proc receiveExtend(state: var DecoderState, n: int): int = + ## Get n number of bits as a signed integer. See Jpeg spec pages 109 and 114 + ## for EXTEND and RECEIVE. + var + v = state.readBits(n) + vt = (1 shl (n - 1)) + if v < vt: + vt = (-1 shl n) + 1 + v = v + vt + return v proc decodeRegularBlock( state: var DecoderState, component: int, data: var array[64, int16] @@ -570,7 +567,7 @@ proc decodeRegularBlock( if t == 0: 0 else: - state.getBitsAsSignedInt(t) + state.receiveExtend(t) dc = state.components[component].dcPred + diff state.components[component].dcPred = dc data[0] = cast[int16](dc) @@ -590,7 +587,7 @@ proc decodeRegularBlock( if i >= 64: failInvalid() let zig = deZigZag[i] - data[zig] = cast[int16](state.getBitsAsSignedInt(s.int)) + data[zig] = cast[int16](state.receiveExtend(s.int)) inc i proc decodeProgressiveBlock( @@ -607,7 +604,7 @@ proc decodeProgressiveBlock( let diff = if t > 0: - state.getBitsAsSignedInt(t) + state.receiveExtend(t) else: 0 dc = state.components[component].dcPred + diff @@ -653,7 +650,7 @@ proc decodeProgressiveContinuationBlock( inc k if s >= 15: failInvalid() - data[zig] = cast[int16](state.getBitsAsSignedInt(s.int) * (1 shl shift)) + data[zig] = cast[int16](state.receiveExtend(s.int) * (1 shl shift)) else: var bit = 1 shl state.successiveApproxLow From 123ac5e5552e3fbbcbda605a258733c08823bcd2 Mon Sep 17 00:00:00 2001 From: Ryan Oldenburg Date: Wed, 25 May 2022 23:51:07 -0500 Subject: [PATCH 28/29] unused --- src/pixie/fileformats/jpeg.nim | 4 ---- 1 file changed, 4 deletions(-) diff --git a/src/pixie/fileformats/jpeg.nim b/src/pixie/fileformats/jpeg.nim index a7b2326..f2eebf3 100644 --- a/src/pixie/fileformats/jpeg.nim +++ b/src/pixie/fileformats/jpeg.nim @@ -41,10 +41,6 @@ const 0.uint32, 1, 3, 7, 15, 31, 63, 127, 255, 511, 1023, 2047, 4095, 8191, 16383, 32767, 65535 ] - biases = [ # (-1 shl n) + 1 - 0.int32, -1, -3, -7, -15, -31, -63, -127, -255, - -511, -1023, -2047, -4095, -8191, -16383, -32767 - ] type Huffman = object From 76bde1498c60176a4da6a4f92355e5bde97a45ea Mon Sep 17 00:00:00 2001 From: Ryan Oldenburg Date: Wed, 25 May 2022 23:56:45 -0500 Subject: [PATCH 29/29] fix validate test --- tests/validate_jpeg.nim | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/tests/validate_jpeg.nim b/tests/validate_jpeg.nim index 3f296c6..ce62a7c 100644 --- a/tests/validate_jpeg.nim +++ b/tests/validate_jpeg.nim @@ -9,7 +9,7 @@ for file in jpegSuiteFiles: let genFile = file.replace("masters", "generated").replace(".jpg", ".png") img.writeFile(genFile) - if execShellCmd(&"magick {file} {genFile}") != 0: + if execShellCmd(&"magick {file} -auto-orient {genFile}") != 0: echo "fail" var img2 = readImage(genFile)