From a519ecdf133f58a96bc7ec68529f8ca48e8bbcbe Mon Sep 17 00:00:00 2001
From: Ryan Oldenburg <ryan@guzba.com>
Date: Thu, 16 Jun 2022 01:48:34 -0500
Subject: [PATCH 1/5] implement the last 2 mask:mask blends simd

---
 src/pixie/blends.nim | 41 ++++++++++++++++++++++++++++++++++++++++-
 src/pixie/paths.nim  | 19 +++++++++++++++++--
 2 files changed, 57 insertions(+), 3 deletions(-)

diff --git a/src/pixie/blends.nim b/src/pixie/blends.nim
index 9f0e652..6b04a32 100644
--- a/src/pixie/blends.nim
+++ b/src/pixie/blends.nim
@@ -647,24 +647,63 @@ when defined(amd64) and allowSimd:
 
     mm_or_si128(backdropEven, mm_slli_epi16(backdropOdd, 8))
 
+  proc maskBlendSubtractSimd*(backdrop, source: M128i): M128i {.inline.} =
+    let
+      oddMask = mm_set1_epi16(cast[int16](0xff00))
+      vec255 = mm_set1_epi8(255)
+      div255 = mm_set1_epi16(cast[int16](0x8081))
+
+    let sourceMinus255 = mm_sub_epi8(vec255, source)
+
+    var
+      multiplierEven = mm_slli_epi16(sourceMinus255, 8)
+      multiplierOdd = mm_and_si128(sourceMinus255, oddMask)
+      backdropEven = mm_slli_epi16(backdrop, 8)
+      backdropOdd = mm_and_si128(backdrop, oddMask)
+
+    backdropEven = mm_mulhi_epu16(backdropEven, multiplierEven)
+    backdropOdd = mm_mulhi_epu16(backdropOdd, multiplierOdd)
+
+    backdropEven = mm_srli_epi16(mm_mulhi_epu16(backdropEven, div255), 7)
+    backdropOdd = mm_srli_epi16(mm_mulhi_epu16(backdropOdd, div255), 7)
+
+    mm_or_si128(backdropEven, mm_slli_epi16(backdropOdd, 8))
+
+  proc maskBlendExcludeSimd*(backdrop, source: M128i): M128i {.inline.} =
+    mm_sub_epi8(mm_max_epu8(backdrop, source), mm_min_epu8(backdrop, source))
+
   proc maskBlendNormalSimdMasker(backdrop, source: M128i): M128i =
     maskBlendNormalSimd(backdrop, source)
 
   proc maskBlendMaskSimdMasker(backdrop, source: M128i): M128i =
     maskBlendMaskSimd(backdrop, source)
 
+  proc maskBlendExcludeSimdMasker(backdrop, source: M128i): M128i =
+    maskBlendExcludeSimd(backdrop, source)
+
+  proc maskBlendSubtractSimdMasker(backdrop, source: M128i): M128i =
+    maskBlendSubtractSimd(backdrop, source)
+
   proc maskerSimd*(blendMode: BlendMode): MaskerSimd {.raises: [PixieError].} =
     ## Returns a blend masking function with SIMD support.
     case blendMode:
     of NormalBlend: maskBlendNormalSimdMasker
     of MaskBlend: maskBlendMaskSimdMasker
     of OverwriteBlend: overwriteSimdBlender
+    of SubtractMaskBlend: maskBlendSubtractSimdMasker
+    of ExcludeMaskBlend: maskBlendExcludeSimdMasker
     else:
       raise newException(PixieError, "No SIMD masker for " & $blendMode)
 
   proc hasSimdMasker*(blendMode: BlendMode): bool {.inline, raises: [].} =
     ## Is there a blend masking function with SIMD support?
-    blendMode in {NormalBlend, MaskBlend, OverwriteBlend}
+    blendMode in {
+      NormalBlend,
+      MaskBlend,
+      OverwriteBlend,
+      SubtractMaskBlend,
+      ExcludeMaskBlend
+    }
 
 when defined(release):
   {.pop.}
diff --git a/src/pixie/paths.nim b/src/pixie/paths.nim
index a75582b..1fc1e56 100644
--- a/src/pixie/paths.nim
+++ b/src/pixie/paths.nim
@@ -1572,6 +1572,17 @@ proc fillHits(
   windingRule: WindingRule,
   blendMode: BlendMode
 ) =
+  template simdBlob(mask: Mask, x: var int, blendProc: untyped) =
+    when allowSimd:
+      when defined(amd64):
+        let vec255 = mm_set1_epi8(255)
+        for _ in 0 ..< fillLen div 16:
+          let
+            index = mask.dataIndex(x, y)
+            backdrop = mm_loadu_si128(mask.data[index].addr)
+          mm_storeu_si128(mask.data[index].addr, blendProc(backdrop, vec255))
+          x += 16
+
   case blendMode:
   of NormalBlend, OverwriteBlend:
     walkHits hits, numHits, windingRule, y, mask.width:
@@ -1590,13 +1601,17 @@ proc fillHits(
 
   of SubtractMaskBlend:
     walkHits hits, numHits, windingRule, y, mask.width:
-      for x in fillStart ..< fillStart + fillLen:
+      var x = fillStart
+      simdBlob(mask, x, maskBlendSubtractSimd)
+      for x in x ..< fillStart + fillLen:
         let backdrop = mask.unsafe[x, y]
         mask.unsafe[x, y] = maskBlendSubtract(backdrop, 255)
 
   of ExcludeMaskBlend:
     walkHits hits, numHits, windingRule, y, mask.width:
-      for x in fillStart ..< fillStart + fillLen:
+      var x = fillStart
+      simdBlob(mask, x, maskBlendExcludeSimd)
+      for x in x ..< fillStart + fillLen:
         let backdrop = mask.unsafe[x, y]
         mask.unsafe[x, y] = maskBlendExclude(backdrop, 255)
 

From 1d486783fa9ddd6a022810ca1e9f99158f2b8a93 Mon Sep 17 00:00:00 2001
From: Ryan Oldenburg <ryan@guzba.com>
Date: Thu, 16 Jun 2022 21:54:02 -0500
Subject: [PATCH 2/5] better names

---
 src/pixie/blends.nim | 46 ++++++++++++++++++++++----------------------
 src/pixie/images.nim | 10 +++++-----
 src/pixie/paths.nim  |  8 ++++----
 3 files changed, 32 insertions(+), 32 deletions(-)

diff --git a/src/pixie/blends.nim b/src/pixie/blends.nim
index 6b04a32..4a5e49b 100644
--- a/src/pixie/blends.nim
+++ b/src/pixie/blends.nim
@@ -11,8 +11,8 @@ when defined(amd64) and allowSimd:
 type
   Blender* = proc(backdrop, source: ColorRGBX): ColorRGBX {.gcsafe, raises: [].}
     ## Function signature returned by blender.
-  Masker* = proc(backdrop, source: uint8): uint8 {.gcsafe, raises: [].}
-    ## Function signature returned by masker.
+  MaskBlender* = proc(backdrop, source: uint8): uint8 {.gcsafe, raises: [].}
+    ## Function signature returned by maskBlender.
 
 when defined(release):
   {.push checks: off.}
@@ -484,29 +484,29 @@ proc maskBlendExclude*(backdrop, source: uint8): uint8 {.inline.} =
   ## Exclude blend masks
   max(backdrop, source) - min(backdrop, source)
 
-proc maskBlendNormalMasker(backdrop, source: uint8): uint8 =
+proc maskBlendNormalMaskBlender(backdrop, source: uint8): uint8 =
   maskBlendNormal(backdrop, source)
 
-proc maskBlendMaskMasker(backdrop, source: uint8): uint8 =
+proc maskBlendMaskMaskBlender(backdrop, source: uint8): uint8 =
   maskBlendMask(backdrop, source)
 
-proc maskBlendSubtractMasker(backdrop, source: uint8): uint8 =
+proc maskBlendSubtractMaskBlender(backdrop, source: uint8): uint8 =
   maskBlendSubtract(backdrop, source)
 
-proc maskBlendExcludeMasker(backdrop, source: uint8): uint8 =
+proc maskBlendExcludeMaskBlender(backdrop, source: uint8): uint8 =
   maskBlendExclude(backdrop, source)
 
-proc maskBlendOverwriteMasker(backdrop, source: uint8): uint8 =
+proc maskBlendOverwriteMaskBlender(backdrop, source: uint8): uint8 =
   source
 
-proc masker*(blendMode: BlendMode): Masker {.raises: [PixieError].} =
+proc maskBlender*(blendMode: BlendMode): MaskBlender {.raises: [PixieError].} =
   ## Returns a blend masking function for a given blend masking mode.
   case blendMode:
-  of NormalBlend: maskBlendNormalMasker
-  of MaskBlend: maskBlendMaskMasker
-  of OverwriteBlend: maskBlendOverwriteMasker
-  of SubtractMaskBlend: maskBlendSubtractMasker
-  of ExcludeMaskBlend: maskBlendExcludeMasker
+  of NormalBlend: maskBlendNormalMaskBlender
+  of MaskBlend: maskBlendMaskMaskBlender
+  of OverwriteBlend: maskBlendOverwriteMaskBlender
+  of SubtractMaskBlend: maskBlendSubtractMaskBlender
+  of ExcludeMaskBlend: maskBlendExcludeMaskBlender
   else:
     raise newException(PixieError, "No masker for " & $blendMode)
 
@@ -672,30 +672,30 @@ when defined(amd64) and allowSimd:
   proc maskBlendExcludeSimd*(backdrop, source: M128i): M128i {.inline.} =
     mm_sub_epi8(mm_max_epu8(backdrop, source), mm_min_epu8(backdrop, source))
 
-  proc maskBlendNormalSimdMasker(backdrop, source: M128i): M128i =
+  proc maskBlendNormalSimdMaskBlender(backdrop, source: M128i): M128i =
     maskBlendNormalSimd(backdrop, source)
 
-  proc maskBlendMaskSimdMasker(backdrop, source: M128i): M128i =
+  proc maskBlendMaskSimdMaskBlender(backdrop, source: M128i): M128i =
     maskBlendMaskSimd(backdrop, source)
 
-  proc maskBlendExcludeSimdMasker(backdrop, source: M128i): M128i =
+  proc maskBlendExcludeSimdMaskBlender(backdrop, source: M128i): M128i =
     maskBlendExcludeSimd(backdrop, source)
 
-  proc maskBlendSubtractSimdMasker(backdrop, source: M128i): M128i =
+  proc maskBlendSubtractSimdMaskBlender(backdrop, source: M128i): M128i =
     maskBlendSubtractSimd(backdrop, source)
 
-  proc maskerSimd*(blendMode: BlendMode): MaskerSimd {.raises: [PixieError].} =
+  proc maskBlenderSimd*(blendMode: BlendMode): MaskerSimd {.raises: [PixieError].} =
     ## Returns a blend masking function with SIMD support.
     case blendMode:
-    of NormalBlend: maskBlendNormalSimdMasker
-    of MaskBlend: maskBlendMaskSimdMasker
+    of NormalBlend: maskBlendNormalSimdMaskBlender
+    of MaskBlend: maskBlendMaskSimdMaskBlender
     of OverwriteBlend: overwriteSimdBlender
-    of SubtractMaskBlend: maskBlendSubtractSimdMasker
-    of ExcludeMaskBlend: maskBlendExcludeSimdMasker
+    of SubtractMaskBlend: maskBlendSubtractSimdMaskBlender
+    of ExcludeMaskBlend: maskBlendExcludeSimdMaskBlender
     else:
       raise newException(PixieError, "No SIMD masker for " & $blendMode)
 
-  proc hasSimdMasker*(blendMode: BlendMode): bool {.inline, raises: [].} =
+  proc hasSimdMaskBlender*(blendMode: BlendMode): bool {.inline, raises: [].} =
     ## Is there a blend masking function with SIMD support?
     blendMode in {
       NormalBlend,
diff --git a/src/pixie/images.nim b/src/pixie/images.nim
index 1f0e26d..ac82d87 100644
--- a/src/pixie/images.nim
+++ b/src/pixie/images.nim
@@ -714,7 +714,7 @@ proc drawUber(
   when type(a) is Image:
     let blender = blendMode.blender()
   else: # a is a Mask
-    let masker = blendMode.masker()
+    let maskBlender = blendMode.maskBlender()
 
   if blendMode == MaskBlend:
     if yMin > 0:
@@ -777,7 +777,7 @@ proc drawUber(
             let sample = b.getRgbaSmooth(srcPos.x, srcPos.y).a
           else: # b is a Mask
             let sample = b.getValueSmooth(srcPos.x, srcPos.y)
-          a.unsafe[x, y] = masker(backdrop, sample)
+          a.unsafe[x, y] = maskBlender(backdrop, sample)
 
         srcPos += dx
 
@@ -972,8 +972,8 @@ proc drawUber(
                   x += 16
                   sx += 16
             else: # is a Mask
-              if blendMode.hasSimdMasker():
-                let maskerSimd = blendMode.maskerSimd()
+              if blendMode.hasSimdMaskBlender():
+                let maskerSimd = blendMode.maskBlenderSimd()
                 for _ in 0 ..< (xStop - xStart) div 16:
                   let backdrop = mm_loadu_si128(a.data[a.dataIndex(x, y)].addr)
                   when type(b) is Image:
@@ -1089,7 +1089,7 @@ proc drawUber(
               let sample = b.unsafe[samplePos.x, samplePos.y].a
             else: # b is a Mask
               let sample = b.unsafe[samplePos.x, samplePos.y]
-            a.unsafe[x, y] = masker(backdrop, sample)
+            a.unsafe[x, y] = maskBlender(backdrop, sample)
           srcPos += dx
 
     if blendMode == MaskBlend:
diff --git a/src/pixie/paths.nim b/src/pixie/paths.nim
index 1fc1e56..4c5455e 100644
--- a/src/pixie/paths.nim
+++ b/src/pixie/paths.nim
@@ -1443,9 +1443,9 @@ proc fillCoverage(
 ) =
   var x = startX
   when defined(amd64) and allowSimd:
-    if blendMode.hasSimdMasker():
+    if blendMode.hasSimdMaskBlender():
       let
-        maskerSimd = blendMode.maskerSimd()
+        maskerSimd = blendMode.maskBlenderSimd()
         vecZero = mm_setzero_si128()
       for _ in 0 ..< coverages.len div 16:
         let
@@ -1465,7 +1465,7 @@ proc fillCoverage(
           mm_storeu_si128(mask.data[index].addr, vecZero)
         x += 16
 
-  let masker = blendMode.masker()
+  let maskBlender = blendMode.maskBlender()
   for x in x ..< startX + coverages.len:
     let coverage = coverages[x - startX]
     if coverage != 0 or blendMode == ExcludeMaskBlend:
@@ -1473,7 +1473,7 @@ proc fillCoverage(
         mask.unsafe[x, y] = coverage
       else:
         let backdrop = mask.unsafe[x, y]
-        mask.unsafe[x, y] = masker(backdrop, coverage)
+        mask.unsafe[x, y] = maskBlender(backdrop, coverage)
     elif blendMode == MaskBlend:
       mask.unsafe[x, y] = 0
 

From 2f2fe303ee36ed8517af03c05936133a7a060ab5 Mon Sep 17 00:00:00 2001
From: Ryan Oldenburg <ryan@guzba.com>
Date: Thu, 16 Jun 2022 23:16:47 -0500
Subject: [PATCH 3/5] use unsafe

---
 src/pixie/paths.nim | 12 ++++--------
 1 file changed, 4 insertions(+), 8 deletions(-)

diff --git a/src/pixie/paths.nim b/src/pixie/paths.nim
index 4c5455e..cc158eb 100644
--- a/src/pixie/paths.nim
+++ b/src/pixie/paths.nim
@@ -1511,10 +1511,8 @@ proc fillHits(
       when defined(amd64):
         let colorVec = mm_set1_epi32(cast[int32](rgbx))
         for _ in 0 ..< fillLen div 4:
-          let
-            index = image.dataIndex(x, y)
-            backdrop = mm_loadu_si128(image.data[index].addr)
-          mm_storeu_si128(image.data[index].addr, blendProc(backdrop, colorVec))
+          let backdrop = mm_loadu_si128(image.unsafe[x, y].addr)
+          mm_storeu_si128(image.unsafe[x, y].addr, blendProc(backdrop, colorVec))
           x += 4
 
   case blendMode:
@@ -1577,10 +1575,8 @@ proc fillHits(
       when defined(amd64):
         let vec255 = mm_set1_epi8(255)
         for _ in 0 ..< fillLen div 16:
-          let
-            index = mask.dataIndex(x, y)
-            backdrop = mm_loadu_si128(mask.data[index].addr)
-          mm_storeu_si128(mask.data[index].addr, blendProc(backdrop, vec255))
+          let backdrop = mm_loadu_si128(mask.unsafe[x, y].addr)
+          mm_storeu_si128(mask.unsafe[x, y].addr, blendProc(backdrop, vec255))
           x += 16
 
   case blendMode:

From 52bd7bef57a7f4e9e284cecf18616e07b34ccf42 Mon Sep 17 00:00:00 2001
From: Ryan Oldenburg <ryan@guzba.com>
Date: Thu, 16 Jun 2022 23:32:19 -0500
Subject: [PATCH 4/5] walkInteger iterator

---
 src/pixie/paths.nim | 96 ++++++++++++++++++++++-----------------------
 1 file changed, 47 insertions(+), 49 deletions(-)

diff --git a/src/pixie/paths.nim b/src/pixie/paths.nim
index cc158eb..72c0160 100644
--- a/src/pixie/paths.nim
+++ b/src/pixie/paths.nim
@@ -1158,7 +1158,7 @@ proc maxEntryCount(partitioning: var Partitioning): int =
 proc fixed32(f: float32): Fixed32 {.inline.} =
   Fixed32(f * 256)
 
-proc integer(p: Fixed32): int {.inline.} =
+proc integer(p: Fixed32): int32 {.inline.} =
   p div 256
 
 proc trunc(p: Fixed32): Fixed32 {.inline.} =
@@ -1223,6 +1223,20 @@ iterator walk(
     if prevAt != width.float32.fixed32 and count != 0:
       echo "Leak detected: ", count, " @ (", prevAt, ", ", y, ")"
 
+iterator walkInteger(
+  hits: seq[(int32, int16)],
+  numHits: int,
+  windingRule: WindingRule,
+  y, width: int
+): (int32, int32) =
+  for (prevAt, at, count) in hits.walk(numHits, windingRule, y, width):
+    let
+      fillStart = prevAt.integer
+      fillLen = at.integer - fillStart
+    if fillLen <= 0:
+      continue
+    yield (fillStart, fillLen)
+
 proc computeCoverage(
   coverages: ptr UncheckedArray[uint8],
   hits: var seq[(Fixed32, int16)],
@@ -1481,22 +1495,6 @@ proc fillCoverage(
     mask.clearUnsafe(0, y, startX, y)
     mask.clearUnsafe(startX + coverages.len, y, mask.width, y)
 
-template walkHits(
-  hits: seq[(int32, int16)],
-  numHits: int,
-  windingRule: WindingRule,
-  y, width: int,
-  inner: untyped
-) =
-  for (prevAt, at, count) in hits.walk(numHits, windingRule, y, width):
-    let
-      fillStart {.inject.} = prevAt.integer
-      fillLen {.inject.} = at.integer - fillStart
-    if fillLen <= 0:
-      continue
-
-    inner
-
 proc fillHits(
   image: Image,
   rgbx: ColorRGBX,
@@ -1506,36 +1504,36 @@ proc fillHits(
   windingRule: WindingRule,
   blendMode: BlendMode
 ) =
-  template simdBlob(image: Image, x: var int, blendProc: untyped) =
+  template simdBlob(image: Image, x: var int, len: int32, blendProc: untyped) =
     when allowSimd:
       when defined(amd64):
         let colorVec = mm_set1_epi32(cast[int32](rgbx))
-        for _ in 0 ..< fillLen div 4:
+        for _ in 0 ..< len div 4:
           let backdrop = mm_loadu_si128(image.unsafe[x, y].addr)
           mm_storeu_si128(image.unsafe[x, y].addr, blendProc(backdrop, colorVec))
           x += 4
 
   case blendMode:
   of OverwriteBlend:
-    walkHits hits, numHits, windingRule, y, image.width:
-      fillUnsafe(image.data, rgbx, image.dataIndex(fillStart, y), fillLen)
+    for (start, len) in hits.walkInteger(numHits, windingRule, y, image.width):
+      fillUnsafe(image.data, rgbx, image.dataIndex(start, y), len)
 
   of NormalBlend:
-    walkHits hits, numHits, windingRule, y, image.width:
+    for (start, len) in hits.walkInteger(numHits, windingRule, y, image.width):
       if rgbx.a == 255:
-        fillUnsafe(image.data, rgbx, image.dataIndex(fillStart, y), fillLen)
+        fillUnsafe(image.data, rgbx, image.dataIndex(start, y), len)
       else:
-        var x = fillStart
-        simdBlob(image, x, blendNormalSimd)
-        for x in x ..< fillStart + fillLen:
+        var x = start
+        simdBlob(image, x, len, blendNormalSimd)
+        for x in x ..< start + len:
           let backdrop = image.unsafe[x, y]
           image.unsafe[x, y] = blendNormal(backdrop, rgbx)
 
   of MaskBlend:
     var filledTo = startX
-    walkHits hits, numHits, windingRule, y, image.width:
+    for (start, len) in hits.walkInteger(numHits, windingRule, y, image.width):
       block: # Clear any gap between this fill and the previous fill
-        let gapBetween = fillStart - filledTo
+        let gapBetween = start - filledTo
         if gapBetween > 0:
           fillUnsafe(
             image.data,
@@ -1543,12 +1541,12 @@ proc fillHits(
             image.dataIndex(filledTo, y),
             gapBetween
           )
-        filledTo = fillStart + fillLen
+        filledTo = start + len
       block: # Handle this fill
         if rgbx.a != 255:
-          var x = fillStart
-          simdBlob(image, x, blendMaskSimd)
-          for x in x ..< fillStart + fillLen:
+          var x = start
+          simdBlob(image, x, len, blendMaskSimd)
+          for x in x ..< start + len:
             let backdrop = image.unsafe[x, y]
             image.unsafe[x, y] = blendMask(backdrop, rgbx)
 
@@ -1557,8 +1555,8 @@ proc fillHits(
 
   else:
     let blender = blendMode.blender()
-    walkHits hits, numHits, windingRule, y, image.width:
-      for x in fillStart ..< fillStart + fillLen:
+    for (start, len) in hits.walkInteger(numHits, windingRule, y, image.width):
+      for x in start ..< start + len:
         let backdrop = image.unsafe[x, y]
         image.unsafe[x, y] = blender(backdrop, rgbx)
 
@@ -1570,44 +1568,44 @@ proc fillHits(
   windingRule: WindingRule,
   blendMode: BlendMode
 ) =
-  template simdBlob(mask: Mask, x: var int, blendProc: untyped) =
+  template simdBlob(mask: Mask, x: var int, len: int32, blendProc: untyped) =
     when allowSimd:
       when defined(amd64):
         let vec255 = mm_set1_epi8(255)
-        for _ in 0 ..< fillLen div 16:
+        for _ in 0 ..< len div 16:
           let backdrop = mm_loadu_si128(mask.unsafe[x, y].addr)
           mm_storeu_si128(mask.unsafe[x, y].addr, blendProc(backdrop, vec255))
           x += 16
 
   case blendMode:
   of NormalBlend, OverwriteBlend:
-    walkHits hits, numHits, windingRule, y, mask.width:
-      fillUnsafe(mask.data, 255, mask.dataIndex(fillStart, y), fillLen)
+    for (start, len) in hits.walkInteger(numHits, windingRule, y, mask.width):
+      fillUnsafe(mask.data, 255, mask.dataIndex(start, y), len)
 
   of MaskBlend:
     var filledTo = startX
-    walkHits hits, numHits, windingRule,y,  mask.width:
-      let gapBetween = fillStart - filledTo
+    for (start, len) in hits.walkInteger(numHits, windingRule, y, mask.width):
+      let gapBetween = start - filledTo
       if gapBetween > 0:
         fillUnsafe(mask.data, 0, mask.dataIndex(filledTo, y), gapBetween)
-      filledTo = fillStart + fillLen
+      filledTo = start + len
 
     mask.clearUnsafe(0, y, startX, y)
     mask.clearUnsafe(filledTo, y, mask.width, y)
 
   of SubtractMaskBlend:
-    walkHits hits, numHits, windingRule, y, mask.width:
-      var x = fillStart
-      simdBlob(mask, x, maskBlendSubtractSimd)
-      for x in x ..< fillStart + fillLen:
+    for (start, len) in hits.walkInteger(numHits, windingRule, y, mask.width):
+      var x = start
+      simdBlob(mask, x, len, maskBlendSubtractSimd)
+      for x in x ..< start + len:
         let backdrop = mask.unsafe[x, y]
         mask.unsafe[x, y] = maskBlendSubtract(backdrop, 255)
 
   of ExcludeMaskBlend:
-    walkHits hits, numHits, windingRule, y, mask.width:
-      var x = fillStart
-      simdBlob(mask, x, maskBlendExcludeSimd)
-      for x in x ..< fillStart + fillLen:
+    for (start, len) in hits.walkInteger(numHits, windingRule, y, mask.width):
+      var x = start
+      simdBlob(mask, x, len, maskBlendExcludeSimd)
+      for x in x ..< start + len:
         let backdrop = mask.unsafe[x, y]
         mask.unsafe[x, y] = maskBlendExclude(backdrop, 255)
 

From b0303245f5306cda8a6e64fe1eb5d2cc28edbf2e Mon Sep 17 00:00:00 2001
From: Ryan Oldenburg <ryan@guzba.com>
Date: Fri, 17 Jun 2022 00:19:26 -0500
Subject: [PATCH 5/5] f

---
 src/pixie/paths.nim | 8 ++++----
 1 file changed, 4 insertions(+), 4 deletions(-)

diff --git a/src/pixie/paths.nim b/src/pixie/paths.nim
index 72c0160..d1f2637 100644
--- a/src/pixie/paths.nim
+++ b/src/pixie/paths.nim
@@ -1158,7 +1158,7 @@ proc maxEntryCount(partitioning: var Partitioning): int =
 proc fixed32(f: float32): Fixed32 {.inline.} =
   Fixed32(f * 256)
 
-proc integer(p: Fixed32): int32 {.inline.} =
+proc integer(p: Fixed32): int {.inline.} =
   p div 256
 
 proc trunc(p: Fixed32): Fixed32 {.inline.} =
@@ -1228,7 +1228,7 @@ iterator walkInteger(
   numHits: int,
   windingRule: WindingRule,
   y, width: int
-): (int32, int32) =
+): (int, int) =
   for (prevAt, at, count) in hits.walk(numHits, windingRule, y, width):
     let
       fillStart = prevAt.integer
@@ -1504,7 +1504,7 @@ proc fillHits(
   windingRule: WindingRule,
   blendMode: BlendMode
 ) =
-  template simdBlob(image: Image, x: var int, len: int32, blendProc: untyped) =
+  template simdBlob(image: Image, x: var int, len: int, blendProc: untyped) =
     when allowSimd:
       when defined(amd64):
         let colorVec = mm_set1_epi32(cast[int32](rgbx))
@@ -1568,7 +1568,7 @@ proc fillHits(
   windingRule: WindingRule,
   blendMode: BlendMode
 ) =
-  template simdBlob(mask: Mask, x: var int, len: int32, blendProc: untyped) =
+  template simdBlob(mask: Mask, x: var int, len: int, blendProc: untyped) =
     when allowSimd:
       when defined(amd64):
         let vec255 = mm_set1_epi8(255)