Chia-Network · hoffmang9 · Feb 7, 2026 · Feb 7, 2026 · Feb 7, 2026 · Feb 7, 2026
diff --git a/.github/workflows/build-c-libraries.yml b/.github/workflows/build-c-libraries.yml
@@ -21,6 +21,7 @@ permissions:
 
 jobs:
   build-c-libraries:
+    if: ${{ false }}
     name: C Libraries - ${{ matrix.os.name }} ${{ matrix.arch.name }}
     runs-on: ${{ matrix.os.runs-on[matrix.arch.matrix] }}
     strategy:

diff --git a/.github/workflows/build-riscv64.yml b/.github/workflows/build-riscv64.yml
@@ -21,6 +21,7 @@ permissions:
 
 jobs:
   build_wheels:
+    if: ${{ false }}
     name: ${{ matrix.os.emoji }} 📦 Build ${{ matrix.python.major-dot-minor }}
     runs-on: ${{ matrix.os.runs-on }}
     strategy:
@@ -80,6 +81,7 @@ jobs:
           path: ./dist
           if-no-files-found: error
   upload:
+    if: ${{ false }}
     name: Upload to Chia PyPI
     runs-on: ubuntu-latest
     needs:

diff --git a/.github/workflows/build.yml b/.github/workflows/build.yml
@@ -21,6 +21,7 @@ permissions:
 
 jobs:
   build-wheels:
+    if: ${{ false }}
     name: Wheel - ${{ matrix.os.name }} ${{ matrix.python.major-dot-minor }} ${{ matrix.arch.name }}
     runs-on: ${{ matrix.os.runs-on[matrix.arch.matrix] }}
     strategy:
@@ -123,6 +124,7 @@ jobs:
         path: ./dist
 
   build-sdist:
+    if: ${{ false }}
     name: sdist - ${{ matrix.os.name }} ${{ matrix.python.major-dot-minor }} ${{ matrix.arch.name }}
     runs-on: ${{ matrix.os.runs-on[matrix.arch.matrix] }}
     strategy:
@@ -166,6 +168,7 @@ jobs:
         path: ./dist
 
   check:
+    if: ${{ false }}
     name: Check - ${{ matrix.os.name }} ${{ matrix.python.major-dot-minor }} ${{ matrix.arch.name }}
     runs-on: ${{ matrix.os.runs-on[matrix.arch.matrix] }}
     strategy:
@@ -208,6 +211,7 @@ jobs:
         mypy --config-file mypi.ini setup.py tests
 
   upload:
+    if: ${{ false }}
     name: Upload to PyPI - ${{ matrix.os.name }} ${{ matrix.python.major-dot-minor }} ${{ matrix.arch.name }}
     runs-on: ${{ matrix.os.runs-on[matrix.arch.matrix] }}
     needs:

diff --git a/.github/workflows/check-commit-signing.yml b/.github/workflows/check-commit-signing.yml
@@ -16,6 +16,7 @@ concurrency:
 
 jobs:
   check-commit-signing:
+    if: ${{ false }}
     name: Check commit signing
     runs-on: [ubuntu-latest]
     timeout-minutes: 5

diff --git a/.github/workflows/codeql-analysis.yml b/.github/workflows/codeql-analysis.yml
@@ -22,6 +22,7 @@ on:
 
 jobs:
   analyze:
+    if: ${{ false }}
     name: Analyze
     runs-on: ubuntu-latest
     permissions:

diff --git a/.github/workflows/dependency-review.yml b/.github/workflows/dependency-review.yml
@@ -13,7 +13,7 @@ permissions:
 
 jobs:
   dependency-review:
-    if: github.repository_owner == 'Chia-Network'
+    if: ${{ false }}
     runs-on: ubuntu-latest
     steps:
       - name: "Checkout Repository"

diff --git a/.github/workflows/hw-build.yml b/.github/workflows/hw-build.yml
@@ -22,6 +22,7 @@ permissions:
 
 jobs:
   build-hw:
+    if: ${{ false }}
     name: Build HW VDF Client
     runs-on: [ubuntu-22.04]
     steps:

diff --git a/.github/workflows/rust.yml b/.github/workflows/rust.yml
@@ -20,6 +20,7 @@ permissions:
 
 jobs:
   fuzz_targets:
+    if: ${{ false }}
     name: Run fuzzers (${{ matrix.target }})
     runs-on: ubuntu-latest
     env:
@@ -59,6 +60,7 @@ jobs:
           cargo +nightly fuzz run ${{ matrix.target }} -- -max_total_time=600
 
   lint:
+    if: ${{ false }}
     name: Lint
     runs-on: ubuntu-latest
     steps:
@@ -76,6 +78,7 @@ jobs:
         run: cargo clippy
 
   test:
+    if: ${{ false }}
     name: Test (${{ matrix.os.name }} ${{ matrix.arch.name }})
     runs-on: ${{ matrix.os.runs-on[matrix.arch.matrix] }}
 
@@ -161,6 +164,7 @@ jobs:
         run: cargo test && cargo test --release
 
   build_crate:
+    if: ${{ false }}
     name: Build crate
     needs: [lint, test]
     runs-on: ubuntu-latest

diff --git a/.github/workflows/stale-issue.yml b/.github/workflows/stale-issue.yml
@@ -6,6 +6,7 @@ on:
 
 jobs:
   stale:
+    if: ${{ false }}
     runs-on: ubuntu-latest
     steps:
       - uses: chia-network/stale@main

diff --git a/.github/workflows/test.yaml b/.github/workflows/test.yaml
@@ -19,13 +19,15 @@ jobs:
     strategy:
       fail-fast: false
       matrix:
-        os: [macos-13-intel, macos-13-arm64, ubuntu-latest, windows-latest]
-        config: [optimized=1, TSAN=1, ASAN=1]
-        exclude:
+        include:
+          - os: macos-13-intel
+            config: optimized=1
+          - os: macos-13-arm64
+            config: optimized=1
+          - os: ubuntu-latest
+            config: optimized=1
           - os: windows-latest
-            config: ASAN=1
-          - os: windows-latest
-            config: TSAN=1
+            config: optimized=1
 
     steps:
     - name: Checkout code
@@ -193,14 +195,11 @@ jobs:
         cd src
         echo "Running 1weso_test"
         ./1weso_test
-        echo "Running 2weso_test"
-        ./2weso_test
+        # PERF_INVESTIGATION_TEMP: keep non-target tests at smoke level for faster perf investigation turnaround.
+        echo "Running 2weso_test with 10 iterations (smoke)"
+        ./2weso_test 10
         echo "Running prover_test"
-        if [[ "${{ matrix.os }}" == ubuntu* ]]; then
-          ./prover_test
-        else
-          CHIAVDF_PROVER_TEST_FAST=1 ./prover_test
-        fi
+        CHIAVDF_PROVER_TEST_FAST=1 ./prover_test
 
     - name: Run vdf tests (short)
       if: matrix.config != 'optimized=1' && !startsWith(matrix.os, 'windows')
@@ -246,8 +245,9 @@ jobs:
         }
         Write-Host "Running 1weso_test"
         Invoke-TestExe "1weso_test"
-        Write-Host "Running 2weso_test"
-        Invoke-TestExe "2weso_test"
+        # PERF_INVESTIGATION_TEMP: keep non-target tests at smoke level for faster perf investigation turnaround.
+        Write-Host "Running 2weso_test with 10 iterations (smoke)"
+        Invoke-TestExe "2weso_test" @("10")
         Write-Host "Running prover_test"
         $env:CHIAVDF_PROVER_TEST_FAST = "1"
         Invoke-TestExe "prover_test"
@@ -256,20 +256,82 @@ jobs:
       if: matrix.config == 'optimized=1' && !startsWith(matrix.os, 'windows')
       run: |
         cd src
-        echo "Benchmarking vdf_bench with 2,000,000 iterations of square_asm"
-        ./vdf_bench square_asm 2000000
+        # PERF_INVESTIGATION_TEMP: lower non-target benchmark load to speed overall CI turnaround.
+        echo "Benchmarking vdf_bench with 250,000 iterations of square_asm"
+        CHIAVDF_PERF_TRACE=1 ./vdf_bench square_asm 250000
 
-    - name: Benchmark vdf_bench square (Windows)
+    - name: Benchmark vdf_bench square (Windows, perf investigation)
       if: matrix.config == 'optimized=1' && startsWith(matrix.os, 'windows')
       shell: pwsh
       run: |
+        # PERF_INVESTIGATION_TEMP: repeated benchmark harness for Windows regression isolation (one warmup, then $repetitions measured runs; per-run ips and summary stats go to the log, a metrics file, and the step summary).
         cd build
         $dllPaths = @()
         if ($env:MPIR_ROOT -and (Test-Path "$env:MPIR_ROOT\bin")) { $dllPaths += "$env:MPIR_ROOT\bin" }
         if (Test-Path "$env:GITHUB_WORKSPACE\mpir_gc_x64") { $dllPaths += "$env:GITHUB_WORKSPACE\mpir_gc_x64" }
         if ($dllPaths.Count -gt 0) { $env:PATH = ($dllPaths -join ';') + ';' + $env:PATH }
-        Write-Host "Benchmarking vdf_bench with 2,000,000 iterations of square_asm"
-        & .\vdf_bench.exe square_asm 2000000
-        Write-Host "vdf_bench exit code: $LASTEXITCODE"
-        if ($LASTEXITCODE -ne 0) { exit $LASTEXITCODE }
+        $env:CHIAVDF_PERF_TRACE = "1"
+
+        Write-Host "PERF_INVESTIGATION_TEMP warmup: square_asm 10000"
+        & .\vdf_bench.exe square_asm 10000
+        if ($LASTEXITCODE -ne 0) {
+          Write-Host "warmup exit code: $LASTEXITCODE"
+          exit $LASTEXITCODE
+        }
+
+        $repetitions = 5
+        $iterations = 1000000
+        $ipsValues = @()
+        $metricLines = @()
+        $metricsPath = Join-Path $env:RUNNER_TEMP "PERF_INVESTIGATION_TEMP_windows_metrics.txt"
+        "PERF_INVESTIGATION_TEMP begin" | Out-File -FilePath $metricsPath -Encoding utf8
+        for ($i = 1; $i -le $repetitions; $i++) {
+          Write-Host "PERF_INVESTIGATION_TEMP run $i/${repetitions}: square_asm $iterations"
+          $runOutput = & .\vdf_bench.exe square_asm $iterations 2>&1
+          $exitCode = $LASTEXITCODE
+          $runOutput | ForEach-Object { Write-Host $_ }
+          if ($exitCode -ne 0) {
+            Write-Host "vdf_bench run $i exit code: $exitCode"
+            exit $exitCode
+          }
+          $metricLine = $runOutput | Select-String -Pattern 'PERF_INVESTIGATION_TEMP mode=square_asm .*ips=([0-9]+(?:\.[0-9]+)?)' | Select-Object -Last 1  # last matching line wins; capture group 1 is the ips number
+          if (-not $metricLine) {
+            throw "Missing PERF_INVESTIGATION_TEMP metric line in run $i output"
+          }
+          $metricText = $metricLine.ToString()
+          $metricLines += $metricText
+          $metricText | Out-File -FilePath $metricsPath -Encoding utf8 -Append
+          $ips = [double]$metricLine.Matches[0].Groups[1].Value
+          $ipsValues += $ips
+        }
+
+        $avg = ($ipsValues | Measure-Object -Average).Average
+        $min = ($ipsValues | Measure-Object -Minimum).Minimum
+        $max = ($ipsValues | Measure-Object -Maximum).Maximum
+        $variance = 0.0
+        foreach ($v in $ipsValues) {
+          $delta = $v - $avg
+          $variance += $delta * $delta
+        }
+        $stddev = [Math]::Sqrt($variance / $ipsValues.Count)  # population standard deviation (divides by N, not N-1)
+        $joinedIps = ($ipsValues | ForEach-Object { "{0:F3}" -f $_ }) -join ", "  # F3, not N3: no thousands separators, so the comma-joined list stays unambiguous
+
+        Write-Host ("PERF_INVESTIGATION_TEMP summary runs={0} iterations={1} ips_values=[{2}] avg={3:N3} stddev={4:N3} min={5:N3} max={6:N3}" -f $repetitions, $iterations, $joinedIps, $avg, $stddev, $min, $max)
+        ("PERF_INVESTIGATION_TEMP summary runs={0} iterations={1} ips_values=[{2}] avg={3:N3} stddev={4:N3} min={5:N3} max={6:N3}" -f $repetitions, $iterations, $joinedIps, $avg, $stddev, $min, $max) | Out-File -FilePath $metricsPath -Encoding utf8 -Append
+        "## PERF_INVESTIGATION_TEMP Windows square_asm`n" | Out-File -FilePath $env:GITHUB_STEP_SUMMARY -Encoding utf8 -Append
+        ("- runs: {0}" -f $repetitions) | Out-File -FilePath $env:GITHUB_STEP_SUMMARY -Encoding utf8 -Append
+        ("- iterations_per_run: {0}" -f $iterations) | Out-File -FilePath $env:GITHUB_STEP_SUMMARY -Encoding utf8 -Append
+        ("- ips_values: {0}" -f $joinedIps) | Out-File -FilePath $env:GITHUB_STEP_SUMMARY -Encoding utf8 -Append
+        ("- avg_ips: {0:N3}" -f $avg) | Out-File -FilePath $env:GITHUB_STEP_SUMMARY -Encoding utf8 -Append
+        ("- stddev_ips: {0:N3}" -f $stddev) | Out-File -FilePath $env:GITHUB_STEP_SUMMARY -Encoding utf8 -Append
+        ("- min_ips: {0:N3}" -f $min) | Out-File -FilePath $env:GITHUB_STEP_SUMMARY -Encoding utf8 -Append
+        ("- max_ips: {0:N3}" -f $max) | Out-File -FilePath $env:GITHUB_STEP_SUMMARY -Encoding utf8 -Append
+
+    - name: Upload Windows perf investigation metrics
+      if: matrix.config == 'optimized=1' && startsWith(matrix.os, 'windows')  # same condition as the Windows benchmark step
+      uses: actions/upload-artifact@v4
+      with:
+        name: PERF_INVESTIGATION_TEMP-windows-square-asm-metrics
+        path: ${{ runner.temp }}/PERF_INVESTIGATION_TEMP_windows_metrics.txt  # file written by the Windows benchmark step under RUNNER_TEMP
+        if-no-files-found: error  # fail this step if the metrics file is missing
 
diff --git a/README.md b/README.md
@@ -72,7 +72,6 @@ AVX runtime flags:
 
 - `CHIAVDF_LOG_AVX=1`: emit AVX detection logs at startup
 - `CHIA_DISABLE_AVX2=1`: disable AVX2 path even when supported
-- `CHIA_FORCE_AVX2=1`: force AVX2 path
 - `CHIA_DISABLE_AVX512_IFMA=1`: disable AVX-512 IFMA path
 - `CHIA_ENABLE_AVX512_IFMA=1`: enable AVX-512 IFMA path when CPUID support is present
 - `CHIA_FORCE_AVX512_IFMA=1`: force AVX-512 IFMA path

diff --git a/src/callback.h b/src/callback.h
@@ -6,7 +6,6 @@
 #include <algorithm>
 #include <atomic>
 #include <limits>
-#include <mutex>
 #include <stdexcept>
 
 // Applies to n-weso.
@@ -134,32 +133,44 @@ class TwoWesolowskiCallback: public WesolowskiCallback {
         forms_capacity = space_needed;
         forms.reset(new form[space_needed]);
         forms[0] = f;
-        kl = 10;
-        switch_iters = -1;
+        switch_iters.store(0, std::memory_order_relaxed);
+        switch_index.store(0, std::memory_order_relaxed);
+        large_constants.store(false, std::memory_order_relaxed);
+        // forms[0] is valid immediately at construction.
+        max_published_power.store(0, std::memory_order_relaxed);
     }
 
     void IncreaseConstants(uint64_t num_iters) {
-        std::lock_guard<std::mutex> lk(forms_mutex);
-        kl = 100;
-        switch_iters = num_iters;
-        switch_index = num_iters / 10;
+        // One-way switch (false -> true): store switch_iters and switch_index first and large_constants last, so an acquire-load that sees true also sees both values.
+        switch_iters.store(num_iters, std::memory_order_release);
+        switch_index.store(num_iters / 10, std::memory_order_release);
+        large_constants.store(true, std::memory_order_release);
     }
 
     int GetPosition(uint64_t power) {
-        std::lock_guard<std::mutex> lk(forms_mutex);
         return GetPositionUnlocked(power);
     }
 
+    bool IsPublished(uint64_t power) const {  // true once max_published_power (set by OnIteration) has reached `power`
+        return max_published_power.load(std::memory_order_acquire) >= power;
+    }
+
     int GetPositionUnlocked(uint64_t power) const {
-        if (switch_iters == -1 || power < switch_iters) {
+        if (!large_constants.load(std::memory_order_acquire)) {  // switch not published yet: one slot per 10 iterations
             return power / 10;
-        } else {
-            return (switch_index + (power - switch_iters) / 100);
         }
+        const uint64_t switch_iters_local = switch_iters.load(std::memory_order_acquire);
+        if (power < switch_iters_local) {  // powers before the switch point keep the 10-iteration spacing
+            return power / 10;
+        }
+        const uint64_t switch_index_local = switch_index.load(std::memory_order_acquire);
+        return (switch_index_local + (power - switch_iters_local) / 100);  // from the switch point on: one slot per 100 iterations, offset by switch_index
     }
 
     form GetFormCopy(uint64_t power) {
-        std::lock_guard<std::mutex> lk(forms_mutex);
+        if (!IsPublished(power)) {
+            throw std::runtime_error("TwoWesolowskiCallback::GetFormCopy not yet published");
+        }
         const int pos = GetPositionUnlocked(power);
         if (pos < 0 || static_cast<size_t>(pos) >= forms_capacity) {
             throw std::runtime_error("TwoWesolowskiCallback::GetFormCopy out of bounds");
@@ -168,28 +179,29 @@ class TwoWesolowskiCallback: public WesolowskiCallback {
     }
 
     bool LargeConstants() {
-        std::lock_guard<std::mutex> lk(forms_mutex);
-        return kl == 100;
+        return large_constants.load(std::memory_order_acquire);
     }
 
     void OnIteration(int type, void *data, uint64_t iteration) {
         iteration++;
-        std::lock_guard<std::mutex> lk(forms_mutex);
+        const uint32_t kl = large_constants.load(std::memory_order_acquire) ? 100 : 10;  // checkpoint spacing: 100 once large constants are enabled, otherwise 10
         if (iteration % kl == 0) {
             const int pos = GetPositionUnlocked(iteration);
             if (pos < 0 || static_cast<size_t>(pos) >= forms_capacity) {
                 throw std::runtime_error("TwoWesolowskiCallback::OnIteration out of bounds");
             }
             form* mulf = &forms[static_cast<size_t>(pos)];
             SetForm(type, data, mulf);
+            // Release-store after SetForm so a reader whose acquire-load in IsPublished sees this value also sees the written form.
+            max_published_power.store(iteration, std::memory_order_release);
         }
     }
 
   private:
-    uint64_t switch_index;
-    int64_t switch_iters;
-    uint32_t kl;
-    std::mutex forms_mutex;
+    std::atomic<uint64_t> switch_index;
+    std::atomic<uint64_t> switch_iters;
+    std::atomic<bool> large_constants;
+    std::atomic<uint64_t> max_published_power;
 };
 
 class FastAlgorithmCallback : public WesolowskiCallback {
-Original file line number
+Diff line change
@@ Expand Up / @@ -6,6 +6,7 @@ on: @@
     jobs:
       stale:
+        if: ${{ false }}
         runs-on: ubuntu-latest
         steps:
           - uses: chia-network/stale@main
@@ Expand Down @@