From dee33ff46f95e2d3d81279f5a17f2c5343fb21e2 Mon Sep 17 00:00:00 2001
From: arvidn <arvid@libtorrent.org>
Date: Mon, 22 Dec 2025 13:13:43 +0100
Subject: [PATCH 1/2] improve some of the tools. Make the python scripts to
 generate test cases not depend on CWD. Add comments to benchmark-clvm-costs

---
 tools/generate-keccak-tests.py       |  4 ++-
 tools/generate-secp256k1-tests.py    |  4 ++-
 tools/generate-secp256r1-tests.py    |  5 ++--
 tools/generate-sha256-tests.py       |  4 ++-
 tools/src/bin/benchmark-clvm-cost.rs | 38 +++++++++++++++++++++++-----
 5 files changed, 44 insertions(+), 11 deletions(-)

diff --git a/tools/generate-keccak-tests.py b/tools/generate-keccak-tests.py
index 1c14fa57d..5e8cb56e1 100644
--- a/tools/generate-keccak-tests.py
+++ b/tools/generate-keccak-tests.py
@@ -1,3 +1,4 @@
+from pathlib import Path
 from eth_hash.auto import keccak
 from random import randbytes, randint, seed, sample
 from more_itertools import sliced
@@ -9,7 +10,8 @@
 
 SIZE = 100
 
-with open("../op-tests/test-keccak256-generated.txt", "w+") as f:
+p = Path(__file__).parent.parent / "op-tests/test-keccak256-generated.txt"
+with open(p, "w+") as f:
     f.write("; This file was generated by tools/generate-keccak-tests.py\n\n")
 
     for i in range(SIZE):
diff --git a/tools/generate-secp256k1-tests.py b/tools/generate-secp256k1-tests.py
index d9b83ef40..a0df23e22 100644
--- a/tools/generate-secp256k1-tests.py
+++ b/tools/generate-secp256k1-tests.py
@@ -1,3 +1,4 @@
+from pathlib import Path
 from secp256k1 import PublicKey, PrivateKey
 from hashlib import sha256
 from random import randbytes, randint, seed, sample
@@ -39,7 +40,8 @@ def print_validation_test_case(f, num_cases, filter_pk, filter_msg, filter_sig,
     secret_keys.append(PrivateKey())
 
 
-with open("../op-tests/test-secp256k1.txt", "w+") as f:
+p = Path(__file__).parent.parent / "op-tests/test-secp256k1.txt"
+with open(p, "w+") as f:
     f.write("; This file was generated by tools/generate-secp256k1-tests.py\n\n")
 
     print_validation_test_case(f, SIZE, lambda pk: pk, lambda msg: msg, lambda sig: sig, "0")
diff --git a/tools/generate-secp256r1-tests.py b/tools/generate-secp256r1-tests.py
index 70c497e7d..76d644a37 100644
--- a/tools/generate-secp256r1-tests.py
+++ b/tools/generate-secp256r1-tests.py
@@ -1,3 +1,4 @@
+from pathlib import Path
 from ecdsa import SigningKey, NIST256p
 from hashlib import sha256
 from random import randbytes, randint, seed, sample
@@ -38,8 +39,8 @@ def print_validation_test_case(f, num_cases, filter_pk, filter_msg, filter_sig,
 for i in range(SIZE):
     secret_keys.append(SigningKey.generate(curve=NIST256p, hashfunc=sha256))
 
-
-with open("../op-tests/test-secp256r1.txt", "w+") as f:
+p = Path(__file__).parent.parent / "op-tests/test-secp256r1.txt"
+with open(p, "w+") as f:
     f.write("; This file was generated by tools/generate-secp256r1-tests.py\n\n")
 
     print_validation_test_case(f, SIZE, lambda pk: pk, lambda msg: msg, lambda sig: sig, "0")
diff --git a/tools/generate-sha256-tests.py b/tools/generate-sha256-tests.py
index 017a623a9..06445d830 100644
--- a/tools/generate-sha256-tests.py
+++ b/tools/generate-sha256-tests.py
@@ -1,3 +1,4 @@
+from pathlib import Path
 from random import randbytes, randint, seed, choice
 from hashlib import sha256
 
@@ -6,7 +7,8 @@
 
 test_cases = set()
 
-with open("../op-tests/test-sha256.txt", "w+") as f:
+p = Path(__file__).parent.parent / "op-tests/test-sha256.txt"
+with open(p, "w+") as f:
     f.write("; This file was generated by tools/generate-sha256-tests.py\n\n")
 
     for i in range(0, SIZE):
diff --git a/tools/src/bin/benchmark-clvm-cost.rs b/tools/src/bin/benchmark-clvm-cost.rs
index 435423649..8e03a0bfe 100644
--- a/tools/src/bin/benchmark-clvm-cost.rs
+++ b/tools/src/bin/benchmark-clvm-cost.rs
@@ -7,6 +7,9 @@ use std::fs::{create_dir_all, File};
 use std::io::{sink, Write};
 use std::time::Instant;
 
+// When specifying the signature of operators, some arguments may be fixed
+// constants. The None argument slots will be replaced by the benchmark for the
+// various invocations of the operator.
 #[derive(Clone, Copy)]
 enum Placeholder {
     SingleArg(Option<NodePtr>),
@@ -14,6 +17,7 @@ enum Placeholder {
     ThreeArgs(Option<NodePtr>, Option<NodePtr>, Option<NodePtr>),
 }
 
+// This enum is used as the concrete arguments to a call, after substitution
 #[derive(Clone, Copy)]
 enum OpArgs {
     SingleArg(NodePtr),
@@ -120,7 +124,7 @@ fn time_invocation(a: &mut Allocator, op: u32, arg: OpArgs, flags: u32) -> f64 {
     //println!("{:x?}", &Node::new(a, call));
     let dialect = ChiaDialect::new(0);
     let start = Instant::now();
-    let r = run_program(a, &dialect, call, a.nil(), 11000000000);
+    let r = run_program(a, &dialect, call, a.nil(), 11_000_000_000);
     if (flags & ALLOW_FAILURE) == 0 {
         r.unwrap();
     }
@@ -132,7 +136,8 @@ fn time_invocation(a: &mut Allocator, op: u32, arg: OpArgs, flags: u32) -> f64 {
 }
 
 // returns the time per byte
-// measures run-time of many calls
+// measures run-time of many calls with the variable argument substituted for
+// buffers of variying sizes
 fn time_per_byte(a: &mut Allocator, op: &Operator, output: &mut dyn Write) -> f64 {
     let checkpoint = a.checkpoint();
     let mut samples = Vec::<(f64, f64)>::new();
@@ -185,7 +190,7 @@ fn time_per_arg(a: &mut Allocator, op: &Operator, output: &mut dyn Write) -> f64
         for i in (0..1000).step_by(5) {
             let call = build_call(a, op.opcode, arg, i, op.extra);
             let start = Instant::now();
-            let r = run_program(a, &dialect, call, a.nil(), 11000000000);
+            let r = run_program(a, &dialect, call, a.nil(), 11_000_000_000);
             if (op.flags & ALLOW_FAILURE) == 0 {
                 r.unwrap();
             }
@@ -203,8 +208,9 @@ fn time_per_arg(a: &mut Allocator, op: &Operator, output: &mut dyn Write) -> f64
 }
 
 // measure run-time of many *nested* calls, to establish how much longer it
-// takes, approximately, for each additional nesting. The per_arg_time is
-// subtracted to get the base cost
+// takes for each additional nested call. The per_arg_time is subtracted to get
+// the base cost. This only works for operators that can take their return
+// value as an argument
 fn base_call_time(
     a: &mut Allocator,
     op: &Operator,
@@ -229,7 +235,7 @@ fn base_call_time(
             a.restore_checkpoint(&checkpoint);
             let call = build_nested_call(a, op.opcode, arg, i, op.extra);
             let start = Instant::now();
-            let r = run_program(a, &dialect, call, a.nil(), 11000000000);
+            let r = run_program(a, &dialect, call, a.nil(), 11_000_000_000);
             if (op.flags & ALLOW_FAILURE) == 0 {
                 r.unwrap();
             }
@@ -268,11 +274,31 @@ fn base_call_time_no_nest(a: &mut Allocator, op: &Operator, per_arg_time: f64) -
     (total_time - per_arg_time * num_samples as f64) / num_samples as f64
 }
 
+// measures run-time of many calls with the variable argument substituted for
+// buffers of variying sizes
 const PER_BYTE_COST: u32 = 1;
+
+// measures the run-time of many calls with varying number of arguments, to
+// establish how much time each additional argument contributes
 const PER_ARG_COST: u32 = 2;
+
+// measure run-time of many *nested* calls, to establish how much longer it
+// takes for each additional nested call. The per_arg_time is subtracted to get
+// the base cost. This only works for operators that can take their return
+// value as an argument
 const NESTING_BASE_COST: u32 = 4;
+
+// If the time doesn't grow linearly, but exponentially, this flag must be used
+// to square the samples before we run linear regression. It's an approximation.
 const EXPONENTIAL_COST: u32 = 8;
+
+// This modifies the PER_ARG_COST to use large buffers. This is useful when the
+// cost per byte is very low, and we need large buffers to measure it
 const LARGE_BUFFERS: u32 = 16;
+
+// Allow the operator to fail. This is useful for signature validation
+// functions. They must take just as long to execute as a successful run for this
+// to work as expected.
 const ALLOW_FAILURE: u32 = 32;
 
 struct Operator {

From df522380aa9c1e2a4b7c0454285f8b7433a67057 Mon Sep 17 00:00:00 2001
From: arvidn <arvid@libtorrent.org>
Date: Mon, 22 Dec 2025 13:39:08 +0100
Subject: [PATCH 2/2] specify cost factor on the command line, rather than hard
 coding it

---
 tools/src/bin/benchmark-clvm-cost.rs | 53 +++++++++++++++++++++-------
 1 file changed, 41 insertions(+), 12 deletions(-)

diff --git a/tools/src/bin/benchmark-clvm-cost.rs b/tools/src/bin/benchmark-clvm-cost.rs
index 8e03a0bfe..fe42f82fb 100644
--- a/tools/src/bin/benchmark-clvm-cost.rs
+++ b/tools/src/bin/benchmark-clvm-cost.rs
@@ -313,6 +313,18 @@ struct Operator {
 #[derive(Parser, Debug)]
 #[command(author, version, about, long_about = None)]
 struct Args {
+    /// Only benchmark a single operator, by specifying its name
+    #[arg(long)]
+    only_operator: Option<String>,
+
+    /// Multiply timings (in nanoseconds) by this factor to get cost
+    #[arg(long)]
+    cost_factor: Option<f64>,
+
+    /// List available operators, by name, and exit
+    #[arg(long)]
+    list_operators: bool,
+
     /// enable plotting of measurements
     #[arg(short, long, default_value_t = false)]
     plot: bool,
@@ -540,26 +552,37 @@ pub fn main() {
         },
     ];
 
-    // this "magic" scaling depends on the computer you run the tests on.
-    // It's calibrated against the timing of point_add, which has a cost
-    let cost_scale = ((101094.0 / 39000.0) + (1343980.0 / 131000.0)) / 2.0;
-    let base_cost_scale = 101094.0 / 42500.0;
-    let arg_cost_scale = 1343980.0 / 129000.0;
-    println!("cost scale: {cost_scale}");
-    println!("base cost scale: {base_cost_scale}");
-    println!("arg cost scale: {arg_cost_scale}");
+    if options.list_operators {
+        for op in &ops {
+            println!("{}", op.name);
+        }
+        return;
+    }
+
+    if let Some(cost_scale) = options.cost_factor {
+        println!("cost scale: {cost_scale}");
+    }
 
     let mut gnuplot = maybe_open(options.plot, "gen", "graphs.gnuplot");
     writeln!(gnuplot, "set term png size 1200,600").expect("failed to write");
     writeln!(gnuplot, "set key top right").expect("failed to write");
 
     for op in &ops {
+        // If an operator name was specified, skip all other operators
+        if let Some(ref name) = options.only_operator {
+            if op.name != name {
+                continue;
+            }
+        }
+
         println!("opcode: {} ({})", op.name, op.opcode);
         let time_per_byte = if (op.flags & PER_BYTE_COST) != 0 {
             let mut output = maybe_open(options.plot, op.name, "per-byte.log");
             let time_per_byte = time_per_byte(&mut a, op, &mut *output);
             println!("   time: per-byte: {time_per_byte:.2}ns");
-            println!("   cost: per-byte: {:.0}", time_per_byte * cost_scale);
+            if let Some(cost_scale) = options.cost_factor {
+                println!("   cost: per-byte: {:.0}", time_per_byte * cost_scale);
+            }
             time_per_byte
         } else {
             0.0
@@ -568,7 +591,9 @@ pub fn main() {
             let mut output = maybe_open(options.plot, op.name, "per-arg.log");
             let time_per_arg = time_per_arg(&mut a, op, &mut *output);
             println!("   time: per-arg: {time_per_arg:.2}ns");
-            println!("   cost: per-arg: {:.0}", time_per_arg * arg_cost_scale);
+            if let Some(cost_scale) = options.cost_factor {
+                println!("   cost: per-arg: {:.0}", time_per_arg * cost_scale);
+            }
             time_per_arg
         } else {
             0.0
@@ -578,14 +603,18 @@ pub fn main() {
             write_gnuplot_header(&mut *gnuplot, op, "base", "num nested calls");
             let base_call_time = base_call_time(&mut a, op, time_per_arg, &mut *output);
             println!("   time: base: {base_call_time:.2}ns");
-            println!("   cost: base: {:.0}", base_call_time * base_cost_scale);
+            if let Some(cost_scale) = options.cost_factor {
+                println!("   cost: base: {:.0}", base_call_time * cost_scale);
+            }
 
             print_plot(&mut *gnuplot, &base_call_time, &0.0, op.name, "base");
             base_call_time
         } else {
             let base_call_time = base_call_time_no_nest(&mut a, op, time_per_arg);
             println!("   time: base: {base_call_time:.2}ns");
-            println!("   cost: base: {:.0}", base_call_time * base_cost_scale);
+            if let Some(cost_scale) = options.cost_factor {
+                println!("   cost: base: {:.0}", base_call_time * cost_scale);
+            }
             base_call_time
         };