From 49c4dff8c9caa8e549165324953d90f6b6444ec4 Mon Sep 17 00:00:00 2001
From: ChrisRackauckas-Claude <accounts@chrisrackauckas.com>
Date: Thu, 21 May 2026 10:41:08 -0400
Subject: [PATCH 01/24] Add cross-library 1D interpolation benchmark
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Compares the cached `Auto(t_props)` PR (DataInterpolations) against
Interpolations.jl, Dierckx.jl, BasicInterpolators.jl, and PCHIPInterpolation.jl
across construction, single-query, sorted batch, random batch, and chained
ODE-style workloads at n ∈ {100, 1k, 10k, 100k}, m ∈ {1, 10, 1k, 100k}.

Key results (full numbers in `bench/cross_library_comparison.md`):
- DI's sorted-batch + cached Auto wins ~1700-1900× vs Dierckx on Linear/Cubic
  at n=100k m=100k; loses to Interpolations(uniform) by ~16% on cubic because
  the latter uses O(1) uniform-grid lookup.
- Chained ODE-style at n=100k m=1000: DI beats Dierckx by ~450× and
  PCHIP by ~2× on monotone cubic; this is the workload iguesser was built for.
- DI CubicHermite beats PCHIPInterpolation on every batched cell (~2-5×).
- DI QuadraticSpline is the only consistent loser: O(n²) constructor
  (7s at n=100k vs Dierckx 14ms) and evaluators ~2-5× slower than Dierckx.
  Root cause is the linear-scan findfirst in `spline_coefficients!`.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
Co-Authored-By: Chris Rackauckas <accounts@chrisrackauckas.com>
---
 bench/.gitignore                  |   1 +
 bench/Project.toml                |   7 +
 bench/cross_library_comparison.jl | 664 ++++++++++++++++++++++++++++++
 bench/cross_library_comparison.md | 279 +++++++++++++
 4 files changed, 951 insertions(+)
 create mode 100644 bench/.gitignore
 create mode 100644 bench/Project.toml
 create mode 100644 bench/cross_library_comparison.jl
 create mode 100644 bench/cross_library_comparison.md

diff --git a/bench/.gitignore b/bench/.gitignore
new file mode 100644
index 00000000..ba39cc53
--- /dev/null
+++ b/bench/.gitignore
@@ -0,0 +1 @@
+Manifest.toml
diff --git a/bench/Project.toml b/bench/Project.toml
new file mode 100644
index 00000000..ba5ab73c
--- /dev/null
+++ b/bench/Project.toml
@@ -0,0 +1,7 @@
+[deps]
+BasicInterpolators = "26cce99e-4866-4b6d-ab74-862489e035e0"
+BenchmarkTools = "6e4b80f9-dd63-53aa-95a3-0cdb28fa8baf"
+DataInterpolations = "82cc6244-b520-54b8-b5a6-8a565e85f1d0"
+Dierckx = "39dd38d3-220a-591b-8e3c-4c3a8c710a94"
+Interpolations = "a98d9a8b-a2ab-59e6-89dd-64a1c18fca59"
+PCHIPInterpolation = "afe20452-48d1-4729-9a8b-50fb251f06cd"
diff --git a/bench/cross_library_comparison.jl b/bench/cross_library_comparison.jl
new file mode 100644
index 00000000..20eb149e
--- /dev/null
+++ b/bench/cross_library_comparison.jl
@@ -0,0 +1,664 @@
+#=
+Cross-library 1D interpolation benchmark for DataInterpolations.jl.
+
+Compares DataInterpolations.jl (PR #529 branch, with cached Auto(t_props)) against
+Interpolations.jl, Dierckx.jl, BasicInterpolators.jl, and PCHIPInterpolation.jl.
+
+Usage:
+    julia +1.11 --project=bench bench/cross_library_comparison.jl
+
+The script writes a fresh `bench/cross_library_comparison.md` with the report.
+=#
+
+import Pkg
+const BENCH_DIR = @__DIR__
+const REPO_ROOT = dirname(BENCH_DIR)
+Pkg.activate(BENCH_DIR)
+
+using Printf
+using Random
+using Statistics
+using BenchmarkTools
+using LinearAlgebra
+using InteractiveUtils: versioninfo
+
+using DataInterpolations
+using Interpolations
+using Dierckx
+using BasicInterpolators
+using PCHIPInterpolation
+
+const DI = DataInterpolations
+const ITP = Interpolations
+const DRX = Dierckx
+const BI = BasicInterpolators
+const PCHIP = PCHIPInterpolation
+
+const RNG = MersenneTwister(0x00C0FFEE)
+
+# -----------------------------------------------------------------------------
+# Helpers
+# -----------------------------------------------------------------------------
+
+"""
+Build the test data `(u, t)` of length `n`. `pattern` is `:uniform` or `:nonuniform`.
+The samples are deterministic for a given (n, pattern).
+"""
+function make_knots(n::Int, pattern::Symbol)
+    rng = MersenneTwister(0x0BADBEEF + n + (pattern === :uniform ? 0 : 1))
+    if pattern === :uniform
+        # Keep as a `range` so Interpolations.cubic_spline_interpolation accepts it.
+        # Concrete Vector form for libraries that need it is taken via `collect(t)` later.
+        t = range(0.0, 1.0; length = n)
+    elseif pattern === :nonuniform
+        t = sort(rand(rng, n))
+        t .= (t .- first(t)) ./ (last(t) - first(t))
+    else
+        error("unknown pattern $(pattern)")
+    end
+    u = @. sin(2π * t) + 0.3 * cos(7 * t)
+    return u, t
+end
+
+"""
+Build a query batch of length `m` in the same domain. `pattern` is `:sorted`,
+`:random`, or `:chained` (monotone, ODE-style).
+"""
+function make_queries(m::Int, pattern::Symbol)
+    rng = MersenneTwister(0x00C0FFEE + m + (pattern === :sorted ? 0 : pattern === :random ? 1 : 2))
+    if pattern === :sorted
+        tt = sort(rand(rng, m))
+    elseif pattern === :random
+        tt = rand(rng, m)
+    elseif pattern === :chained
+        steps = rand(rng, m)
+        tt = cumsum(steps)
+        tt .= (tt .- first(tt)) ./ (last(tt) - first(tt)) .* 0.999 .+ 0.0005
+    else
+        error("unknown query pattern $(pattern)")
+    end
+    return tt
+end
+
+# Pretty-print BenchmarkTools.Trial median and IQR (q3-q1) in human units
+function fmt_trial(t::BenchmarkTools.Trial)
+    med = median(t).time # ns
+    q1 = quantile(t.times, 0.25)
+    q3 = quantile(t.times, 0.75)
+    iqr = q3 - q1
+    return string(BenchmarkTools.prettytime(med), " (IQR ", BenchmarkTools.prettytime(iqr), ")")
+end
+
+fmt_trial(::Nothing) = "—"
+
+# Result store: Dict{(algorithm, case, library) => Dict{params => Trial}}
+# We'll just use nested dictionaries to keep it simple
+const RESULTS = Dict{String, Any}()
+
+function record!(category::String, algo::String, lib::String, params::String, trial)
+    key = string(category, " | ", algo)
+    d = get!(RESULTS, key, Dict{Tuple{String, String}, Any}())
+    d[(lib, params)] = trial
+    return nothing
+end
+
+# Limit each individual benchmark; full sweep is large.
+const BMK_SECONDS = 0.5
+const BMK_SAMPLES = 100
+
+function bench(expr_setup::Function, args...; seconds = BMK_SECONDS, samples = BMK_SAMPLES)
+    b = @benchmarkable $(expr_setup)($(args)...) evals = 1 samples = samples seconds = seconds
+    return run(b)
+end
+
+# -----------------------------------------------------------------------------
+# Library adapter functions
+#
+# Each adapter returns the interpolator for the given (u, t).
+# We separate construction from evaluation so we can benchmark each.
+# -----------------------------------------------------------------------------
+
+# --- Linear --------------------------------------------------------------
+# Helpers: many third-party libraries want `Vector{Float64}` knots, not a `range`.
+_vec(t) = collect(Float64, t)
+
+build_di_linear(u, t) = DI.LinearInterpolation(_vec(u), _vec(t))
+build_itp_linear_uniform(u, t) = ITP.linear_interpolation(t, u) # t may be a range
+build_itp_linear_nonuniform(u, t) = ITP.interpolate((_vec(t),), _vec(u), ITP.Gridded(ITP.Linear()))
+build_drx_linear(u, t) = DRX.Spline1D(_vec(t), _vec(u); k = 1, bc = "extrapolate")
+build_bi_linear(u, t) = BI.LinearInterpolator(_vec(t), _vec(u), BI.WeakBoundaries())
+
+# --- Cubic spline (natural BC for DI, Interpolations) --------------------
+build_di_cubic(u, t) = DI.CubicSpline(_vec(u), _vec(t))
+build_itp_cubic_uniform(u, t) = ITP.cubic_spline_interpolation(t, u)
+build_drx_cubic(u, t) = DRX.Spline1D(_vec(t), _vec(u); k = 3, bc = "extrapolate")
+build_bi_cubic(u, t) = BI.CubicSplineInterpolator(_vec(t), _vec(u), BI.WeakBoundaries())
+
+# --- Quadratic spline ----------------------------------------------------
+build_di_quadratic(u, t) = DI.QuadraticSpline(_vec(u), _vec(t))
+build_drx_quadratic(u, t) = DRX.Spline1D(_vec(t), _vec(u); k = 2, bc = "extrapolate")
+
+# --- Akima ---------------------------------------------------------------
+build_di_akima(u, t) = DI.AkimaInterpolation(_vec(u), _vec(t))
+
+# --- PCHIP / monotone cubic Hermite -------------------------------------
+function build_di_cubic_hermite(u, t)
+    uv = _vec(u)
+    tv = _vec(t)
+    n = length(tv)
+    du = similar(uv)
+    @inbounds for i in 2:(n - 1)
+        du[i] = (uv[i + 1] - uv[i - 1]) / (tv[i + 1] - tv[i - 1])
+    end
+    du[1] = (uv[2] - uv[1]) / (tv[2] - tv[1])
+    du[n] = (uv[n] - uv[n - 1]) / (tv[n] - tv[n - 1])
+    return DI.CubicHermiteSpline(du, uv, tv)
+end
+build_pchip(u, t) = PCHIP.Interpolator(_vec(t), _vec(u))
+
+# --- Single-eval dispatch -----------------------------------------------
+# DI, Dierckx, BasicInterpolators all use `A(x)`
+# Interpolations also uses `A(x)`
+# PCHIP uses `A(x)`
+single_eval(A, x) = A(x)
+
+# --- Batched eval --------------------------------------------------------
+# DI: `A(out, tt)` in-place; uses sorted-batch fast path when sorted.
+batched_eval_di!(out, A, tt) = A(out, tt)
+# Interpolations: broadcast (no native batched call)
+batched_eval_itp!(out, A, tt) = (out .= A.(tt); out)
+# Dierckx: has Spline1D batched evaluation (returns a new array). We'll call the
+# in-place form if we can find it; otherwise wrap broadcast.
+batched_eval_drx!(out, A::DRX.Spline1D, tt) = (out .= DRX.evaluate.(Ref(A), tt); out)
+# BasicInterpolators: broadcast
+batched_eval_bi!(out, A, tt) = (out .= A.(tt); out)
+# PCHIP: broadcast
+batched_eval_pchip!(out, A, tt) = (out .= A.(tt); out)
+
+# -----------------------------------------------------------------------------
+# Verification: every library should agree on the same query to within tol
+# -----------------------------------------------------------------------------
+
+function verify_agreement(algo, builders, u, t, tt; tol = 1.0e-6, ref_name = first(keys(builders)))
+    ref_build = builders[ref_name]
+    ref = ref_build(u, t)
+    ref_vals = [single_eval(ref, x) for x in tt]
+    for (name, build) in builders
+        name == ref_name && continue
+        A = build(u, t)
+        vals = [single_eval(A, x) for x in tt]
+        diff = maximum(abs.(ref_vals .- vals))
+        if diff > tol
+            @warn "Library $name disagrees with $ref_name on $algo by max diff $diff (tol=$tol)"
+        end
+    end
+    return nothing
+end
+
+# -----------------------------------------------------------------------------
+# Run sweep
+# -----------------------------------------------------------------------------
+
+const SMOKE = get(ENV, "BENCH_SMOKE", "0") != "0"
+
+const N_VALUES = SMOKE ? [100, 1_000] : [100, 1_000, 10_000, 100_000]
+const M_VALUES = SMOKE ? [10, 1_000] : [1, 10, 1_000, 100_000]
+const KNOT_PATTERNS = [:uniform, :nonuniform]
+
+# Algorithm spec:
+#   builders :: Dict{library => build_fun(u, t)}
+#   batched! :: Dict{library => (out, A, tt) -> ...}
+#   supports :: Dict{library => set of knot_patterns it supports}
+const ALGORITHMS = let
+    d = Dict{String, NamedTuple}()
+    d["Linear"] = (
+        builders = Dict(
+            "DataInterpolations" => build_di_linear,
+            "Interpolations (uniform)" => build_itp_linear_uniform,
+            "Interpolations (gridded)" => build_itp_linear_nonuniform,
+            "Dierckx (k=1)" => build_drx_linear,
+            "BasicInterpolators" => build_bi_linear,
+        ),
+        batched! = Dict(
+            "DataInterpolations" => batched_eval_di!,
+            "Interpolations (uniform)" => batched_eval_itp!,
+            "Interpolations (gridded)" => batched_eval_itp!,
+            "Dierckx (k=1)" => batched_eval_drx!,
+            "BasicInterpolators" => batched_eval_bi!,
+        ),
+        supports = Dict(
+            "DataInterpolations" => [:uniform, :nonuniform],
+            "Interpolations (uniform)" => [:uniform],
+            "Interpolations (gridded)" => [:uniform, :nonuniform],
+            "Dierckx (k=1)" => [:uniform, :nonuniform],
+            "BasicInterpolators" => [:uniform, :nonuniform],
+        ),
+    )
+    d["CubicSpline"] = (
+        builders = Dict(
+            "DataInterpolations" => build_di_cubic,
+            "Interpolations (uniform)" => build_itp_cubic_uniform,
+            "Dierckx (k=3)" => build_drx_cubic,
+            "BasicInterpolators" => build_bi_cubic,
+        ),
+        batched! = Dict(
+            "DataInterpolations" => batched_eval_di!,
+            "Interpolations (uniform)" => batched_eval_itp!,
+            "Dierckx (k=3)" => batched_eval_drx!,
+            "BasicInterpolators" => batched_eval_bi!,
+        ),
+        supports = Dict(
+            "DataInterpolations" => [:uniform, :nonuniform],
+            "Interpolations (uniform)" => [:uniform],
+            "Dierckx (k=3)" => [:uniform, :nonuniform],
+            "BasicInterpolators" => [:uniform, :nonuniform],
+        ),
+    )
+    d["QuadraticSpline"] = (
+        builders = Dict(
+            "DataInterpolations" => build_di_quadratic,
+            "Dierckx (k=2)" => build_drx_quadratic,
+        ),
+        batched! = Dict(
+            "DataInterpolations" => batched_eval_di!,
+            "Dierckx (k=2)" => batched_eval_drx!,
+        ),
+        supports = Dict(
+            "DataInterpolations" => [:uniform, :nonuniform],
+            "Dierckx (k=2)" => [:uniform, :nonuniform],
+        ),
+    )
+    d["Akima"] = (
+        builders = Dict("DataInterpolations" => build_di_akima),
+        batched! = Dict("DataInterpolations" => batched_eval_di!),
+        supports = Dict("DataInterpolations" => [:uniform, :nonuniform]),
+    )
+    d["MonotoneCubic"] = (
+        builders = Dict(
+            "DataInterpolations (CubicHermite)" => build_di_cubic_hermite,
+            "PCHIPInterpolation" => build_pchip,
+        ),
+        batched! = Dict(
+            "DataInterpolations (CubicHermite)" => batched_eval_di!,
+            "PCHIPInterpolation" => batched_eval_pchip!,
+        ),
+        supports = Dict(
+            "DataInterpolations (CubicHermite)" => [:uniform, :nonuniform],
+            "PCHIPInterpolation" => [:uniform, :nonuniform],
+        ),
+    )
+    d
+end
+
+# Quick agreement check (use small n)
+function run_agreement_checks()
+    println("\n== Cross-library agreement check ==")
+    tt_check = collect(range(0.05, 0.95; length = 11))
+    for knot in (:uniform, :nonuniform)
+        u, t = make_knots(50, knot)
+        for (algo, spec) in ALGORITHMS
+            # Filter builders that support this knot pattern
+            supported = Dict(k => v for (k, v) in spec.builders if knot in spec.supports[k])
+            length(supported) < 2 && continue
+            # Different algorithms can disagree slightly (different BCs). We use
+            # a moderately loose tolerance only meant to catch outright bugs.
+            tol = algo == "Linear" ? 1.0e-10 : (algo in ("CubicSpline", "QuadraticSpline") ? 5.0e-2 : 1.0e-1)
+            try
+                verify_agreement(algo, supported, u, t, tt_check; tol = tol)
+            catch e
+                @warn "Agreement check failed: $algo $knot" exception = (e, catch_backtrace())
+            end
+        end
+    end
+    return nothing
+end
+
+# -----------------------------------------------------------------------------
+# Bench cases
+# -----------------------------------------------------------------------------
+
+function warmup()
+    # Force compilation of every builder + dispatch path so the actual benchmarks
+    # measure work, not first-time compile.
+    println("Warming up…")
+    for knot in KNOT_PATTERNS
+        u, t = make_knots(100, knot)
+        tt = make_queries(8, :sorted)
+        out = similar(tt)
+        for (_algo, spec) in ALGORITHMS
+            for (lib, build) in spec.builders
+                knot in spec.supports[lib] || continue
+                A = try
+                    build(u, t)
+                catch
+                    continue
+                end
+                single_eval(A, 0.5)
+                try
+                    spec.batched![lib](out, A, tt)
+                catch
+                end
+            end
+        end
+    end
+    return nothing
+end
+
+function run_construction()
+    println("\n== Construction time ==")
+    for (algo, spec) in ALGORITHMS
+        for n in N_VALUES
+            for knot in KNOT_PATTERNS
+                u, t = make_knots(n, knot)
+                for (lib, build) in spec.builders
+                    knot in spec.supports[lib] || continue
+                    trial = try
+                        bench(build, u, t)
+                    catch e
+                        @warn "construction failed: $algo $lib n=$n knot=$knot" exception = e
+                        nothing
+                    end
+                    record!(
+                        "construction", algo, lib,
+                        string("n=", n, ",", knot),
+                        trial,
+                    )
+                    println(
+                        @sprintf(
+                            "  %-25s | %-30s | n=%-7d | %s | %s",
+                            algo, lib, n, String(knot), fmt_trial(trial)
+                        )
+                    )
+                end
+            end
+        end
+    end
+    return nothing
+end
+
+function run_single_query()
+    println("\n== Single-query latency ==")
+    x_query = 0.42718
+    for (algo, spec) in ALGORITHMS
+        for n in N_VALUES
+            for knot in KNOT_PATTERNS
+                u, t = make_knots(n, knot)
+                for (lib, build) in spec.builders
+                    knot in spec.supports[lib] || continue
+                    A = try
+                        build(u, t)
+                    catch e
+                        @warn "skipping single-query (build failed): $algo $lib n=$n" exception = e
+                        continue
+                    end
+                    trial = try
+                        bench(single_eval, A, x_query)
+                    catch e
+                        @warn "single-query failed: $algo $lib" exception = e
+                        nothing
+                    end
+                    record!(
+                        "single-query", algo, lib,
+                        string("n=", n, ",", knot),
+                        trial,
+                    )
+                    println(
+                        @sprintf(
+                            "  %-25s | %-30s | n=%-7d | %s | %s",
+                            algo, lib, n, String(knot), fmt_trial(trial)
+                        )
+                    )
+                end
+            end
+        end
+    end
+    return nothing
+end
+
+# For batched/random/chained, we hold n at a single representative knot pattern
+# (uniform) — exploring the cross-product of n × knot-pattern × m × query-pattern
+# would explode the runtime. The batched-call story is the same on non-uniform
+# (DI's sorted fast-path still kicks in).
+
+function run_batched(query_pattern::Symbol, m_values = M_VALUES)
+    label = query_pattern === :sorted ? "Sorted batch" :
+        query_pattern === :random ? "Random batch" :
+        "Chained ODE-style"
+    println("\n== $label ==")
+    knot = :uniform
+    for (algo, spec) in ALGORITHMS
+        for n in N_VALUES
+            u, t = make_knots(n, knot)
+            for m in m_values
+                tt = make_queries(m, query_pattern)
+                for (lib, build) in spec.builders
+                    knot in spec.supports[lib] || continue
+                    A = try
+                        build(u, t)
+                    catch e
+                        continue
+                    end
+                    out = similar(tt)
+                    batched! = spec.batched![lib]
+                    if query_pattern === :chained
+                        # Sequential single-eval loop is what ODE solvers do.
+                        # Don't use the batched interface for this case.
+                        f = (A, tt) -> begin
+                            s = 0.0
+                            for x in tt
+                                s += single_eval(A, x)
+                            end
+                            s
+                        end
+                        trial = try
+                            bench(f, A, tt)
+                        catch e
+                            @warn "chained eval failed: $algo $lib" exception = e
+                            nothing
+                        end
+                    else
+                        trial = try
+                            bench(batched!, out, A, tt)
+                        catch e
+                            @warn "batched eval failed: $algo $lib" exception = e
+                            nothing
+                        end
+                    end
+                    record!(
+                        string(label), algo, lib,
+                        string("n=", n, ",m=", m),
+                        trial,
+                    )
+                    println(
+                        @sprintf(
+                            "  %-25s | %-30s | n=%-7d | m=%-7d | %s",
+                            algo, lib, n, m, fmt_trial(trial)
+                        )
+                    )
+                end
+            end
+        end
+    end
+    return nothing
+end
+
+# -----------------------------------------------------------------------------
+# Markdown output
+# -----------------------------------------------------------------------------
+
+function library_order(libs)
+    # Stable order: DI first, then others alphabetically
+    di = filter(l -> startswith(l, "DataInterpolations"), libs)
+    others = sort(setdiff(libs, di))
+    return vcat(sort(di), others)
+end
+
+function unique_params(d)
+    return sort!(unique([p for ((_, p), _) in d]))
+end
+
+function unique_libs(d)
+    return sort!(unique([l for ((l, _), _) in d]))
+end
+
+function write_table(io::IO, key::AbstractString, d::Dict)
+    libs = library_order(unique_libs(d))
+    params = unique_params(d)
+    print(io, "\n### ", key, "\n\n")
+    # Header
+    print(io, "| Library | ")
+    for p in params
+        print(io, p, " | ")
+    end
+    print(io, "\n")
+    print(io, "|---|")
+    for _ in params
+        print(io, "---|")
+    end
+    print(io, "\n")
+    for lib in libs
+        print(io, "| ", lib, " | ")
+        for p in params
+            trial = get(d, (lib, p), nothing)
+            print(io, fmt_trial(trial), " | ")
+        end
+        print(io, "\n")
+    end
+    return nothing
+end
+
+function write_report(path::String; total_seconds = 0.0)
+    open(path, "w") do io
+        println(io, "# Cross-library 1D interpolation benchmark")
+        println(io)
+        println(io, "## Setup")
+        println(io)
+        # Host/Julia info
+        println(io, "```")
+        io_buf = IOBuffer()
+        versioninfo(io_buf)
+        print(io, String(take!(io_buf)))
+        println(io, "```")
+        println(io)
+        println(io, "Bench harness: `BenchmarkTools.@benchmark` with `evals=1`, max samples=$(BMK_SAMPLES), max seconds=$(BMK_SECONDS).")
+        println(io)
+        commit = read(`git -C $REPO_ROOT rev-parse HEAD`, String) |> strip
+        println(io, "Commit: `$commit`")
+        println(io)
+        println(io, "Library versions:")
+        println(io, "```")
+        deps = Pkg.project().dependencies
+        all_info = Pkg.dependencies()
+        for pkg in ("DataInterpolations", "Interpolations", "Dierckx", "BasicInterpolators", "PCHIPInterpolation", "BenchmarkTools")
+            if haskey(deps, pkg)
+                v = all_info[deps[pkg]].version
+                println(io, "  ", pkg, " ", v)
+            end
+        end
+        println(io, "```")
+        println(io)
+        println(io, "Total bench time: ", round(total_seconds; digits = 1), " s")
+        println(io)
+
+        # Section 1: construction
+        println(io, "## Construction time")
+        println(io)
+        println(io, "Rows = library, columns = (n, knot pattern). Values = median wall time (IQR).")
+        for key in sort!(collect(keys(RESULTS)))
+            startswith(key, "construction") || continue
+            algo = split(key, " | ")[2]
+            write_table(io, algo, RESULTS[key])
+        end
+
+        # Section 2: single-query latency
+        println(io, "\n## Single-query latency")
+        println(io)
+        println(io, "Cold single evaluation `A(x_query)`. Rows = library, columns = (n, knot pattern).")
+        for key in sort!(collect(keys(RESULTS)))
+            startswith(key, "single-query") || continue
+            algo = split(key, " | ")[2]
+            write_table(io, algo, RESULTS[key])
+        end
+
+        # Section 3: sorted batch
+        println(io, "\n## Sorted batch")
+        println(io)
+        println(io, "`A(out, tt)` where `tt` is sorted random points in domain. (knot pattern = uniform)")
+        for key in sort!(collect(keys(RESULTS)))
+            startswith(key, "Sorted batch") || continue
+            algo = split(key, " | ")[2]
+            write_table(io, algo, RESULTS[key])
+        end
+
+        # Section 4: random batch
+        println(io, "\n## Random batch")
+        println(io)
+        println(io, "`A(out, tt)` where `tt` is unsorted. (knot pattern = uniform)")
+        for key in sort!(collect(keys(RESULTS)))
+            startswith(key, "Random batch") || continue
+            algo = split(key, " | ")[2]
+            write_table(io, algo, RESULTS[key])
+        end
+
+        # Section 5: chained
+        println(io, "\n## Chained ODE-style")
+        println(io)
+        println(io, "Sequential `for x in tt; A(x); end` over a monotone sequence. (knot pattern = uniform)")
+        for key in sort!(collect(keys(RESULTS)))
+            startswith(key, "Chained ODE-style") || continue
+            algo = split(key, " | ")[2]
+            write_table(io, algo, RESULTS[key])
+        end
+
+        println(io, "\n## Reproducer")
+        println(io)
+        println(io, "Bench script: `bench/cross_library_comparison.jl`")
+        println(io)
+        println(io, "Bench Project.toml: `bench/Project.toml` (devs DI from `..`).")
+        println(io)
+        println(
+            io,
+            """
+            To rerun:
+            ```bash
+            cd /home/crackauc/sandbox/tmp_20260515_091703_4914/DataInterpolations.jl
+            git checkout fff-strategy-batched-evals
+            julia +1.11 --project=bench bench/cross_library_comparison.jl
+            ```
+            """,
+        )
+    end
+    return nothing
+end
+
+# -----------------------------------------------------------------------------
+# Top-level
+# -----------------------------------------------------------------------------
+
+function main()
+    println("Starting cross-library benchmark sweep…")
+    println("Bench dir: ", BENCH_DIR)
+
+    t_start = time()
+
+    run_agreement_checks()
+    warmup()
+
+    run_construction()
+    run_single_query()
+    run_batched(:sorted)
+    run_batched(:random)
+    # Chained is most interesting at moderate m; cap to avoid 100k single-evals on Dierckx etc.
+    run_batched(:chained, [1_000])
+
+    t_end = time()
+    total = t_end - t_start
+    println("\nTotal bench time: ", round(total; digits = 1), " s")
+
+    report_path = joinpath(BENCH_DIR, "cross_library_comparison.md")
+    write_report(report_path; total_seconds = total)
+    println("Wrote report to ", report_path)
+    return nothing
+end
+
+main()
diff --git a/bench/cross_library_comparison.md b/bench/cross_library_comparison.md
new file mode 100644
index 00000000..b964581d
--- /dev/null
+++ b/bench/cross_library_comparison.md
@@ -0,0 +1,279 @@
+# Cross-library 1D interpolation benchmark
+
+## Setup
+
+```
+Julia Version 1.11.9
+Commit 53a02c0720c (2026-02-06 00:27 UTC)
+Build Info:
+  Official https://julialang.org/ release
+Platform Info:
+  OS: Linux (x86_64-linux-gnu)
+  CPU: 128 × AMD EPYC 7502 32-Core Processor
+  WORD_SIZE: 64
+  LLVM: libLLVM-16.0.6 (ORCJIT, znver2)
+Threads: 1 default, 0 interactive, 1 GC (on 128 virtual cores)
+```
+
+Bench harness: `BenchmarkTools.@benchmark` with `evals=1`, max samples=100, max seconds=0.5.
+
+Commit: `e22f5d6a6fa8d72079b33209b910b9504c4cadde`
+
+Library versions:
+```
+  DataInterpolations 8.10.0
+  Interpolations 0.16.2
+  Dierckx 0.5.4
+  BasicInterpolators 0.7.1
+  PCHIPInterpolation 0.2.1
+  BenchmarkTools 1.8.0
+```
+
+Total bench time: 353.5 s
+
+## Headline findings
+
+These numbers are taken directly from the tables below. All cells are medians from `BenchmarkTools.@benchmark evals=1` runs.
+
+- **Sorted-batch + cached `Auto(t_props)` is DI's biggest cross-library win.** At cubic spline n=100 000, m=100 000 (sorted batch, uniform knots), DI evaluates in **1.78 ms** vs Dierckx 3.16 s (~**1 770× faster**), BasicInterpolators 7.94 ms (~**4.5× faster**), and PCHIP at n=100k m=100k (sorted) 9.70 ms (~**5.3× faster** for monotone cubic). The only library that beats DI on this row is **Interpolations.jl's uniform constructor (2.06 ms, ~16% faster)** because it uses O(1) uniform-grid index lookup; DI still wins against every non-uniform-capable competitor. At linear n=100k m=100k sorted batch, DI is **1.64 ms** vs Dierckx 3.18 s (~**1 940×**) and BasicInterpolators 7.89 ms (~**4.8×**).
+
+- **`Auto(t_props)` also dominates the random / unsorted-batch case** because the cached search-property is re-used on every evaluation, not re-probed. At cubic n=100k m=100k *random* batch, DI is **6.87 ms** vs Dierckx 3.15 s (~**460×**), BasicInterpolators 19.8 ms (~**2.9×**); Interpolations(uniform) is still ahead at 2.06 ms (O(1) index). Even at random unsorted access, DI competes with — and on every non-uniform library beats — the alternatives.
+
+- **DI wins the chained ODE-style case decisively at large n.** Cubic spline, n=100k, m=1000 monotone chain: DI **69.6 μs** vs Dierckx 31.5 ms (~**450×**), BasicInterpolators 137 μs (~**2.0×**). MonotoneCubic chained, n=100k m=1000: DI 71.9 μs vs PCHIPInterpolation 149 μs (~**2.1×**). This is exactly the workload DI's `iguesser` was designed for; libraries without hint-chaining (Dierckx, BasicInterpolators, PCHIP) lose by ~2× to ~450×.
+
+- **Where DI loses on small m or single-eval:** single-query cubic at n=100k is 80 ns (DI) vs 50 ns (BasicInterpolators) and 70 ns (Interpolations uniform) — within ~1.5×, but consistently slightly slower because DI does a real index lookup whereas the others can use a one-shot uniform divide. At `sorted batch m=10 / n=10000` linear, DI is 500 ns vs Interpolations(uniform) 120 ns (4×) because DI's sorted-batch fast-path uses an O(m log n) per-element bisect plus allocates a small idx buffer; at this very small m the buffer alloc overhead dominates.
+
+- **DI QuadraticSpline is a clear loser, by ~2-5× across the board.** At n=100k construction DI takes **7.0 s** vs Dierckx 13.9 ms (~**500× slower**). At n=10k construction DI is 65.7 ms vs Dierckx 1.37 ms (~48×). Inspection traces this to `quadratic_spline_params` calling `spline_coefficients!` which does `findfirst(x -> x > u, k)` — a linear scan inside a loop over `n` knots, making the QuadraticSpline constructor **O(n²)**. The QuadraticSpline single-query at n=100k is also 60-110 μs (vs Dierckx 13-55 μs) and the batched evaluators at n=100k m=100k cost 7.0 s (vs Dierckx 3.2 s). This is the most actionable finding in the entire report.
+
+- **DI CubicHermiteSpline (used here as PCHIP analogue) beats PCHIPInterpolation.jl on every batched cell.** Sorted batch n=100k m=100k: DI 1.83 ms vs PCHIP 9.70 ms (~5.3×). Random batch n=100k m=100k: DI 7.28 ms vs PCHIP 20.4 ms (~2.8×). Chained n=100k m=1000: DI 72 μs vs PCHIP 149 μs (~2.1×). Construction is also slightly faster across all n.
+
+- **`Interpolations.jl`'s `cubic_spline_interpolation` / `linear_interpolation` over a `range` is the ceiling we're chasing on uniform data.** Because it does O(1) index lookup, it beats DI on every uniform-grid case where the lookup cost dominates: linear n=100k single-query 60 ns (DI 80 ns), linear sorted-batch n=100k m=100k 658 μs (DI 1.64 ms, ~2.5×), cubic sorted-batch n=100k m=100k 2.06 ms (DI 1.78 ms — DI wins here). It cannot handle non-uniform cubic at all; it falls back to `Gridded(Linear)` only. So the comparison is really "DI generalised to non-uniform & O(log n) lookup" vs "Interpolations specialised to uniform & O(1) lookup."
+
+## Construction time
+
+Rows = library, columns = (n, knot pattern). Values = median wall time (IQR).
+
+### Akima
+
+| Library | n=100,nonuniform | n=100,uniform | n=1000,nonuniform | n=1000,uniform | n=10000,nonuniform | n=10000,uniform | n=100000,nonuniform | n=100000,uniform | 
+|---|---|---|---|---|---|---|---|---|
+| DataInterpolations | 2.195 μs (IQR 320.000 ns) | 2.285 μs (IQR 427.500 ns) | 31.189 μs (IQR 4.425 μs) | 44.820 μs (IQR 6.655 μs) | 117.964 μs (IQR 1.608 μs) | 182.268 μs (IQR 233.136 μs) | 1.203 ms (IQR 55.989 μs) | 1.269 ms (IQR 42.470 μs) | 
+
+### CubicSpline
+
+| Library | n=100,nonuniform | n=100,uniform | n=1000,nonuniform | n=1000,uniform | n=10000,nonuniform | n=10000,uniform | n=100000,nonuniform | n=100000,uniform | 
+|---|---|---|---|---|---|---|---|---|
+| DataInterpolations | 7.450 μs (IQR 3.060 μs) | 6.880 μs (IQR 675.000 ns) | 56.620 μs (IQR 3.062 μs) | 60.729 μs (IQR 26.519 μs) | 507.370 μs (IQR 9.600 μs) | 580.565 μs (IQR 948.358 μs) | 5.510 ms (IQR 1.113 ms) | 5.229 ms (IQR 863.691 μs) | 
+| BasicInterpolators | 4.305 μs (IQR 542.500 ns) | 4.430 μs (IQR 475.000 ns) | 37.569 μs (IQR 2.132 μs) | 39.330 μs (IQR 4.598 μs) | 714.473 μs (IQR 401.371 μs) | 1.025 ms (IQR 714.324 μs) | 3.287 ms (IQR 894.667 μs) | 3.315 ms (IQR 848.164 μs) | 
+| Dierckx (k=3) | 17.674 μs (IQR 739.250 ns) | 17.600 μs (IQR 1.215 μs) | 208.738 μs (IQR 51.890 μs) | 212.863 μs (IQR 6.742 μs) | 1.608 ms (IQR 84.278 μs) | 1.745 ms (IQR 548.674 μs) | 17.461 ms (IQR 6.682 ms) | 18.954 ms (IQR 6.357 ms) | 
+| Interpolations (uniform) | — | 15.274 μs (IQR 734.250 ns) | — | 137.884 μs (IQR 19.681 μs) | — | 1.442 ms (IQR 464.458 μs) | — | 8.195 ms (IQR 134.718 μs) | 
+
+### Linear
+
+| Library | n=100,nonuniform | n=100,uniform | n=1000,nonuniform | n=1000,uniform | n=10000,nonuniform | n=10000,uniform | n=100000,nonuniform | n=100000,uniform | 
+|---|---|---|---|---|---|---|---|---|
+| DataInterpolations | 1.260 μs (IQR 185.000 ns) | 1.450 μs (IQR 267.500 ns) | 10.200 μs (IQR 320.250 ns) | 11.110 μs (IQR 354.250 ns) | 92.584 μs (IQR 826.750 ns) | 101.064 μs (IQR 967.500 ns) | 930.192 μs (IQR 9.795 μs) | 998.760 μs (IQR 7.260 μs) | 
+| BasicInterpolators | 1.190 μs (IQR 212.500 ns) | 1.290 μs (IQR 235.000 ns) | 7.905 μs (IQR 505.000 ns) | 8.960 μs (IQR 1.292 μs) | 59.559 μs (IQR 1.714 μs) | 67.840 μs (IQR 1.940 μs) | 594.784 μs (IQR 9.875 μs) | 671.909 μs (IQR 10.883 μs) | 
+| Dierckx (k=1) | 11.919 μs (IQR 2.472 μs) | 12.485 μs (IQR 1.991 μs) | 79.025 μs (IQR 2.056 μs) | 108.474 μs (IQR 14.793 μs) | 790.987 μs (IQR 114.966 μs) | 1.019 ms (IQR 266.517 μs) | 7.557 ms (IQR 622.339 μs) | 7.581 ms (IQR 727.211 μs) | 
+| Interpolations (gridded) | 940.000 ns (IQR 162.500 ns) | 1.030 μs (IQR 222.500 ns) | 7.580 μs (IQR 537.250 ns) | 11.495 μs (IQR 10.139 μs) | 64.489 μs (IQR 977.500 ns) | 147.218 μs (IQR 76.435 μs) | 630.804 μs (IQR 14.617 μs) | 723.713 μs (IQR 18.942 μs) | 
+| Interpolations (uniform) | — | 215.000 ns (IQR 142.500 ns) | — | 3.204 μs (IQR 1.998 μs) | — | 22.045 μs (IQR 4.760 μs) | — | 75.369 μs (IQR 8.617 μs) | 
+
+### MonotoneCubic
+
+| Library | n=100,nonuniform | n=100,uniform | n=1000,nonuniform | n=1000,uniform | n=10000,nonuniform | n=10000,uniform | n=100000,nonuniform | n=100000,uniform | 
+|---|---|---|---|---|---|---|---|---|
+| DataInterpolations (CubicHermite) | 1.400 μs (IQR 222.500 ns) | 1.545 μs (IQR 292.500 ns) | 10.195 μs (IQR 500.000 ns) | 11.000 μs (IQR 448.250 ns) | 87.144 μs (IQR 975.250 ns) | 94.999 μs (IQR 670.000 ns) | 868.637 μs (IQR 11.227 μs) | 953.866 μs (IQR 14.377 μs) | 
+| PCHIPInterpolation | 1.660 μs (IQR 420.000 ns) | 1.780 μs (IQR 452.500 ns) | 13.255 μs (IQR 960.500 ns) | 14.490 μs (IQR 1.624 μs) | 109.594 μs (IQR 1.990 μs) | 116.719 μs (IQR 1.327 μs) | 1.092 ms (IQR 21.902 μs) | 1.181 ms (IQR 35.152 μs) | 
+
+### QuadraticSpline
+
+| Library | n=100,nonuniform | n=100,uniform | n=1000,nonuniform | n=1000,uniform | n=10000,nonuniform | n=10000,uniform | n=100000,nonuniform | n=100000,uniform | 
+|---|---|---|---|---|---|---|---|---|
+| DataInterpolations | 16.825 μs (IQR 904.250 ns) | 16.880 μs (IQR 865.750 ns) | 744.113 μs (IQR 19.005 μs) | 766.238 μs (IQR 39.012 μs) | 65.719 ms (IQR 401.579 μs) | 66.057 ms (IQR 689.417 μs) | 6.978 s (IQR 0.000 ns) | 7.028 s (IQR 0.000 ns) | 
+| Dierckx (k=2) | 18.560 μs (IQR 1.295 μs) | 17.700 μs (IQR 3.228 μs) | 137.524 μs (IQR 1.077 μs) | 175.948 μs (IQR 8.215 μs) | 1.371 ms (IQR 61.880 μs) | 1.583 ms (IQR 193.173 μs) | 13.906 ms (IQR 997.231 μs) | 13.571 ms (IQR 1.787 ms) | 
+
+## Single-query latency
+
+Cold single evaluation `A(x_query)`. Rows = library, columns = (n, knot pattern).
+
+### Akima
+
+| Library | n=100,nonuniform | n=100,uniform | n=1000,nonuniform | n=1000,uniform | n=10000,nonuniform | n=10000,uniform | n=100000,nonuniform | n=100000,uniform | 
+|---|---|---|---|---|---|---|---|---|
+| DataInterpolations | 70.000 ns (IQR 10.000 ns) | 70.000 ns (IQR 0.000 ns) | 70.000 ns (IQR 10.000 ns) | 70.000 ns (IQR 10.000 ns) | 90.000 ns (IQR 10.000 ns) | 75.000 ns (IQR 10.000 ns) | 100.000 ns (IQR 0.000 ns) | 70.000 ns (IQR 10.000 ns) | 
+
+### CubicSpline
+
+| Library | n=100,nonuniform | n=100,uniform | n=1000,nonuniform | n=1000,uniform | n=10000,nonuniform | n=10000,uniform | n=100000,nonuniform | n=100000,uniform | 
+|---|---|---|---|---|---|---|---|---|
+| DataInterpolations | 80.000 ns (IQR 10.000 ns) | 80.000 ns (IQR 10.000 ns) | 70.000 ns (IQR 10.000 ns) | 80.000 ns (IQR 10.000 ns) | 100.000 ns (IQR 10.000 ns) | 80.000 ns (IQR 10.000 ns) | 110.000 ns (IQR 10.000 ns) | 80.000 ns (IQR 0.000 ns) | 
+| BasicInterpolators | 50.000 ns (IQR 0.000 ns) | 50.000 ns (IQR 0.000 ns) | 50.000 ns (IQR 10.000 ns) | 50.000 ns (IQR 10.000 ns) | 60.000 ns (IQR 0.000 ns) | 60.000 ns (IQR 0.000 ns) | 65.000 ns (IQR 10.000 ns) | 70.000 ns (IQR 0.000 ns) | 
+| Dierckx (k=3) | 160.000 ns (IQR 10.000 ns) | 160.000 ns (IQR 10.000 ns) | 390.000 ns (IQR 10.000 ns) | 400.000 ns (IQR 10.000 ns) | 2.780 μs (IQR 0.000 ns) | 2.790 μs (IQR 10.000 ns) | 26.750 μs (IQR 40.000 ns) | 26.650 μs (IQR 89.250 ns) | 
+| Interpolations (uniform) | — | 80.000 ns (IQR 10.000 ns) | — | 80.000 ns (IQR 10.000 ns) | — | 80.000 ns (IQR 0.000 ns) | — | 80.000 ns (IQR 10.000 ns) | 
+
+### Linear
+
+| Library | n=100,nonuniform | n=100,uniform | n=1000,nonuniform | n=1000,uniform | n=10000,nonuniform | n=10000,uniform | n=100000,nonuniform | n=100000,uniform | 
+|---|---|---|---|---|---|---|---|---|
+| DataInterpolations | 70.000 ns (IQR 0.000 ns) | 80.000 ns (IQR 0.000 ns) | 70.000 ns (IQR 0.000 ns) | 80.000 ns (IQR 0.000 ns) | 90.000 ns (IQR 10.000 ns) | 80.000 ns (IQR 10.000 ns) | 100.000 ns (IQR 10.000 ns) | 80.000 ns (IQR 0.000 ns) | 
+| BasicInterpolators | 50.000 ns (IQR 10.000 ns) | 50.000 ns (IQR 0.000 ns) | 60.000 ns (IQR 10.000 ns) | 60.000 ns (IQR 0.000 ns) | 70.000 ns (IQR 10.000 ns) | 70.000 ns (IQR 10.000 ns) | 70.000 ns (IQR 0.000 ns) | 70.000 ns (IQR 0.000 ns) | 
+| Dierckx (k=1) | 120.000 ns (IQR 10.000 ns) | 120.000 ns (IQR 10.000 ns) | 350.000 ns (IQR 0.000 ns) | 370.000 ns (IQR 10.000 ns) | 2.760 μs (IQR 0.000 ns) | 2.770 μs (IQR 10.000 ns) | 26.729 μs (IQR 42.250 ns) | 26.630 μs (IQR 72.500 ns) | 
+| Interpolations (gridded) | 60.000 ns (IQR 0.000 ns) | 60.000 ns (IQR 10.000 ns) | 70.000 ns (IQR 10.000 ns) | 70.000 ns (IQR 0.000 ns) | 70.000 ns (IQR 10.000 ns) | 70.000 ns (IQR 0.000 ns) | 80.000 ns (IQR 0.000 ns) | 80.000 ns (IQR 10.000 ns) | 
+| Interpolations (uniform) | — | 60.000 ns (IQR 0.000 ns) | — | 60.000 ns (IQR 0.000 ns) | — | 60.000 ns (IQR 0.000 ns) | — | 60.000 ns (IQR 0.000 ns) | 
+
+### MonotoneCubic
+
+| Library | n=100,nonuniform | n=100,uniform | n=1000,nonuniform | n=1000,uniform | n=10000,nonuniform | n=10000,uniform | n=100000,nonuniform | n=100000,uniform | 
+|---|---|---|---|---|---|---|---|---|
+| DataInterpolations (CubicHermite) | 80.000 ns (IQR 0.000 ns) | 90.000 ns (IQR 10.000 ns) | 80.000 ns (IQR 0.000 ns) | 90.000 ns (IQR 0.000 ns) | 100.000 ns (IQR 0.000 ns) | 90.000 ns (IQR 10.000 ns) | 120.000 ns (IQR 0.000 ns) | 90.000 ns (IQR 0.000 ns) | 
+| PCHIPInterpolation | 70.000 ns (IQR 10.000 ns) | 70.000 ns (IQR 0.000 ns) | 80.000 ns (IQR 0.000 ns) | 80.000 ns (IQR 0.000 ns) | 90.000 ns (IQR 0.000 ns) | 90.000 ns (IQR 0.000 ns) | 100.000 ns (IQR 10.000 ns) | 100.000 ns (IQR 10.000 ns) | 
+
+### QuadraticSpline
+
+| Library | n=100,nonuniform | n=100,uniform | n=1000,nonuniform | n=1000,uniform | n=10000,nonuniform | n=10000,uniform | n=100000,nonuniform | n=100000,uniform | 
+|---|---|---|---|---|---|---|---|---|
+| DataInterpolations | 180.000 ns (IQR 0.000 ns) | 190.000 ns (IQR 10.000 ns) | 660.000 ns (IQR 10.000 ns) | 710.000 ns (IQR 10.000 ns) | 5.810 μs (IQR 10.000 ns) | 5.820 μs (IQR 19.000 ns) | 62.569 μs (IQR 243.500 ns) | 62.474 μs (IQR 163.250 ns) | 
+| Dierckx (k=2) | 140.000 ns (IQR 0.000 ns) | 170.000 ns (IQR 32.500 ns) | 370.000 ns (IQR 0.000 ns) | 390.000 ns (IQR 0.000 ns) | 2.780 μs (IQR 10.000 ns) | 2.780 μs (IQR 10.000 ns) | 26.739 μs (IQR 73.250 ns) | 26.670 μs (IQR 59.000 ns) | 
+
+## Sorted batch
+
+`A(out, tt)` where `tt` is sorted random points in domain. (knot pattern = uniform)
+
+### Akima
+
+| Library | n=100,m=1 | n=100,m=10 | n=100,m=1000 | n=100,m=100000 | n=1000,m=1 | n=1000,m=10 | n=1000,m=1000 | n=1000,m=100000 | n=10000,m=1 | n=10000,m=10 | n=10000,m=1000 | n=10000,m=100000 | n=100000,m=1 | n=100000,m=10 | n=100000,m=1000 | n=100000,m=100000 | 
+|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
+| DataInterpolations | 110.000 ns (IQR 10.000 ns) | 170.000 ns (IQR 10.000 ns) | 4.900 μs (IQR 1.530 μs) | 323.432 μs (IQR 2.525 μs) | 120.000 ns (IQR 0.000 ns) | 340.000 ns (IQR 10.000 ns) | 5.195 μs (IQR 30.000 ns) | 341.772 μs (IQR 1.866 μs) | 120.000 ns (IQR 10.000 ns) | 430.000 ns (IQR 10.000 ns) | 12.070 μs (IQR 412.500 ns) | 479.050 μs (IQR 9.502 μs) | 140.000 ns (IQR 10.000 ns) | 510.000 ns (IQR 10.000 ns) | 140.203 μs (IQR 1.752 μs) | 1.436 ms (IQR 26.067 μs) | 
+
+### CubicSpline
+
+| Library | n=100,m=1 | n=100,m=10 | n=100,m=1000 | n=100,m=100000 | n=1000,m=1 | n=1000,m=10 | n=1000,m=1000 | n=1000,m=100000 | n=10000,m=1 | n=10000,m=10 | n=10000,m=1000 | n=10000,m=100000 | n=100000,m=1 | n=100000,m=10 | n=100000,m=1000 | n=100000,m=100000 | 
+|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
+| DataInterpolations | 130.000 ns (IQR 10.000 ns) | 200.000 ns (IQR 10.000 ns) | 10.030 μs (IQR 20.000 ns) | 975.096 μs (IQR 13.203 μs) | 130.000 ns (IQR 0.000 ns) | 420.000 ns (IQR 10.000 ns) | 9.920 μs (IQR 20.000 ns) | 973.951 μs (IQR 22.567 μs) | 140.000 ns (IQR 10.000 ns) | 490.000 ns (IQR 10.000 ns) | 15.420 μs (IQR 50.000 ns) | 1.019 ms (IQR 9.423 μs) | 140.000 ns (IQR 10.000 ns) | 580.000 ns (IQR 10.000 ns) | 151.668 μs (IQR 4.980 μs) | 1.779 ms (IQR 21.049 μs) | 
+| BasicInterpolators | 70.000 ns (IQR 10.000 ns) | 180.000 ns (IQR 10.000 ns) | 16.315 μs (IQR 302.500 ns) | 1.369 ms (IQR 19.600 μs) | 70.000 ns (IQR 0.000 ns) | 240.000 ns (IQR 0.000 ns) | 42.385 μs (IQR 948.500 ns) | 2.034 ms (IQR 21.232 μs) | 70.000 ns (IQR 10.000 ns) | 300.000 ns (IQR 10.000 ns) | 79.069 μs (IQR 1.113 μs) | 4.233 ms (IQR 66.511 μs) | 80.000 ns (IQR 0.000 ns) | 370.000 ns (IQR 10.000 ns) | 130.333 μs (IQR 2.495 μs) | 7.938 ms (IQR 43.734 μs) | 
+| Dierckx (k=3) | 190.000 ns (IQR 0.000 ns) | 1.220 μs (IQR 0.000 ns) | 121.929 μs (IQR 30.250 ns) | 11.761 ms (IQR 53.174 μs) | 710.000 ns (IQR 10.000 ns) | 3.620 μs (IQR 0.250 ns) | 408.796 μs (IQR 188.500 ns) | 41.214 ms (IQR 255.653 μs) | 5.710 μs (IQR 10.000 ns) | 26.890 μs (IQR 20.000 ns) | 3.210 ms (IQR 28.301 μs) | 323.867 ms (IQR 20.851 μs) | 55.660 μs (IQR 70.000 ns) | 260.212 μs (IQR 242.250 ns) | 31.300 ms (IQR 245.060 μs) | 3.157 s (IQR 0.000 ns) | 
+| Interpolations (uniform) | 90.000 ns (IQR 10.000 ns) | 270.000 ns (IQR 0.000 ns) | 20.469 μs (IQR 10.000 ns) | 2.050 ms (IQR 13.412 μs) | 90.000 ns (IQR 10.000 ns) | 270.000 ns (IQR 0.000 ns) | 20.460 μs (IQR 1.000 ns) | 2.050 ms (IQR 13.490 μs) | 90.000 ns (IQR 10.000 ns) | 270.000 ns (IQR 0.000 ns) | 20.460 μs (IQR 30.000 ns) | 2.050 ms (IQR 11.105 μs) | 90.000 ns (IQR 10.000 ns) | 270.000 ns (IQR 0.000 ns) | 20.450 μs (IQR 20.000 ns) | 2.057 ms (IQR 21.207 μs) | 
+
+### Linear
+
+| Library | n=100,m=1 | n=100,m=10 | n=100,m=1000 | n=100,m=100000 | n=1000,m=1 | n=1000,m=10 | n=1000,m=1000 | n=1000,m=100000 | n=10000,m=1 | n=10000,m=10 | n=10000,m=1000 | n=10000,m=100000 | n=100000,m=1 | n=100000,m=10 | n=100000,m=1000 | n=100000,m=100000 | 
+|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
+| DataInterpolations | 120.000 ns (IQR 10.000 ns) | 180.000 ns (IQR 0.000 ns) | 5.830 μs (IQR 10.000 ns) | 469.835 μs (IQR 4.003 μs) | 120.000 ns (IQR 10.000 ns) | 380.000 ns (IQR 10.000 ns) | 6.210 μs (IQR 50.000 ns) | 485.851 μs (IQR 1.160 μs) | 120.000 ns (IQR 10.000 ns) | 450.000 ns (IQR 10.000 ns) | 15.390 μs (IQR 1.252 μs) | 629.649 μs (IQR 950.000 ns) | 130.000 ns (IQR 0.000 ns) | 540.000 ns (IQR 10.000 ns) | 141.224 μs (IQR 3.203 μs) | 1.644 ms (IQR 9.440 μs) | 
+| BasicInterpolators | 60.000 ns (IQR 0.000 ns) | 200.000 ns (IQR 0.000 ns) | 16.205 μs (IQR 350.250 ns) | 1.378 ms (IQR 13.425 μs) | 70.000 ns (IQR 10.000 ns) | 240.000 ns (IQR 0.000 ns) | 41.170 μs (IQR 2.439 μs) | 2.053 ms (IQR 9.387 μs) | 70.000 ns (IQR 10.000 ns) | 310.000 ns (IQR 0.000 ns) | 76.659 μs (IQR 3.703 μs) | 4.179 ms (IQR 15.650 μs) | 80.000 ns (IQR 0.000 ns) | 380.000 ns (IQR 10.000 ns) | 123.879 μs (IQR 2.312 μs) | 7.892 ms (IQR 63.663 μs) | 
+| Dierckx (k=1) | 150.000 ns (IQR 10.000 ns) | 850.000 ns (IQR 10.000 ns) | 87.719 μs (IQR 1.460 μs) | 8.265 ms (IQR 132.779 μs) | 670.000 ns (IQR 10.000 ns) | 3.280 μs (IQR 820.000 ns) | 373.336 μs (IQR 5.365 μs) | 37.651 ms (IQR 73.838 μs) | 5.660 μs (IQR 30.000 ns) | 26.730 μs (IQR 50.000 ns) | 3.168 ms (IQR 24.134 μs) | 319.511 ms (IQR 16.000 μs) | 55.640 μs (IQR 113.250 ns) | 261.808 μs (IQR 933.000 ns) | 31.246 ms (IQR 377.619 μs) | 3.186 s (IQR 0.000 ns) | 
+| Interpolations (gridded) | 70.000 ns (IQR 0.000 ns) | 230.000 ns (IQR 0.000 ns) | 18.250 μs (IQR 50.250 ns) | 1.635 ms (IQR 23.676 μs) | 70.000 ns (IQR 10.000 ns) | 300.000 ns (IQR 0.000 ns) | 48.190 μs (IQR 3.190 μs) | 2.548 ms (IQR 41.645 μs) | 80.000 ns (IQR 0.000 ns) | 360.000 ns (IQR 10.000 ns) | 90.964 μs (IQR 3.175 μs) | 4.704 ms (IQR 63.885 μs) | 84.500 ns (IQR 10.000 ns) | 430.000 ns (IQR 0.000 ns) | 141.284 μs (IQR 2.475 μs) | 7.996 ms (IQR 40.135 μs) | 
+| Interpolations (uniform) | 60.000 ns (IQR 10.000 ns) | 120.000 ns (IQR 0.000 ns) | 6.610 μs (IQR 0.000 ns) | 655.124 μs (IQR 583.250 ns) | 70.000 ns (IQR 10.000 ns) | 120.000 ns (IQR 0.000 ns) | 6.600 μs (IQR 20.000 ns) | 655.409 μs (IQR 12.107 μs) | 70.000 ns (IQR 10.000 ns) | 120.000 ns (IQR 0.000 ns) | 6.670 μs (IQR 30.000 ns) | 655.644 μs (IQR 702.500 ns) | 70.000 ns (IQR 10.000 ns) | 120.000 ns (IQR 0.000 ns) | 7.060 μs (IQR 50.000 ns) | 658.249 μs (IQR 1.255 μs) | 
+
+### MonotoneCubic
+
+| Library | n=100,m=1 | n=100,m=10 | n=100,m=1000 | n=100,m=100000 | n=1000,m=1 | n=1000,m=10 | n=1000,m=1000 | n=1000,m=100000 | n=10000,m=1 | n=10000,m=10 | n=10000,m=1000 | n=10000,m=100000 | n=100000,m=1 | n=100000,m=10 | n=100000,m=1000 | n=100000,m=100000 | 
+|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
+| DataInterpolations (CubicHermite) | 130.000 ns (IQR 30.000 ns) | 340.000 ns (IQR 10.000 ns) | 10.490 μs (IQR 20.250 ns) | 988.671 μs (IQR 9.099 μs) | 140.000 ns (IQR 10.000 ns) | 420.000 ns (IQR 10.000 ns) | 10.649 μs (IQR 30.000 ns) | 989.491 μs (IQR 14.422 μs) | 140.000 ns (IQR 0.000 ns) | 500.000 ns (IQR 10.000 ns) | 19.150 μs (IQR 80.000 ns) | 1.067 ms (IQR 11.665 μs) | 150.000 ns (IQR 0.000 ns) | 580.000 ns (IQR 10.000 ns) | 146.929 μs (IQR 2.422 μs) | 1.825 ms (IQR 19.328 μs) | 
+| PCHIPInterpolation | 70.000 ns (IQR 10.000 ns) | 240.000 ns (IQR 0.000 ns) | 20.389 μs (IQR 437.500 ns) | 1.867 ms (IQR 24.703 μs) | 90.000 ns (IQR 0.000 ns) | 330.000 ns (IQR 0.000 ns) | 39.885 μs (IQR 881.750 ns) | 2.972 ms (IQR 17.169 μs) | 100.000 ns (IQR 0.000 ns) | 440.000 ns (IQR 10.000 ns) | 79.079 μs (IQR 4.630 μs) | 5.475 ms (IQR 51.462 μs) | 110.000 ns (IQR 0.000 ns) | 510.000 ns (IQR 10.000 ns) | 133.694 μs (IQR 4.237 μs) | 9.703 ms (IQR 97.707 μs) | 
+
+### QuadraticSpline
+
+| Library | n=100,m=1 | n=100,m=10 | n=100,m=1000 | n=100,m=100000 | n=1000,m=1 | n=1000,m=10 | n=1000,m=1000 | n=1000,m=100000 | n=10000,m=1 | n=10000,m=10 | n=10000,m=1000 | n=10000,m=100000 | n=100000,m=1 | n=100000,m=10 | n=100000,m=1000 | n=100000,m=100000 | 
+|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
+| DataInterpolations | 290.000 ns (IQR 10.000 ns) | 1.370 μs (IQR 0.000 ns) | 137.279 μs (IQR 811.750 ns) | 13.395 ms (IQR 177.476 μs) | 1.260 μs (IQR 0.000 ns) | 6.600 μs (IQR 12.250 ns) | 722.878 μs (IQR 1.238 μs) | 72.672 ms (IQR 365.231 μs) | 10.915 μs (IQR 30.000 ns) | 56.859 μs (IQR 70.000 ns) | 6.588 ms (IQR 72.728 μs) | 660.689 ms (IQR 0.000 ns) | 112.729 μs (IQR 162.500 ns) | 607.684 μs (IQR 7.387 μs) | 70.380 ms (IQR 419.419 μs) | 7.038 s (IQR 0.000 ns) | 
+| Dierckx (k=2) | 170.000 ns (IQR 0.000 ns) | 1.030 μs (IQR 10.000 ns) | 103.394 μs (IQR 260.000 ns) | 9.983 ms (IQR 106.786 μs) | 680.000 ns (IQR 10.000 ns) | 3.450 μs (IQR 10.000 ns) | 390.976 μs (IQR 1.002 μs) | 39.394 ms (IQR 210.678 μs) | 5.690 μs (IQR 13.250 ns) | 26.760 μs (IQR 20.000 ns) | 3.190 ms (IQR 47.677 μs) | 322.009 ms (IQR 65.414 μs) | 55.739 μs (IQR 115.000 ns) | 260.118 μs (IQR 761.500 ns) | 31.568 ms (IQR 621.605 μs) | 3.207 s (IQR 0.000 ns) | 
+
+## Random batch
+
+`A(out, tt)` where `tt` is unsorted. (knot pattern = uniform)
+
+### Akima
+
+| Library | n=100,m=1 | n=100,m=10 | n=100,m=1000 | n=100,m=100000 | n=1000,m=1 | n=1000,m=10 | n=1000,m=1000 | n=1000,m=100000 | n=10000,m=1 | n=10000,m=10 | n=10000,m=1000 | n=10000,m=100000 | n=100000,m=1 | n=100000,m=10 | n=100000,m=1000 | n=100000,m=100000 | 
+|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
+| DataInterpolations | 120.000 ns (IQR 10.000 ns) | 450.000 ns (IQR 0.000 ns) | 47.359 μs (IQR 171.500 ns) | 4.831 ms (IQR 31.837 μs) | 120.000 ns (IQR 0.000 ns) | 450.000 ns (IQR 0.000 ns) | 48.005 μs (IQR 194.750 ns) | 4.898 ms (IQR 32.682 μs) | 130.000 ns (IQR 10.000 ns) | 430.000 ns (IQR 10.000 ns) | 52.684 μs (IQR 263.500 ns) | 5.357 ms (IQR 57.461 μs) | 140.000 ns (IQR 10.000 ns) | 440.000 ns (IQR 10.000 ns) | 59.049 μs (IQR 342.500 ns) | 6.366 ms (IQR 52.595 μs) | 
+
+### CubicSpline
+
+| Library | n=100,m=1 | n=100,m=10 | n=100,m=1000 | n=100,m=100000 | n=1000,m=1 | n=1000,m=10 | n=1000,m=1000 | n=1000,m=100000 | n=10000,m=1 | n=10000,m=10 | n=10000,m=1000 | n=10000,m=100000 | n=100000,m=1 | n=100000,m=10 | n=100000,m=1000 | n=100000,m=100000 | 
+|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
+| DataInterpolations | 130.000 ns (IQR 10.000 ns) | 490.000 ns (IQR 10.000 ns) | 51.094 μs (IQR 95.500 ns) | 5.201 ms (IQR 58.934 μs) | 130.000 ns (IQR 0.000 ns) | 490.000 ns (IQR 0.000 ns) | 52.210 μs (IQR 255.000 ns) | 5.480 ms (IQR 26.636 μs) | 140.000 ns (IQR 0.000 ns) | 480.000 ns (IQR 0.000 ns) | 55.980 μs (IQR 354.750 ns) | 5.666 ms (IQR 48.039 μs) | 150.000 ns (IQR 10.000 ns) | 500.000 ns (IQR 10.000 ns) | 63.150 μs (IQR 3.263 μs) | 6.874 ms (IQR 47.719 μs) | 
+| BasicInterpolators | 70.000 ns (IQR 10.000 ns) | 190.000 ns (IQR 0.000 ns) | 28.160 μs (IQR 695.000 ns) | 6.444 ms (IQR 72.182 μs) | 70.000 ns (IQR 0.000 ns) | 240.000 ns (IQR 10.000 ns) | 69.590 μs (IQR 4.885 μs) | 10.042 ms (IQR 149.286 μs) | 70.000 ns (IQR 10.000 ns) | 300.000 ns (IQR 0.000 ns) | 110.244 μs (IQR 3.438 μs) | 13.575 ms (IQR 158.219 μs) | 80.000 ns (IQR 0.000 ns) | 360.000 ns (IQR 0.000 ns) | 172.224 μs (IQR 7.392 μs) | 19.794 ms (IQR 117.482 μs) | 
+| Dierckx (k=3) | 150.000 ns (IQR 10.000 ns) | 1.260 μs (IQR 20.000 ns) | 134.564 μs (IQR 305.000 ns) | 13.506 ms (IQR 43.390 μs) | 280.000 ns (IQR 10.000 ns) | 3.950 μs (IQR 10.000 ns) | 412.066 μs (IQR 282.500 ns) | 41.346 ms (IQR 455.686 μs) | 1.490 μs (IQR 0.000 ns) | 30.060 μs (IQR 30.000 ns) | 3.247 ms (IQR 47.519 μs) | 323.084 ms (IQR 648.144 μs) | 13.470 μs (IQR 80.000 ns) | 291.452 μs (IQR 1.265 μs) | 31.720 ms (IQR 238.153 μs) | 3.151 s (IQR 0.000 ns) | 
+| Interpolations (uniform) | 90.000 ns (IQR 10.000 ns) | 270.000 ns (IQR 10.000 ns) | 20.459 μs (IQR 10.000 ns) | 2.048 ms (IQR 8.437 μs) | 80.000 ns (IQR 10.000 ns) | 260.000 ns (IQR 10.000 ns) | 20.440 μs (IQR 52.500 ns) | 2.047 ms (IQR 13.848 μs) | 90.000 ns (IQR 10.000 ns) | 270.000 ns (IQR 0.000 ns) | 20.430 μs (IQR 20.000 ns) | 2.049 ms (IQR 31.699 μs) | 90.000 ns (IQR 10.000 ns) | 270.000 ns (IQR 0.000 ns) | 20.420 μs (IQR 20.000 ns) | 2.061 ms (IQR 28.078 μs) | 
+
+### Linear
+
+| Library | n=100,m=1 | n=100,m=10 | n=100,m=1000 | n=100,m=100000 | n=1000,m=1 | n=1000,m=10 | n=1000,m=1000 | n=1000,m=100000 | n=10000,m=1 | n=10000,m=10 | n=10000,m=1000 | n=10000,m=100000 | n=100000,m=1 | n=100000,m=10 | n=100000,m=1000 | n=100000,m=100000 | 
+|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
+| DataInterpolations | 130.000 ns (IQR 0.000 ns) | 520.000 ns (IQR 10.000 ns) | 55.089 μs (IQR 111.500 ns) | 5.582 ms (IQR 35.069 μs) | 120.000 ns (IQR 0.000 ns) | 510.000 ns (IQR 10.000 ns) | 55.030 μs (IQR 172.500 ns) | 5.565 ms (IQR 31.740 μs) | 130.000 ns (IQR 10.000 ns) | 480.000 ns (IQR 0.000 ns) | 56.074 μs (IQR 649.500 ns) | 5.687 ms (IQR 50.330 μs) | 130.000 ns (IQR 10.000 ns) | 480.000 ns (IQR 0.000 ns) | 58.300 μs (IQR 568.500 ns) | 6.744 ms (IQR 64.104 μs) | 
+| BasicInterpolators | 60.000 ns (IQR 0.000 ns) | 180.000 ns (IQR 10.000 ns) | 29.580 μs (IQR 1.822 μs) | 6.435 ms (IQR 41.382 μs) | 60.000 ns (IQR 10.000 ns) | 230.000 ns (IQR 0.000 ns) | 64.855 μs (IQR 3.784 μs) | 9.784 ms (IQR 57.275 μs) | 70.000 ns (IQR 0.000 ns) | 300.000 ns (IQR 10.000 ns) | 105.934 μs (IQR 1.353 μs) | 13.251 ms (IQR 76.569 μs) | 80.000 ns (IQR 10.000 ns) | 360.000 ns (IQR 10.000 ns) | 167.988 μs (IQR 8.889 μs) | 19.198 ms (IQR 179.439 μs) | 
+| Dierckx (k=1) | 110.000 ns (IQR 0.000 ns) | 880.000 ns (IQR 0.000 ns) | 103.619 μs (IQR 592.500 ns) | 10.349 ms (IQR 87.979 μs) | 250.000 ns (IQR 0.000 ns) | 3.600 μs (IQR 10.000 ns) | 377.267 μs (IQR 260.250 ns) | 37.624 ms (IQR 375.581 μs) | 1.450 μs (IQR 10.000 ns) | 29.650 μs (IQR 23.250 ns) | 3.191 ms (IQR 13.440 μs) | 318.772 ms (IQR 307.167 μs) | 13.470 μs (IQR 40.000 ns) | 291.407 μs (IQR 310.000 ns) | 31.660 ms (IQR 145.164 μs) | 3.181 s (IQR 0.000 ns) | 
+| Interpolations (gridded) | 70.000 ns (IQR 2.500 ns) | 230.000 ns (IQR 10.000 ns) | 21.320 μs (IQR 824.250 ns) | 6.593 ms (IQR 59.599 μs) | 70.000 ns (IQR 10.000 ns) | 290.000 ns (IQR 0.000 ns) | 57.594 μs (IQR 7.278 μs) | 10.134 ms (IQR 55.693 μs) | 100.000 ns (IQR 20.000 ns) | 350.000 ns (IQR 2.500 ns) | 101.449 μs (IQR 5.872 μs) | 13.761 ms (IQR 140.448 μs) | 90.000 ns (IQR 0.000 ns) | 400.000 ns (IQR 10.000 ns) | 166.308 μs (IQR 6.663 μs) | 19.858 ms (IQR 70.962 μs) | 
+| Interpolations (uniform) | 70.000 ns (IQR 10.000 ns) | 120.000 ns (IQR 10.000 ns) | 6.560 μs (IQR 40.000 ns) | 655.544 μs (IQR 9.552 μs) | 60.000 ns (IQR 0.000 ns) | 120.000 ns (IQR 0.000 ns) | 6.630 μs (IQR 11.000 ns) | 655.564 μs (IQR 8.735 μs) | 70.000 ns (IQR 10.000 ns) | 120.000 ns (IQR 0.000 ns) | 6.889 μs (IQR 10.000 ns) | 683.948 μs (IQR 4.087 μs) | 70.000 ns (IQR 10.000 ns) | 120.000 ns (IQR 0.000 ns) | 7.160 μs (IQR 10.000 ns) | 752.648 μs (IQR 1.765 μs) | 
+
+### MonotoneCubic
+
+| Library | n=100,m=1 | n=100,m=10 | n=100,m=1000 | n=100,m=100000 | n=1000,m=1 | n=1000,m=10 | n=1000,m=1000 | n=1000,m=100000 | n=10000,m=1 | n=10000,m=10 | n=10000,m=1000 | n=10000,m=100000 | n=100000,m=1 | n=100000,m=10 | n=100000,m=1000 | n=100000,m=100000 | 
+|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
+| DataInterpolations (CubicHermite) | 130.000 ns (IQR 10.000 ns) | 530.000 ns (IQR 0.000 ns) | 52.569 μs (IQR 80.000 ns) | 5.297 ms (IQR 17.295 μs) | 130.000 ns (IQR 10.000 ns) | 530.000 ns (IQR 10.000 ns) | 53.119 μs (IQR 119.500 ns) | 5.326 ms (IQR 26.192 μs) | 140.000 ns (IQR 10.000 ns) | 520.000 ns (IQR 10.000 ns) | 57.039 μs (IQR 395.000 ns) | 5.697 ms (IQR 20.677 μs) | 150.000 ns (IQR 0.000 ns) | 540.000 ns (IQR 10.000 ns) | 61.514 μs (IQR 244.750 ns) | 7.278 ms (IQR 31.449 μs) | 
+| PCHIPInterpolation | 80.000 ns (IQR 10.000 ns) | 240.000 ns (IQR 10.000 ns) | 24.865 μs (IQR 1.385 μs) | 6.407 ms (IQR 40.035 μs) | 100.000 ns (IQR 20.000 ns) | 340.000 ns (IQR 10.000 ns) | 65.279 μs (IQR 569.000 ns) | 9.842 ms (IQR 42.269 μs) | 90.000 ns (IQR 10.000 ns) | 440.000 ns (IQR 0.000 ns) | 117.314 μs (IQR 3.672 μs) | 14.126 ms (IQR 36.737 μs) | 110.000 ns (IQR 10.000 ns) | 480.000 ns (IQR 10.000 ns) | 182.258 μs (IQR 4.223 μs) | 20.388 ms (IQR 38.910 μs) | 
+
+### QuadraticSpline
+
+| Library | n=100,m=1 | n=100,m=10 | n=100,m=1000 | n=100,m=100000 | n=1000,m=1 | n=1000,m=10 | n=1000,m=1000 | n=1000,m=100000 | n=10000,m=1 | n=10000,m=10 | n=10000,m=1000 | n=10000,m=100000 | n=100000,m=1 | n=100000,m=10 | n=100000,m=1000 | n=100000,m=100000 | 
+|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
+| DataInterpolations | 230.000 ns (IQR 10.000 ns) | 1.650 μs (IQR 10.000 ns) | 169.573 μs (IQR 1.357 μs) | 17.094 ms (IQR 49.515 μs) | 540.000 ns (IQR 10.000 ns) | 7.080 μs (IQR 10.000 ns) | 750.153 μs (IQR 7.195 μs) | 74.773 ms (IQR 70.109 μs) | 3.630 μs (IQR 22.250 ns) | 62.340 μs (IQR 43.250 ns) | 6.627 ms (IQR 25.269 μs) | 669.475 ms (IQR 0.000 ns) | 39.715 μs (IQR 720.000 ns) | 663.894 μs (IQR 3.838 μs) | 70.311 ms (IQR 31.738 μs) | 7.058 s (IQR 0.000 ns) | 
+| Dierckx (k=2) | 130.000 ns (IQR 0.000 ns) | 1.060 μs (IQR 0.000 ns) | 116.774 μs (IQR 711.750 ns) | 11.700 ms (IQR 35.465 μs) | 270.000 ns (IQR 10.000 ns) | 3.790 μs (IQR 10.000 ns) | 394.467 μs (IQR 301.750 ns) | 39.408 ms (IQR 62.060 μs) | 1.480 μs (IQR 2.500 ns) | 29.880 μs (IQR 30.000 ns) | 3.209 ms (IQR 5.805 μs) | 320.457 ms (IQR 632.470 μs) | 13.500 μs (IQR 50.000 ns) | 291.127 μs (IQR 298.500 ns) | 31.489 ms (IQR 130.091 μs) | 3.195 s (IQR 0.000 ns) | 
+
+## Chained ODE-style
+
+Sequential `for x in tt; A(x); end` over a monotone sequence. (knot pattern = uniform)
+
+### Akima
+
+| Library | n=100,m=1000 | n=1000,m=1000 | n=10000,m=1000 | n=100000,m=1000 | 
+|---|---|---|---|---|
+| DataInterpolations | 40.720 μs (IQR 21.000 ns) | 47.709 μs (IQR 51.000 ns) | 47.785 μs (IQR 129.250 ns) | 63.300 μs (IQR 381.500 ns) | 
+
+### CubicSpline
+
+| Library | n=100,m=1000 | n=1000,m=1000 | n=10000,m=1000 | n=100000,m=1000 | 
+|---|---|---|---|---|
+| DataInterpolations | 46.169 μs (IQR 20.000 ns) | 52.069 μs (IQR 350.000 ns) | 52.645 μs (IQR 225.500 ns) | 69.550 μs (IQR 362.500 ns) | 
+| BasicInterpolators | 16.989 μs (IQR 459.250 ns) | 47.639 μs (IQR 1.077 μs) | 86.939 μs (IQR 2.837 μs) | 136.684 μs (IQR 2.812 μs) | 
+| Dierckx (k=3) | 122.399 μs (IQR 52.500 ns) | 409.806 μs (IQR 50.000 ns) | 3.212 ms (IQR 2.620 μs) | 31.457 ms (IQR 222.590 μs) | 
+| Interpolations (uniform) | 27.750 μs (IQR 600.000 ns) | 27.749 μs (IQR 499.250 ns) | 27.750 μs (IQR 1.179 μs) | 27.750 μs (IQR 440.000 ns) | 
+
+### Linear
+
+| Library | n=100,m=1000 | n=1000,m=1000 | n=10000,m=1000 | n=100000,m=1000 | 
+|---|---|---|---|---|
+| DataInterpolations | 42.920 μs (IQR 10.000 ns) | 49.549 μs (IQR 130.250 ns) | 50.259 μs (IQR 159.250 ns) | 55.679 μs (IQR 428.000 ns) | 
+| BasicInterpolators | 17.259 μs (IQR 92.500 ns) | 44.764 μs (IQR 3.072 μs) | 82.629 μs (IQR 2.270 μs) | 132.393 μs (IQR 2.408 μs) | 
+| Dierckx (k=1) | 87.039 μs (IQR 70.000 ns) | 374.796 μs (IQR 415.500 ns) | 3.199 ms (IQR 48.275 μs) | 31.242 ms (IQR 56.158 μs) | 
+| Interpolations (gridded) | 23.920 μs (IQR 449.750 ns) | 58.344 μs (IQR 2.035 μs) | 87.894 μs (IQR 3.572 μs) | 141.208 μs (IQR 3.995 μs) | 
+| Interpolations (uniform) | 23.050 μs (IQR 21.000 ns) | 23.060 μs (IQR 30.000 ns) | 23.040 μs (IQR 50.000 ns) | 23.129 μs (IQR 40.000 ns) | 
+
+### MonotoneCubic
+
+| Library | n=100,m=1000 | n=1000,m=1000 | n=10000,m=1000 | n=100000,m=1000 | 
+|---|---|---|---|---|
+| DataInterpolations (CubicHermite) | 50.009 μs (IQR 30.000 ns) | 54.480 μs (IQR 109.000 ns) | 53.984 μs (IQR 110.000 ns) | 71.909 μs (IQR 809.250 ns) | 
+| PCHIPInterpolation | 25.240 μs (IQR 300.000 ns) | 50.559 μs (IQR 934.000 ns) | 93.234 μs (IQR 1.728 μs) | 148.724 μs (IQR 7.090 μs) | 
+
+### QuadraticSpline
+
+| Library | n=100,m=1000 | n=1000,m=1000 | n=10000,m=1000 | n=100000,m=1000 | 
+|---|---|---|---|---|
+| DataInterpolations | 163.768 μs (IQR 173.250 ns) | 743.168 μs (IQR 397.500 ns) | 6.613 ms (IQR 60.383 μs) | 70.305 ms (IQR 457.841 μs) | 
+| Dierckx (k=2) | 104.904 μs (IQR 220.000 ns) | 393.182 μs (IQR 351.000 ns) | 3.190 ms (IQR 1.820 μs) | 31.236 ms (IQR 63.944 μs) | 
+
+## Reproducer
+
+Bench script: `bench/cross_library_comparison.jl`
+
+Bench Project.toml: `bench/Project.toml` (devs DI from `..`).
+
+To rerun:
+```bash
+cd /home/crackauc/sandbox/tmp_20260515_091703_4914/DataInterpolations.jl
+git checkout fff-strategy-batched-evals
+julia +1.11 --project=bench bench/cross_library_comparison.jl
+```
+

From 4abc69a73b3393b5f5d62744899dd7bfe8fe820b Mon Sep 17 00:00:00 2001
From: ChrisRackauckas-Claude <accounts@chrisrackauckas.com>
Date: Thu, 21 May 2026 11:41:39 -0400
Subject: [PATCH 02/24] Drop the legacy linear_lookup / seems_linear /
 looks_linear machinery

`SearchProperties` (added per-cache in the previous commit) already runs
the same uniformity probe, so the parallel DI implementation is now pure
duplication. Removes:

  - `linear_lookup::Bool` field on every interpolation cache. The
    type-parameter list shrinks accordingly.
  - `seems_linear(assume_linear_t, t)` / `looks_linear(t; threshold)` in
    `interpolation_utils.jl`.
  - The `assume_linear_t` keyword from every constructor. (Breaking, but
    the PR is already a major refactor; `SearchProperties` runs the same
    probe automatically at construction with a 1e-3 default that matches
    FFF's `Auto` tolerance, and approximate-uniform vectors couldn't
    benefit from `UniformStep` anyway since that path needs exact-uniform
    spacing.)

`test/derivative_tests.jl`'s `func.iguesser.linear_lookup` check (which
gated the per-type chained-lookup invariant assertion to non-uniform
data) is rewritten as `!func.t_props.is_uniform`, the FFF-side
equivalent.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
Co-Authored-By: Chris Rackauckas <accounts@chrisrackauckas.com>
---
 src/interpolation_caches.jl      | 227 +++++++++----------------------
 src/interpolation_utils.jl       |  23 ----
 test/Methods/derivative_tests.jl |   2 +-
 3 files changed, 63 insertions(+), 189 deletions(-)

diff --git a/src/interpolation_caches.jl b/src/interpolation_caches.jl
index 0d12c3a6..107dfc7f 100644
--- a/src/interpolation_caches.jl
+++ b/src/interpolation_caches.jl
@@ -22,10 +22,6 @@ Extrapolation extends the last linear polynomial on each side.
     the possible options. This keyword is ignored if `extrapolation != Extrapolation.none`.
   - `cache_parameters`: precompute parameters at initialization for faster interpolation
     computations. Note: if activated, `u` and `t` should not be modified. Defaults to `false`.
-  - `assume_linear_t`: boolean value to specify a faster index lookup behavior for
-    evenly-distributed abscissae. Alternatively, a numerical threshold may be specified
-    for a test based on the normalized standard deviation of the difference with respect
-    to the straight line (see [`looks_linear`](@ref)). Defaults to 1e-2.
 """
 struct LinearInterpolation{uType, tType, IType, pType, T, propsType} <:
     AbstractInterpolation{T}
@@ -38,19 +34,17 @@ struct LinearInterpolation{uType, tType, IType, pType, T, propsType} <:
     iguesser::Guesser{tType}
     t_props::propsType
     cache_parameters::Bool
-    linear_lookup::Bool
     function LinearInterpolation(
             u, t, I, p, extrapolation_left, extrapolation_right,
-            cache_parameters, assume_linear_t
+            cache_parameters
         )
-        linear_lookup = seems_linear(assume_linear_t, t)
         t_props = FindFirstFunctions.SearchProperties(t)
         return new{
             typeof(u), typeof(t), typeof(I), typeof(p.slope),
             eltype(u), typeof(t_props),
         }(
             u, t, I, p, extrapolation_left, extrapolation_right,
-            Guesser(t), t_props, cache_parameters, linear_lookup
+            Guesser(t), t_props, cache_parameters
         )
     end
 end
@@ -58,7 +52,7 @@ end
 function LinearInterpolation(
         u, t; extrapolation::ExtrapolationType.T = ExtrapolationType.None,
         extrapolation_left::ExtrapolationType.T = ExtrapolationType.None,
-        extrapolation_right::ExtrapolationType.T = ExtrapolationType.None, cache_parameters = false, assume_linear_t = 1.0e-2
+        extrapolation_right::ExtrapolationType.T = ExtrapolationType.None, cache_parameters = false
     )
     extrapolation_left,
         extrapolation_right = munge_extrapolation(
@@ -68,12 +62,12 @@ function LinearInterpolation(
     p = LinearParameterCache(u, t, cache_parameters)
     A = LinearInterpolation(
         u, t, nothing, p, extrapolation_left,
-        extrapolation_right, cache_parameters, assume_linear_t
+        extrapolation_right, cache_parameters
     )
     I = cumulative_integral(A, cache_parameters)
     return LinearInterpolation(
         u, t, I, p, extrapolation_left, extrapolation_right,
-        cache_parameters, assume_linear_t
+        cache_parameters
     )
 end
 
@@ -101,10 +95,6 @@ Extrapolation extends the last quadratic polynomial on each side.
   - `extrapolation_right`: The extrapolation type applied right of the data. See `extrapolation` for
     the possible options. This keyword is ignored if `extrapolation != Extrapolation.none`.
   - `cache_parameters`: precompute parameters at initialization for faster interpolation computations. Note: if activated, `u` and `t` should not be modified. Defaults to `false`.
-  - `assume_linear_t`: boolean value to specify a faster index lookup behaviour for
-    evenly-distributed abscissae. Alternatively, a numerical threshold may be specified
-    for a test based on the normalized standard deviation of the difference with respect
-    to the straight line (see [`looks_linear`](@ref)). Defaults to 1e-2.
 """
 struct QuadraticInterpolation{uType, tType, IType, pType, T, propsType} <:
     AbstractInterpolation{T}
@@ -118,21 +108,19 @@ struct QuadraticInterpolation{uType, tType, IType, pType, T, propsType} <:
     iguesser::Guesser{tType}
     t_props::propsType
     cache_parameters::Bool
-    linear_lookup::Bool
     function QuadraticInterpolation(
             u, t, I, p, mode, extrapolation_left,
-            extrapolation_right, cache_parameters, assume_linear_t
+            extrapolation_right, cache_parameters
         )
         mode ∈ (:Forward, :Backward) ||
             error("mode should be :Forward or :Backward for QuadraticInterpolation")
-        linear_lookup = seems_linear(assume_linear_t, t)
         t_props = FindFirstFunctions.SearchProperties(t)
         return new{
             typeof(u), typeof(t), typeof(I), typeof(p.α),
             eltype(u), typeof(t_props),
         }(
             u, t, I, p, mode, extrapolation_left, extrapolation_right,
-            Guesser(t), t_props, cache_parameters, linear_lookup
+            Guesser(t), t_props, cache_parameters
         )
     end
 end
@@ -140,23 +128,22 @@ end
 function QuadraticInterpolation(
         u, t, mode; extrapolation::ExtrapolationType.T = ExtrapolationType.None,
         extrapolation_left::ExtrapolationType.T = ExtrapolationType.None,
-        extrapolation_right::ExtrapolationType.T = ExtrapolationType.None, cache_parameters = false, assume_linear_t = 1.0e-2
+        extrapolation_right::ExtrapolationType.T = ExtrapolationType.None, cache_parameters = false
     )
     extrapolation_left,
         extrapolation_right = munge_extrapolation(
         extrapolation, extrapolation_left, extrapolation_right
     )
     u, t = munge_data(u, t)
-    linear_lookup = seems_linear(assume_linear_t, t)
     p = QuadraticParameterCache(u, t, cache_parameters, mode)
     A = QuadraticInterpolation(
         u, t, nothing, p, mode, extrapolation_left,
-        extrapolation_right, cache_parameters, linear_lookup
+        extrapolation_right, cache_parameters
     )
     I = cumulative_integral(A, cache_parameters)
     return QuadraticInterpolation(
         u, t, I, p, mode, extrapolation_left,
-        extrapolation_right, cache_parameters, linear_lookup
+        extrapolation_right, cache_parameters
     )
 end
 
@@ -260,10 +247,6 @@ Extrapolation extends the last cubic polynomial on each side.
   - `extrapolation_right`: The extrapolation type applied right of the data. See `extrapolation` for
     the possible options. This keyword is ignored if `extrapolation != Extrapolation.none`.
   - `cache_parameters`: precompute parameters at initialization for faster interpolation computations. Note: if activated, `u` and `t` should not be modified. Defaults to `false`.
-  - `assume_linear_t`: boolean value to specify a faster index lookup behaviour for
-    evenly-distributed abscissae. Alternatively, a numerical threshold may be specified
-    for a test based on the normalized standard deviation of the difference with respect
-    to the straight line (see [`looks_linear`](@ref)). Defaults to 1e-2.
 """
 struct AkimaInterpolation{uType, tType, IType, bType, cType, dType, T, propsType} <:
     AbstractInterpolation{T}
@@ -278,12 +261,10 @@ struct AkimaInterpolation{uType, tType, IType, bType, cType, dType, T, propsType
     iguesser::Guesser{tType}
     t_props::propsType
     cache_parameters::Bool
-    linear_lookup::Bool
     function AkimaInterpolation(
             u, t, I, b, c, d, extrapolation_left,
-            extrapolation_right, cache_parameters, assume_linear_t
+            extrapolation_right, cache_parameters
         )
-        linear_lookup = seems_linear(assume_linear_t, t)
         t_props = FindFirstFunctions.SearchProperties(t)
         return new{
             typeof(u), typeof(t), typeof(I), typeof(b), typeof(c),
@@ -300,7 +281,7 @@ struct AkimaInterpolation{uType, tType, IType, bType, cType, dType, T, propsType
             Guesser(t),
             t_props,
             cache_parameters,
-            linear_lookup
+
         )
     end
 end
@@ -369,14 +350,13 @@ function AkimaInterpolation(
         u, t; modified::Bool = false,
         extrapolation::ExtrapolationType.T = ExtrapolationType.None,
         extrapolation_left::ExtrapolationType.T = ExtrapolationType.None,
-        extrapolation_right::ExtrapolationType.T = ExtrapolationType.None, cache_parameters = false, assume_linear_t = 1.0e-2
+        extrapolation_right::ExtrapolationType.T = ExtrapolationType.None, cache_parameters = false
     )
     extrapolation_left,
         extrapolation_right = munge_extrapolation(
         extrapolation, extrapolation_left, extrapolation_right
     )
     u, t = munge_data(u, t)
-    linear_lookup = seems_linear(assume_linear_t, t)
     n = length(t)
     T = eltype(u)
     b = Vector{T}(undef, n)
@@ -386,12 +366,12 @@ function AkimaInterpolation(
 
     A = AkimaInterpolation(
         u, t, nothing, b, c, d, extrapolation_left,
-        extrapolation_right, cache_parameters, linear_lookup
+        extrapolation_right, cache_parameters
     )
     I = cumulative_integral(A, cache_parameters)
     return AkimaInterpolation(
         u, t, I, b, c, d, extrapolation_left,
-        extrapolation_right, cache_parameters, linear_lookup
+        extrapolation_right, cache_parameters
     )
 end
 
@@ -419,10 +399,6 @@ Extrapolation extends the last constant polynomial at the end points on each sid
   - `extrapolation_right`: The extrapolation type applied right of the data. See `extrapolation` for
     the possible options. This keyword is ignored if `extrapolation != Extrapolation.none`.
   - `cache_parameters`: precompute parameters at initialization for faster interpolation computations. Note: if activated, `u` and `t` should not be modified. Defaults to `false`.
-  - `assume_linear_t`: boolean value to specify a faster index lookup behaviour for
-    evenly-distributed abscissae. Alternatively, a numerical threshold may be specified
-    for a test based on the normalized standard deviation of the difference with respect
-    to the straight line (see [`looks_linear`](@ref)). Defaults to 1e-2.
 """
 struct ConstantInterpolation{uType, tType, IType, T, propsType} <:
     AbstractInterpolation{T}
@@ -436,16 +412,14 @@ struct ConstantInterpolation{uType, tType, IType, T, propsType} <:
     iguesser::Guesser{tType}
     t_props::propsType
     cache_parameters::Bool
-    linear_lookup::Bool
     function ConstantInterpolation(
             u, t, I, dir, extrapolation_left, extrapolation_right,
-            cache_parameters, assume_linear_t
+            cache_parameters
         )
-        linear_lookup = seems_linear(assume_linear_t, t)
         t_props = FindFirstFunctions.SearchProperties(t)
         return new{typeof(u), typeof(t), typeof(I), eltype(u), typeof(t_props)}(
             u, t, I, nothing, dir, extrapolation_left, extrapolation_right,
-            Guesser(t), t_props, cache_parameters, linear_lookup
+            Guesser(t), t_props, cache_parameters
         )
     end
 end
@@ -454,7 +428,7 @@ function ConstantInterpolation(
         u, t; dir = :left, extrapolation::ExtrapolationType.T = ExtrapolationType.None,
         extrapolation_left::ExtrapolationType.T = ExtrapolationType.None,
         extrapolation_right::ExtrapolationType.T = ExtrapolationType.None,
-        cache_parameters = false, assume_linear_t = 1.0e-2
+        cache_parameters = false
     )
     extrapolation_left,
         extrapolation_right = munge_extrapolation(
@@ -463,18 +437,18 @@ function ConstantInterpolation(
     u, t = munge_data(u, t)
     A = ConstantInterpolation(
         u, t, nothing, dir, extrapolation_left,
-        extrapolation_right, cache_parameters, assume_linear_t
+        extrapolation_right, cache_parameters
     )
     I = cumulative_integral(A, cache_parameters)
     return ConstantInterpolation(
         u, t, I, dir, extrapolation_left, extrapolation_right,
-        cache_parameters, assume_linear_t
+        cache_parameters
     )
 end
 
 """
     SmoothedConstantInterpolation(u, t; d_max = Inf, extrapolate = false,
-        cache_parameters = false, assume_linear_t = 1e-2)
+        cache_parameters = false)
 
 It is a method for interpolating constantly with forward fill, with smoothing around the
 value transitions to make the curve continuously differentiable while the integral never
@@ -498,10 +472,6 @@ except when using extrapolation types `Constant` or `Extension`.
   - `extrapolation_right`: The extrapolation type applied right of the data. See `extrapolation` for
     the possible options. This keyword is ignored if `extrapolation != Extrapolation.none`.
   - `cache_parameters`: precompute parameters at initialization for faster interpolation computations. Note: if activated, `u` and `t` should not be modified. Defaults to `false`.
-  - `assume_linear_t`: boolean value to specify a faster index lookup behavior for
-    evenly-distributed abscissae. Alternatively, a numerical threshold may be specified
-    for a test based on the normalized standard deviation of the difference with respect
-    to the straight line (see [`looks_linear`](@ref)). Defaults to 1e-2.
 """
 struct SmoothedConstantInterpolation{
         uType, tType, IType, dType, cType, dmaxType, T, propsType,
@@ -517,19 +487,17 @@ struct SmoothedConstantInterpolation{
     iguesser::Guesser{tType}
     t_props::propsType
     cache_parameters::Bool
-    linear_lookup::Bool
     function SmoothedConstantInterpolation(
             u, t, I, p, d_max, extrapolation_left,
-            extrapolation_right, cache_parameters, assume_linear_t
+            extrapolation_right, cache_parameters
         )
-        linear_lookup = seems_linear(assume_linear_t, t)
         t_props = FindFirstFunctions.SearchProperties(t)
         return new{
             typeof(u), typeof(t), typeof(I), typeof(p.d),
             typeof(p.c), typeof(d_max), eltype(u), typeof(t_props),
         }(
             u, t, I, p, d_max, extrapolation_left, extrapolation_right,
-            Guesser(t), t_props, cache_parameters, linear_lookup
+            Guesser(t), t_props, cache_parameters
         )
     end
 end
@@ -538,7 +506,7 @@ function SmoothedConstantInterpolation(
         u, t; d_max = Inf, extrapolation::ExtrapolationType.T = ExtrapolationType.None,
         extrapolation_left::ExtrapolationType.T = ExtrapolationType.None,
         extrapolation_right::ExtrapolationType.T = ExtrapolationType.None,
-        cache_parameters = false, assume_linear_t = 1.0e-2
+        cache_parameters = false
     )
     extrapolation_left,
         extrapolation_right = munge_extrapolation(
@@ -550,12 +518,12 @@ function SmoothedConstantInterpolation(
     )
     A = SmoothedConstantInterpolation(
         u, t, nothing, p, d_max, extrapolation_left,
-        extrapolation_right, cache_parameters, assume_linear_t
+        extrapolation_right, cache_parameters
     )
     I = cumulative_integral(A, cache_parameters)
     return SmoothedConstantInterpolation(
         u, t, I, p, d_max, extrapolation_left,
-        extrapolation_right, cache_parameters, assume_linear_t
+        extrapolation_right, cache_parameters
     )
 end
 
@@ -581,10 +549,6 @@ Extrapolation extends the last quadratic polynomial on each side.
   - `extrapolation_right`: The extrapolation type applied right of the data. See `extrapolation` for
     the possible options. This keyword is ignored if `extrapolation != Extrapolation.none`.
   - `cache_parameters`: precompute parameters at initialization for faster interpolation computations. Note: if activated, `u` and `t` should not be modified. Defaults to `false`.
-  - `assume_linear_t`: boolean value to specify a faster index lookup behaviour for
-    evenly-distributed abscissae. Alternatively, a numerical threshold may be specified
-    for a test based on the normalized standard deviation of the difference with respect
-    to the straight line (see [`looks_linear`](@ref)). Defaults to 1e-2.
 """
 struct QuadraticSpline{uType, tType, IType, pType, kType, cType, scType, T, propsType} <:
     AbstractInterpolation{T}
@@ -600,12 +564,10 @@ struct QuadraticSpline{uType, tType, IType, pType, kType, cType, scType, T, prop
     iguesser::Guesser{tType}
     t_props::propsType
     cache_parameters::Bool
-    linear_lookup::Bool
     function QuadraticSpline(
             u, t, I, p, k, c, sc, extrapolation_left,
-            extrapolation_right, cache_parameters, assume_linear_t
+            extrapolation_right, cache_parameters
         )
-        linear_lookup = seems_linear(assume_linear_t, t)
         t_props = FindFirstFunctions.SearchProperties(t)
         return new{
             typeof(u), typeof(t), typeof(I), typeof(p.α), typeof(k),
@@ -623,7 +585,7 @@ struct QuadraticSpline{uType, tType, IType, pType, kType, cType, scType, T, prop
             Guesser(t),
             t_props,
             cache_parameters,
-            linear_lookup
+
         )
     end
 end
@@ -632,7 +594,7 @@ function QuadraticSpline(
         u::AbstractVector{<:Number}, t; extrapolation::ExtrapolationType.T = ExtrapolationType.None,
         extrapolation_left::ExtrapolationType.T = ExtrapolationType.None,
         extrapolation_right::ExtrapolationType.T = ExtrapolationType.None,
-        cache_parameters = false, assume_linear_t = 1.0e-2
+        cache_parameters = false
     )
     extrapolation_left,
         extrapolation_right = munge_extrapolation(
@@ -649,12 +611,12 @@ function QuadraticSpline(
     p = QuadraticSplineParameterCache(u, t, k, c, sc, cache_parameters)
     A = QuadraticSpline(
         u, t, nothing, p, k, c, sc, extrapolation_left,
-        extrapolation_right, cache_parameters, assume_linear_t
+        extrapolation_right, cache_parameters
     )
     I = cumulative_integral(A, cache_parameters)
     return QuadraticSpline(
         u, t, I, p, k, c, sc, extrapolation_left,
-        extrapolation_right, cache_parameters, assume_linear_t
+        extrapolation_right, cache_parameters
     )
 end
 
@@ -662,7 +624,6 @@ function QuadraticSpline(
         u::AbstractVector, t; extrapolation::ExtrapolationType.T = ExtrapolationType.None,
         extrapolation_left::ExtrapolationType.T = ExtrapolationType.None,
         extrapolation_right::ExtrapolationType.T = ExtrapolationType.None, cache_parameters = false,
-        assume_linear_t = 1.0e-2
     )
     extrapolation_left,
         extrapolation_right = munge_extrapolation(
@@ -689,12 +650,12 @@ function QuadraticSpline(
     p = QuadraticSplineParameterCache(u, t, k, c, sc, cache_parameters)
     A = QuadraticSpline(
         u, t, nothing, p, k, c, sc, extrapolation_left,
-        extrapolation_right, cache_parameters, assume_linear_t
+        extrapolation_right, cache_parameters
     )
     I = cumulative_integral(A, cache_parameters)
     return QuadraticSpline(
         u, t, I, p, k, c, sc, extrapolation_left,
-        extrapolation_right, cache_parameters, assume_linear_t
+        extrapolation_right, cache_parameters
     )
 end
 
@@ -720,10 +681,6 @@ Second derivative on both ends are zero, which are also called "natural" boundar
   - `extrapolation_right`: The extrapolation type applied right of the data. See `extrapolation` for
     the possible options. This keyword is ignored if `extrapolation != Extrapolation.none`.
   - `cache_parameters`: precompute parameters at initialization for faster interpolation computations. Note: if activated, `u` and `t` should not be modified. Defaults to `false`.
-  - `assume_linear_t`: boolean value to specify a faster index lookup behaviour for
-    evenly-distributed abscissae. Alternatively, a numerical threshold may be specified
-    for a test based on the normalized standard deviation of the difference with respect
-    to the straight line (see [`looks_linear`](@ref)). Defaults to 1e-2.
 """
 struct CubicSpline{uType, tType, IType, pType, hType, zType, T, propsType} <:
     AbstractInterpolation{T}
@@ -738,12 +695,10 @@ struct CubicSpline{uType, tType, IType, pType, hType, zType, T, propsType} <:
     iguesser::Guesser{tType}
     t_props::propsType
     cache_parameters::Bool
-    linear_lookup::Bool
     function CubicSpline(
             u, t, I, p, h, z, extrapolation_left,
-            extrapolation_right, cache_parameters, assume_linear_t
+            extrapolation_right, cache_parameters
         )
-        linear_lookup = seems_linear(assume_linear_t, t)
         t_props = FindFirstFunctions.SearchProperties(t)
         return new{
             typeof(u), typeof(t), typeof(I), typeof(p.c₁),
@@ -760,7 +715,7 @@ struct CubicSpline{uType, tType, IType, pType, hType, zType, T, propsType} <:
             Guesser(t),
             t_props,
             cache_parameters,
-            linear_lookup
+
         )
     end
 end
@@ -770,7 +725,6 @@ function CubicSpline(
         t; extrapolation::ExtrapolationType.T = ExtrapolationType.None,
         extrapolation_left::ExtrapolationType.T = ExtrapolationType.None,
         extrapolation_right::ExtrapolationType.T = ExtrapolationType.None, cache_parameters = false,
-        assume_linear_t = 1.0e-2
     )
     extrapolation_left,
         extrapolation_right = munge_extrapolation(
@@ -796,16 +750,15 @@ function CubicSpline(
         1:(n + 1)
     )
     z = tA \ d
-    linear_lookup = seems_linear(assume_linear_t, t)
     p = CubicSplineParameterCache(u, h, z, cache_parameters)
     A = CubicSpline(
         u, t, nothing, p, h[1:(n + 1)], z, extrapolation_left,
-        extrapolation_right, cache_parameters, linear_lookup
+        extrapolation_right, cache_parameters
     )
     I = cumulative_integral(A, cache_parameters)
     return CubicSpline(
         u, t, I, p, h[1:(n + 1)], z, extrapolation_left,
-        extrapolation_right, cache_parameters, linear_lookup
+        extrapolation_right, cache_parameters
     )
 end
 
@@ -814,7 +767,6 @@ function CubicSpline(
         t;
         extrapolation::ExtrapolationType.T = ExtrapolationType.None, extrapolation_left::ExtrapolationType.T = ExtrapolationType.None,
         extrapolation_right::ExtrapolationType.T = ExtrapolationType.None, cache_parameters = false,
-        assume_linear_t = 1.0e-2
     ) where {T, N}
     extrapolation_left,
         extrapolation_right = munge_extrapolation(
@@ -843,16 +795,15 @@ function CubicSpline(
     d_reshaped = reshape(d, prod(size(d)[1:(end - 1)]), :)
     z = (tA \ d_reshaped')'
     z = reshape(z, size(u)...)
-    linear_lookup = seems_linear(assume_linear_t, t)
     p = CubicSplineParameterCache(u, h, z, cache_parameters)
     A = CubicSpline(
         u, t, nothing, p, h[1:(n + 1)], z, extrapolation_left,
-        extrapolation_right, cache_parameters, linear_lookup
+        extrapolation_right, cache_parameters
     )
     I = cumulative_integral(A, cache_parameters)
     return CubicSpline(
         u, t, I, p, h[1:(n + 1)], z, extrapolation_left,
-        extrapolation_right, cache_parameters, linear_lookup
+        extrapolation_right, cache_parameters
     )
 end
 
@@ -860,7 +811,6 @@ function CubicSpline(
         u::AbstractVector, t; extrapolation::ExtrapolationType.T = ExtrapolationType.None,
         extrapolation_left::ExtrapolationType.T = ExtrapolationType.None,
         extrapolation_right::ExtrapolationType.T = ExtrapolationType.None, cache_parameters = false,
-        assume_linear_t = 1.0e-2
     )
     extrapolation_left,
         extrapolation_right = munge_extrapolation(
@@ -885,12 +835,12 @@ function CubicSpline(
     p = CubicSplineParameterCache(u, h, z, cache_parameters)
     A = CubicSpline(
         u, t, nothing, p, h[1:(n + 1)], z, extrapolation_left,
-        extrapolation_right, cache_parameters, assume_linear_t
+        extrapolation_right, cache_parameters
     )
     I = cumulative_integral(A, cache_parameters)
     return CubicSpline(
         u, t, I, p, h[1:(n + 1)], z, extrapolation_left,
-        extrapolation_right, cache_parameters, assume_linear_t
+        extrapolation_right, cache_parameters
     )
 end
 
@@ -918,10 +868,6 @@ Extrapolation is a constant polynomial of the end points on each side.
     the possible options. This keyword is ignored if `extrapolation != Extrapolation.none`.
   - `extrapolation_right`: The extrapolation type applied right of the data. See `extrapolation` for
     the possible options. This keyword is ignored if `extrapolation != Extrapolation.none`.
-  - `assume_linear_t`: boolean value to specify a faster index lookup behavior for
-    evenly-distributed abscissae. Alternatively, a numerical threshold may be specified
-    for a test based on the normalized standard deviation of the difference with respect
-    to the straight line (see [`looks_linear`](@ref)). Defaults to 1e-2.
 """
 struct BSplineInterpolation{uType, tType, pType, kType, cType, scType, T, propsType} <:
     AbstractInterpolation{T}
@@ -938,7 +884,6 @@ struct BSplineInterpolation{uType, tType, pType, kType, cType, scType, T, propsT
     extrapolation_right::ExtrapolationType.T
     iguesser::Guesser{tType}
     t_props::propsType
-    linear_lookup::Bool
     function BSplineInterpolation(
             u,
             t,
@@ -951,9 +896,7 @@ struct BSplineInterpolation{uType, tType, pType, kType, cType, scType, T, propsT
             knotVecType,
             extrapolation_left,
             extrapolation_right,
-            assume_linear_t
         )
-        linear_lookup = seems_linear(assume_linear_t, t)
         t_props = FindFirstFunctions.SearchProperties(t)
         return new{
             typeof(u), typeof(t), typeof(p), typeof(k),
@@ -971,8 +914,7 @@ struct BSplineInterpolation{uType, tType, pType, kType, cType, scType, T, propsT
             extrapolation_left,
             extrapolation_right,
             Guesser(t),
-            t_props,
-            linear_lookup
+            t_props
         )
     end
 end
@@ -981,7 +923,7 @@ function BSplineInterpolation(
         u::AbstractVector, t, d, pVecType, knotVecType;
         extrapolation::ExtrapolationType.T = ExtrapolationType.None,
         extrapolation_left::ExtrapolationType.T = ExtrapolationType.None,
-        extrapolation_right::ExtrapolationType.T = ExtrapolationType.None, assume_linear_t = 1.0e-2
+        extrapolation_right::ExtrapolationType.T = ExtrapolationType.None
     )
     extrapolation_left,
         extrapolation_right = munge_extrapolation(
@@ -1052,7 +994,7 @@ function BSplineInterpolation(
     sc = zeros(eltype(t), n)
     return BSplineInterpolation(
         u, t, d, p, k, c, sc, pVecType, knotVecType,
-        extrapolation_left, extrapolation_right, assume_linear_t
+        extrapolation_left, extrapolation_right
     )
 end
 
@@ -1061,7 +1003,6 @@ function BSplineInterpolation(
         extrapolation::ExtrapolationType.T = ExtrapolationType.None,
         extrapolation_left::ExtrapolationType.T = ExtrapolationType.None,
         extrapolation_right::ExtrapolationType.T = ExtrapolationType.None,
-        assume_linear_t = 1.0e-2
     )
     extrapolation_left,
         extrapolation_right = munge_extrapolation(
@@ -1135,7 +1076,7 @@ function BSplineInterpolation(
     sc = zeros(eltype(t), n)
     return BSplineInterpolation(
         u, t, d, p, k, c, sc, pVecType, knotVecType,
-        extrapolation_left, extrapolation_right, assume_linear_t
+        extrapolation_left, extrapolation_right
     )
 end
 
@@ -1165,10 +1106,6 @@ Extrapolation is a constant polynomial of the end points on each side.
     the possible options. This keyword is ignored if `extrapolation != Extrapolation.none`.
   - `extrapolation_right`: The extrapolation type applied right of the data. See `extrapolation` for
     the possible options. This keyword is ignored if `extrapolation != Extrapolation.none`.
-  - `assume_linear_t`: boolean value to specify a faster index lookup behaviour for
-    evenly-distributed abscissae. Alternatively, a numerical threshold may be specified
-    for a test based on the normalized standard deviation of the difference with respect
-    to the straight line (see [`looks_linear`](@ref)). Defaults to 1e-2.
 """
 struct BSplineApprox{uType, tType, pType, kType, cType, scType, T, propsType} <:
     AbstractInterpolation{T}
@@ -1186,7 +1123,6 @@ struct BSplineApprox{uType, tType, pType, kType, cType, scType, T, propsType} <:
     extrapolation_right::ExtrapolationType.T
     iguesser::Guesser{tType}
     t_props::propsType
-    linear_lookup::Bool
     function BSplineApprox(
             u,
             t,
@@ -1200,9 +1136,7 @@ struct BSplineApprox{uType, tType, pType, kType, cType, scType, T, propsType} <:
             knotVecType,
             extrapolation_left,
             extrapolation_right,
-            assume_linear_t
         )
-        linear_lookup = seems_linear(assume_linear_t, t)
         t_props = FindFirstFunctions.SearchProperties(t)
         return new{
             typeof(u), typeof(t), typeof(p), typeof(k),
@@ -1221,8 +1155,7 @@ struct BSplineApprox{uType, tType, pType, kType, cType, scType, T, propsType} <:
             extrapolation_left,
             extrapolation_right,
             Guesser(t),
-            t_props,
-            linear_lookup
+            t_props
         )
     end
 end
@@ -1231,7 +1164,7 @@ function BSplineApprox(
         u::AbstractVector, t, d, h, pVecType, knotVecType;
         extrapolation::ExtrapolationType.T = ExtrapolationType.None,
         extrapolation_left::ExtrapolationType.T = ExtrapolationType.None,
-        extrapolation_right::ExtrapolationType.T = ExtrapolationType.None, assume_linear_t = 1.0e-2
+        extrapolation_right::ExtrapolationType.T = ExtrapolationType.None
     )
     extrapolation_left,
         extrapolation_right = munge_extrapolation(
@@ -1323,7 +1256,7 @@ function BSplineApprox(
     sc = zeros(eltype(t), h)
     return BSplineApprox(
         u, t, d, h, p, k, c, sc, pVecType, knotVecType,
-        extrapolation_left, extrapolation_right, assume_linear_t
+        extrapolation_left, extrapolation_right
     )
 end
 
@@ -1332,7 +1265,6 @@ function BSplineApprox(
         extrapolation::ExtrapolationType.T = ExtrapolationType.None,
         extrapolation_left::ExtrapolationType.T = ExtrapolationType.None,
         extrapolation_right::ExtrapolationType.T = ExtrapolationType.None,
-        assume_linear_t = 1.0e-2
     ) where {T, N}
     extrapolation_left,
         extrapolation_right = munge_extrapolation(
@@ -1432,7 +1364,7 @@ function BSplineApprox(
     sc = zeros(eltype(t), h)
     return BSplineApprox(
         u, t, d, h, p, k, c, sc, pVecType, knotVecType,
-        extrapolation_left, extrapolation_right, assume_linear_t
+        extrapolation_left, extrapolation_right
     )
 end
 """
@@ -1457,10 +1389,6 @@ It is a Cubic Hermite interpolation, which is a piece-wise third degree polynomi
   - `extrapolation_right`: The extrapolation type applied right of the data. See `extrapolation` for
     the possible options. This keyword is ignored if `extrapolation != Extrapolation.none`.
   - `cache_parameters`: precompute parameters at initialization for faster interpolation computations. Note: if activated, `u` and `t` should not be modified. Defaults to `false`.
-  - `assume_linear_t`: boolean value to specify a faster index lookup behaviour for
-    evenly-distributed abscissae. Alternatively, a numerical threshold may be specified
-    for a test based on the normalized standard deviation of the difference with respect
-    to the straight line (see [`looks_linear`](@ref)). Defaults to 1e-2.
 """
 struct CubicHermiteSpline{uType, tType, IType, duType, pType, T, propsType} <:
     AbstractInterpolation{T}
@@ -1474,19 +1402,17 @@ struct CubicHermiteSpline{uType, tType, IType, duType, pType, T, propsType} <:
     iguesser::Guesser{tType}
     t_props::propsType
     cache_parameters::Bool
-    linear_lookup::Bool
     function CubicHermiteSpline(
             du, u, t, I, p, extrapolation_left, extrapolation_right,
-            cache_parameters, assume_linear_t
+            cache_parameters
         )
-        linear_lookup = seems_linear(assume_linear_t, t)
         t_props = FindFirstFunctions.SearchProperties(t)
         return new{
             typeof(u), typeof(t), typeof(I), typeof(du),
             typeof(p.c₁), eltype(u), typeof(t_props),
         }(
             du, u, t, I, p, extrapolation_left, extrapolation_right,
-            Guesser(t), t_props, cache_parameters, linear_lookup
+            Guesser(t), t_props, cache_parameters
         )
     end
 end
@@ -1494,7 +1420,7 @@ end
 function CubicHermiteSpline(
         du, u, t; extrapolation::ExtrapolationType.T = ExtrapolationType.None,
         extrapolation_left::ExtrapolationType.T = ExtrapolationType.None,
-        extrapolation_right::ExtrapolationType.T = ExtrapolationType.None, cache_parameters = false, assume_linear_t = 1.0e-2
+        extrapolation_right::ExtrapolationType.T = ExtrapolationType.None, cache_parameters = false
     )
     @assert length(u) == length(du) "Length of `u` is not equal to length of `du`."
     extrapolation_left,
@@ -1502,16 +1428,15 @@ function CubicHermiteSpline(
         extrapolation, extrapolation_left, extrapolation_right
     )
     u, t = munge_data(u, t)
-    linear_lookup = seems_linear(assume_linear_t, t)
     p = CubicHermiteParameterCache(du, u, t, cache_parameters)
     A = CubicHermiteSpline(
         du, u, t, nothing, p, extrapolation_left,
-        extrapolation_right, cache_parameters, linear_lookup
+        extrapolation_right, cache_parameters
     )
     I = cumulative_integral(A, cache_parameters)
     return CubicHermiteSpline(
         du, u, t, I, p, extrapolation_left,
-        extrapolation_right, cache_parameters, linear_lookup
+        extrapolation_right, cache_parameters
     )
 end
 
@@ -1538,10 +1463,6 @@ section 3.4 for more details.
   - `extrapolation_right`: The extrapolation type applied right of the data. See `extrapolation` for
     the possible options. This keyword is ignored if `extrapolation != Extrapolation.none`.
   - `cache_parameters`: precompute parameters at initialization for faster interpolation computations. Note: if activated, `u` and `t` should not be modified. Defaults to `false`.
-  - `assume_linear_t`: boolean value to specify a faster index lookup behaviour for
-    evenly-distributed abscissae. Alternatively, a numerical threshold may be specified
-    for a test based on the normalized standard deviation of the difference with respect
-    to the straight line (see [`looks_linear`](@ref)). Defaults to 1e-2.
 """
 function PCHIPInterpolation(u, t; kwargs...)
     u, t = munge_data(u, t)
@@ -1572,10 +1493,6 @@ It is a Quintic Hermite interpolation, which is a piece-wise fifth degree polyno
   - `extrapolation_right`: The extrapolation type applied right of the data. See `extrapolation` for
     the possible options. This keyword is ignored if `extrapolation != Extrapolation.none`.
   - `cache_parameters`: precompute parameters at initialization for faster interpolation computations. Note: if activated, `u` and `t` should not be modified. Defaults to `false`.
-  - `assume_linear_t`: boolean value to specify a faster index lookup behaviour for
-    evenly-distributed abscissae. Alternatively, a numerical threshold may be specified
-    for a test based on the normalized standard deviation of the difference with respect
-    to the straight line (see [`looks_linear`](@ref)). Defaults to 1e-2.
 """
 struct QuinticHermiteSpline{uType, tType, IType, duType, dduType, pType, T, propsType} <:
     AbstractInterpolation{T}
@@ -1590,19 +1507,17 @@ struct QuinticHermiteSpline{uType, tType, IType, duType, dduType, pType, T, prop
     iguesser::Guesser{tType}
     t_props::propsType
     cache_parameters::Bool
-    linear_lookup::Bool
     function QuinticHermiteSpline(
             ddu, du, u, t, I, p, extrapolation_left,
-            extrapolation_right, cache_parameters, assume_linear_t
+            extrapolation_right, cache_parameters
         )
-        linear_lookup = seems_linear(assume_linear_t, t)
         t_props = FindFirstFunctions.SearchProperties(t)
         return new{
             typeof(u), typeof(t), typeof(I), typeof(du),
             typeof(ddu), typeof(p.c₁), eltype(u), typeof(t_props),
         }(
             ddu, du, u, t, I, p, extrapolation_left, extrapolation_right,
-            Guesser(t), t_props, cache_parameters, linear_lookup
+            Guesser(t), t_props, cache_parameters
         )
     end
 end
@@ -1611,7 +1526,7 @@ function QuinticHermiteSpline(
         ddu, du, u, t; extrapolation::ExtrapolationType.T = ExtrapolationType.None,
         extrapolation_left::ExtrapolationType.T = ExtrapolationType.None,
         extrapolation_right::ExtrapolationType.T = ExtrapolationType.None,
-        cache_parameters = false, assume_linear_t = 1.0e-2
+        cache_parameters = false
     )
     @assert length(u) == length(du) == length(ddu) "Length of `u` is not equal to length of `du` or `ddu`."
     extrapolation_left,
@@ -1619,16 +1534,15 @@ function QuinticHermiteSpline(
         extrapolation, extrapolation_left, extrapolation_right
     )
     u, t = munge_data(u, t)
-    linear_lookup = seems_linear(assume_linear_t, t)
     p = QuinticHermiteParameterCache(ddu, du, u, t, cache_parameters)
     A = QuinticHermiteSpline(
         ddu, du, u, t, nothing, p, extrapolation_left,
-        extrapolation_right, cache_parameters, linear_lookup
+        extrapolation_right, cache_parameters
     )
     I = cumulative_integral(A, cache_parameters)
     return QuinticHermiteSpline(
         ddu, du, u, t, I, p, extrapolation_left,
-        extrapolation_right, cache_parameters, linear_lookup
+        extrapolation_right, cache_parameters
     )
 end
 
@@ -1655,7 +1569,6 @@ struct SmoothArcLengthInterpolation{
     iguesser::Guesser{tType}
     t_props::propsType
     cache_parameters::Bool
-    linear_lookup::Bool
     out::Vector{P}
     derivative::Vector{P}
     in_place::Bool
@@ -1663,9 +1576,8 @@ struct SmoothArcLengthInterpolation{
             u, t, d, shape_itp, Δt_circle_segment, Δt_line_segment,
             center, radius, dir_1, dir_2, short_side_left,
             I, extrapolation_left, extrapolation_right,
-            assume_linear_t, out, derivative, in_place
+            out, derivative, in_place
         )
-        linear_lookup = seems_linear(assume_linear_t, t)
         t_props = FindFirstFunctions.SearchProperties(t)
         return new{
             typeof(u), typeof(t), typeof(I), eltype(radius),
@@ -1674,7 +1586,7 @@ struct SmoothArcLengthInterpolation{
             u, t, d, shape_itp, Δt_circle_segment, Δt_line_segment,
             center, radius, dir_1, dir_2, short_side_left,
             I, nothing, extrapolation_left, extrapolation_right,
-            Guesser(t), t_props, false, linear_lookup, out, derivative, in_place
+            Guesser(t), t_props, false, out, derivative, in_place
         )
     end
 end
@@ -1712,10 +1624,6 @@ If you want to do this, construct the shape interpolation yourself and use the
     the possible options. This keyword is ignored if `extrapolation != Extrapolation.none`.
   - `extrapolation_right`: The extrapolation type applied right of the data. See `extrapolation` for
     the possible options. This keyword is ignored if `extrapolation != Extrapolation.none`.
-  - `assume_linear_t`: boolean value to specify a faster index lookup behaviour for
-    evenly-distributed abscissae. Alternatively, a numerical threshold may be specified
-    for a test based on the normalized standard deviation of the difference with respect
-    to the straight line (see [`looks_linear`](@ref)). Defaults to 1e-2.
 """
 function SmoothArcLengthInterpolation(
         u::AbstractMatrix{U};
@@ -1762,10 +1670,6 @@ Approximate the `shape_itp` with a C¹ unit speed interpolation using line segme
     the possible options. This keyword is ignored if `extrapolation != Extrapolation.none`.
   - `extrapolation_right`: The extrapolation type applied right of the data. See `extrapolation` for
     the possible options. This keyword is ignored if `extrapolation != Extrapolation.none`.
-  - `assume_linear_t`: boolean value to specify a faster index lookup behaviour for
-    evenly-distributed abscissae. Alternatively, a numerical threshold may be specified
-    for a test based on the normalized standard deviation of the difference with respect
-    to the straight line (see [`looks_linear`](@ref)). Defaults to 1e-2.
 """
 function SmoothArcLengthInterpolation(
         shape_itp::AbstractInterpolation;
@@ -1814,7 +1718,6 @@ end
         extrapolation_left::ExtrapolationType.T = ExtrapolationType.None,
         extrapolation_right::ExtrapolationType.T = ExtrapolationType.None,
         cache_parameters::Bool = false,
-        assume_linear_t = 1e-2,
         in_place::Bool = true)
 
 Make a C¹ smooth unit speed interpolation through the given data with the given tangents using line
@@ -1839,10 +1742,6 @@ segments and circle segments.
     the possible options. This keyword is ignored if `extrapolation != Extrapolation.none`.
   - `extrapolation_right`: The extrapolation type applied right of the data. See `extrapolation` for
     the possible options. This keyword is ignored if `extrapolation != Extrapolation.none`.
-  - `assume_linear_t`: boolean value to specify a faster index lookup behaviour for
-    evenly-distributed abscissae. Alternatively, a numerical threshold may be specified
-    for a test based on the normalized standard deviation of the difference with respect
-    to the straight line (see [`looks_linear`](@ref)). Defaults to 1e-2.
 """
 function SmoothArcLengthInterpolation(
         u::AbstractMatrix,
@@ -1931,7 +1830,6 @@ function SmoothArcLengthInterpolation(
         extrapolation_left::ExtrapolationType.T = ExtrapolationType.None,
         extrapolation_right::ExtrapolationType.T = ExtrapolationType.None,
         cache_parameters::Bool = false,
-        assume_linear_t = 1.0e-2,
         in_place::Bool = true
     )
     N = size(u, 1)
@@ -1982,7 +1880,6 @@ function SmoothArcLengthInterpolation(
         extrapolation_right = munge_extrapolation(
         extrapolation, extrapolation_left, extrapolation_right
     )
-    linear_lookup = seems_linear(assume_linear_t, t)
 
     out = Vector{P}(undef, N)
     derivative = Vector{P}(undef, N)
@@ -1990,6 +1887,6 @@ function SmoothArcLengthInterpolation(
     return SmoothArcLengthInterpolation(
         u, t, d, shape_itp, Δt_circle_segment, Δt_line_segment,
         center, radius, dir_1, dir_2, short_side_left,
-        nothing, extrapolation_left, extrapolation_right, linear_lookup, out, derivative, in_place
+        nothing, extrapolation_left, extrapolation_right, out, derivative, in_place
     )
 end
diff --git a/src/interpolation_utils.jl b/src/interpolation_utils.jl
index 5e12edcf..4ba96885 100644
--- a/src/interpolation_utils.jl
+++ b/src/interpolation_utils.jl
@@ -167,29 +167,6 @@ function munge_data(U::AbstractArray{T, N}, t) where {T, N}
     return U, t
 end
 
-seems_linear(assume_linear_t::Bool, _) = assume_linear_t
-seems_linear(assume_linear_t::Number, t) = looks_linear(t; threshold = assume_linear_t)
-
-"""
-    looks_linear(t; threshold = 1e-2)
-
-Determine if the abscissae `t` are regularly distributed, taking the standard deviation of
-the difference between the array of abscissae with respect to the straight line linking
-its first and last elements, normalized by the range of `t`. If this standard deviation is
-below the given `threshold`, the vector looks linear (return true). Internal function -
-interface may change.
-"""
-function looks_linear(t; threshold = 1.0e-2)
-    length(t) <= 2 && return true
-    t_0, t_f = first(t), last(t)
-    t_span = t_f - t_0
-    tspan_over_N = t_span * length(t)^(-1)
-    norm_var = sum(
-        (t_i - t_0 - i * tspan_over_N)^2 for (i, t_i) in enumerate(t)
-    ) / (length(t) * t_span^2)
-    return norm_var < threshold^2
-end
-
 function get_idx(
         A::AbstractInterpolation, t, iguess::Integer; lb = 1,
         ub_shift = -1, idx_shift = 0, side = :last
diff --git a/test/Methods/derivative_tests.jl b/test/Methods/derivative_tests.jl
index df38b339..8f945ae3 100644
--- a/test/Methods/derivative_tests.jl
+++ b/test/Methods/derivative_tests.jl
@@ -49,7 +49,7 @@ function test_derivatives(method; args = [], kwargs = [], name::String)
             @test isapprox(fdiff, adiff, atol = 1.0e-8)
             @test isapprox(fdiff2, adiff2, atol = 1.0e-8)
             # Cached index
-            if hasproperty(func, :iguesser) && !func.iguesser.linear_lookup
+            if hasproperty(func, :t_props) && !func.t_props.is_uniform
                 @test abs(
                     func.iguesser.idx_prev[] -
                         searchsortedfirst(

From 23577581bb76fb4f09b3388ea7853e6c85eac7cf Mon Sep 17 00:00:00 2001
From: ChrisRackauckas-Claude <accounts@chrisrackauckas.com>
Date: Thu, 21 May 2026 11:42:30 -0400
Subject: [PATCH 03/24] Refactor get_idx to dispatch through Auto(A.t_props)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Both `get_idx` methods (integer hint and Guesser hint) used to hard-code
strategy choice — `BracketGallop` for the integer-hint path,
`GuesserHint` for the Guesser path. Both branches now build a single
`Auto(A.t_props)` strategy and pass the appropriate hint (`iguess` for
the integer overload, `iguess(t)` for the Guesser overload) to one
`searchsortedlast`/`searchsortedfirst` call.

The benefit is automatic O(1) closed-form lookup on exact-uniform `t`:
`Auto`'s per-query dispatch checks the cached `is_uniform` first and
short-circuits to `UniformStep` (which ignores the hint) when set,
matching what Interpolations.jl's uniform fast path does. For
non-uniform grids `_auto_pick` falls back to a hint-aware strategy
(BracketGallop / ExpFromLeft / SIMDLinearScan) by length and hint
validity, so the chained-ODE win from the previous branch is preserved.

The Guesser-hint path now stores the resulting `idx` back into
`iguess.idx_prev[]`, which `GuesserHint` used to do internally — needed
so the next correlated lookup gets the right `idx_prev` when `Auto`
hasn't gone through the uniform short-circuit.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
Co-Authored-By: Chris Rackauckas <accounts@chrisrackauckas.com>
---
 src/interpolation_utils.jl | 35 +++++++++++++++++------------------
 1 file changed, 17 insertions(+), 18 deletions(-)

diff --git a/src/interpolation_utils.jl b/src/interpolation_utils.jl
index 4ba96885..cc04f440 100644
--- a/src/interpolation_utils.jl
+++ b/src/interpolation_utils.jl
@@ -173,19 +173,15 @@ function get_idx(
     )
     tvec = A.t
     ub = length(tvec) + ub_shift
-    return if side == :last
-        clamp(
-            searchsortedlast(FindFirstFunctions.BracketGallop(), tvec, t, iguess) +
-                idx_shift, lb, ub
-        )
+    strat = FindFirstFunctions.Auto(A.t_props)
+    raw = if side == :last
+        searchsortedlast(strat, tvec, t, iguess)
     elseif side == :first
-        clamp(
-            searchsortedfirst(FindFirstFunctions.BracketGallop(), tvec, t, iguess) +
-                idx_shift, lb, ub
-        )
+        searchsortedfirst(strat, tvec, t, iguess)
     else
         error("side must be :first or :last")
     end
+    return clamp(raw + idx_shift, lb, ub)
 end
 
 function get_idx(
@@ -194,19 +190,22 @@ function get_idx(
     )
     tvec = A.t
     ub = length(tvec) + ub_shift
-    return if side == :last
-        clamp(
-            searchsortedlast(FindFirstFunctions.GuesserHint(iguess), tvec, t) +
-                idx_shift, lb, ub
-        )
+    strat = FindFirstFunctions.Auto(A.t_props)
+    # `iguess(t)` gives a linear-extrapolation hint when `t` looks linear and
+    # falls back to the cached `idx_prev` otherwise. `Auto` short-circuits to
+    # `UniformStep` for exact-uniform grids and ignores the hint there; for
+    # near-uniform-but-not-uniform grids the linear hint still beats `idx_prev`.
+    hint = iguess(t)
+    raw = if side == :last
+        searchsortedlast(strat, tvec, t, hint)
     elseif side == :first
-        clamp(
-            searchsortedfirst(FindFirstFunctions.GuesserHint(iguess), tvec, t) +
-                idx_shift, lb, ub
-        )
+        searchsortedfirst(strat, tvec, t, hint)
     else
         error("side must be :first or :last")
     end
+    idx = clamp(raw + idx_shift, lb, ub)
+    iguess.idx_prev[] = idx
+    return idx
 end
 
 cumulative_integral(::AbstractInterpolation, ::Bool) = nothing

From dcd7207c87cee2e44ee8d3e918c0c68bef915b27 Mon Sep 17 00:00:00 2001
From: ChrisRackauckas-Claude <accounts@chrisrackauckas.com>
Date: Thu, 21 May 2026 11:43:19 -0400
Subject: [PATCH 04/24] =?UTF-8?q?Fix=20O(n=C2=B2)=20QuadraticSpline=20cons?=
 =?UTF-8?q?truction=20in=20spline=5Fcoefficients!?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

`spline_coefficients!` located the active knot index with
`findfirst(x -> x > u, k)` — an O(n) linear scan on a sorted vector — on
every call. `quadratic_spline_params` calls it n times during
construction, so the constructor was O(n²) (~7 s for n=100k vs ~14 ms
for Dierckx). The per-query eval path (`cache_parameters=false`,
default) also paid O(n) per evaluation.

Two changes:

  1. Factor the locator-dependent body of `spline_coefficients!` into
     `_spline_coefficients_body!(N, d, k, u, i)`. The scalar
     `spline_coefficients!` now calls `searchsortedlast(k, u)` —
     O(log n) on the sorted knot vector — and delegates to the body.

  2. `quadratic_spline_params` maintains a running locator (the next
     iteration's `searchsortedlast` index is ≥ the current's, because
     `t` is sorted) and advances it amortised O(1) per knot. Total
     construction is O(n).

Bench (n=100k uniform, cache_parameters=false):
  QuadraticSpline construct: 6914 ms → 7.9 ms  (~880×)
  QuadraticSpline eval:        57.5 μs → 14.4 μs (~4×)

`spline_coefficients!` keeps `N .= zero(u)` at the top — BSpline
derivative paths (`_derivative(::BSplineInterpolation, …)`) read the
entire `sc` vector, so positions outside the body's
`nonzero_coefficient_idxs` window must be zero on every call. Dropping
that zero pass was an attempted further optimisation that silently
broke BSpline derivatives by leaking stale values from previous
queries.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
Co-Authored-By: Chris Rackauckas <accounts@chrisrackauckas.com>
---
 src/interpolation_utils.jl | 65 +++++++++++++++++++++++++++++++-------
 1 file changed, 54 insertions(+), 11 deletions(-)

diff --git a/src/interpolation_utils.jl b/src/interpolation_utils.jl
index cc04f440..0fc7e761 100644
--- a/src/interpolation_utils.jl
+++ b/src/interpolation_utils.jl
@@ -30,6 +30,10 @@ function findRequiredIdxs!(A::LagrangeInterpolation, t, idx)
 end
 
 function spline_coefficients!(N, d, k, u::Number)
+    # `N` is zeroed because BSpline derivative paths read the full vector
+    # (see `_derivative(::BSplineInterpolation, …)` in `derivatives.jl`).
+    # Positions outside the body's `(i-d):i` write window must be zero or
+    # stale values from previous calls would leak in.
     N .= zero(u)
     if u == k[1]
         N[1] = one(u)
@@ -38,18 +42,27 @@ function spline_coefficients!(N, d, k, u::Number)
         N[end] = one(u)
         return length(N):length(N)
     else
-        i = findfirst(x -> x > u, k)::Int - 1
-        N[i] = one(u)
-        for deg in 1:d
-            N[i - deg] = (k[i + 1] - u) / (k[i + 1] - k[i - deg + 1]) * N[i - deg + 1]
-            for j in (i - deg + 1):(i - 1)
-                N[j] = (u - k[j]) / (k[j + deg] - k[j]) * N[j] +
-                    (k[j + deg + 1] - u) / (k[j + deg + 1] - k[j + 1]) * N[j + 1]
-            end
-            N[i] = (u - k[i]) / (k[i + deg] - k[i]) * N[i]
+        # `k` is sorted; the legacy `findfirst(x -> x > u, k) - 1` did an O(n)
+        # linear scan. `searchsortedlast` returns the same index in O(log n).
+        i = searchsortedlast(k, u)
+        return _spline_coefficients_body!(N, d, k, u, i)
+    end
+end
+
+# Body of `spline_coefficients!` after the locator index `i` has been
+# determined. Used by `spline_coefficients!` (logarithmic locator) and by
+# `quadratic_spline_params` (O(1) amortised running locator).
+function _spline_coefficients_body!(N, d, k, u, i)
+    N[i] = one(u)
+    for deg in 1:d
+        N[i - deg] = (k[i + 1] - u) / (k[i + 1] - k[i - deg + 1]) * N[i - deg + 1]
+        for j in (i - deg + 1):(i - 1)
+            N[j] = (u - k[j]) / (k[j + deg] - k[j]) * N[j] +
+                (k[j + deg + 1] - u) / (k[j + deg + 1] - k[j + 1]) * N[j + 1]
         end
-        return (i - d):i
+        N[i] = (u - k[i]) / (k[i + deg] - k[i]) * N[i]
     end
+    return (i - d):i
 end
 
 function spline_coefficients!(N, d, k, u::AbstractVector)
@@ -86,11 +99,41 @@ function quadratic_spline_params(t::AbstractVector, sc::AbstractVector)
     diag_hi = Vector{dtype_sc}(undef, n - 1)
     diag_lo = Vector{dtype_sc}(undef, n - 1)
 
+    # `t` is sorted and `k` is built from `t`, so the locator
+    # `searchsortedlast(k, tᵢ)` is non-decreasing in `i`. Maintain a running
+    # pointer to advance amortised O(1) per knot — total O(n) instead of the
+    # O(n²) `findfirst` scan or O(n log n) per-call `searchsortedlast`.
+    nk = length(k)
+    d = 2
+    fill!(sc, zero(dtype_sc))
+    locator = 1
     for (i, tᵢ) in enumerate(t)
-        spline_coefficients!(sc, 2, k, tᵢ)
+        if tᵢ == k[1] || tᵢ == k[end]
+            # `t[1] == k[1]` and `t[end] == k[end]` by construction, so this
+            # branch only fires for `i == 1` (sc[1] = 1) and `i == n`
+            # (sc[end] = 1). Read directly without touching `sc`.
+            on_first = tᵢ == k[1]
+            diag[i] = (on_first && i == 1) || (!on_first && i == length(sc)) ?
+                one(dtype_sc) : zero(dtype_sc)
+            (i > 1) && (diag_lo[i - 1] = zero(dtype_sc))
+            (i < n) && (diag_hi[i] = zero(dtype_sc))
+            continue
+        end
+        # Advance the running locator until `k[locator+1] > tᵢ` — equivalent
+        # to `searchsortedlast(k, tᵢ)` on monotone-increasing `tᵢ` inputs.
+        while locator < nk && k[locator + 1] <= tᵢ
+            locator += 1
+        end
+        _spline_coefficients_body!(sc, d, k, tᵢ, locator)
         diag[i] = sc[i]
         (i > 1) && (diag_lo[i - 1] = sc[i - 1])
         (i < n) && (diag_hi[i] = sc[i + 1])
+        # The body writes only `sc[locator-d:locator]`; zero those entries
+        # so the next iteration starts with `sc .== 0` again (the body
+        # assumes positions outside its write window are already zero).
+        for j in (locator - d):locator
+            sc[j] = zero(dtype_sc)
+        end
     end
 
     A = Tridiagonal(diag_lo, diag, diag_hi)

From 9b21e37e6b14964c061f6090e05d954244e8766c Mon Sep 17 00:00:00 2001
From: ChrisRackauckas-Claude <accounts@chrisrackauckas.com>
Date: Thu, 21 May 2026 16:54:08 -0400
Subject: [PATCH 05/24] Add `search_properties` constructor kwarg to all
 interpolation types
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Breaking change: every interpolation constructor that previously built
`t_props = FindFirstFunctions.SearchProperties(t)` internally now accepts an
optional `search_properties::Union{Nothing,FindFirstFunctions.SearchProperties}`
keyword. When omitted (the default), behaviour is identical to before:
`SearchProperties(t)` is built once and shared between the no-integral and
with-integral inner constructor calls — fixing a pre-existing redundancy.

When supplied, the caller's `SearchProperties` is used as-is, which gives
domain experts the ability to opt into FFF strategies that the data-driven
probes can't detect cheaply:

  - `LinearInterpolation(u, t; search_properties =
        SearchProperties(t; is_uniform = true))`
    opts a `Vector` with float-noise into `UniformStep`'s closed-form O(1)
    lookup, which the probe rejects (because float-noise exceeds the
    1e-12 uniformity tolerance).
  - Sharing a single populated `SearchProperties` across many interpolations
    that share `t` avoids redundant probe work.

This subsumes the old `assume_linear_t` knob (already dropped on this
branch) and is more powerful — callers control every property in
`SearchProperties`, not just the linearity flag.

The inner struct constructors (called twice during construction for the
cumulative-integral pre-build path) now take `t_props` as a positional
argument, so the probe runs at most once per interpolation regardless.

All 15 cache types (`LinearInterpolation`, `QuadraticInterpolation`,
`LagrangeInterpolation`, `AkimaInterpolation`, `ConstantInterpolation`,
`SmoothedConstantInterpolation`, `QuadraticSpline`, `CubicSpline`,
`BSplineInterpolation`, `BSplineApprox`, `CubicHermiteSpline`,
`QuinticHermiteSpline`, `SmoothArcLengthInterpolation`,
`LinearInterpolationIntInv`, `ConstantInterpolationIntInv`) updated.

Co-Authored-By: Chris Rackauckas <accounts@chrisrackauckas.com>
---
 src/integral_inverses.jl    |  23 +++--
 src/interpolation_caches.jl | 177 +++++++++++++++++++++---------------
 2 files changed, 120 insertions(+), 80 deletions(-)

diff --git a/src/integral_inverses.jl b/src/integral_inverses.jl
index 2e375aae..936f5ab4 100644
--- a/src/integral_inverses.jl
+++ b/src/integral_inverses.jl
@@ -42,8 +42,9 @@ struct LinearInterpolationIntInv{uType, tType, itpType, T, propsType} <:
     iguesser::Guesser{tType}
     t_props::propsType
     itp::itpType
-    function LinearInterpolationIntInv(u, t, A, extrapolation_left, extrapolation_right)
-        t_props = FindFirstFunctions.SearchProperties(t)
+    function LinearInterpolationIntInv(
+            u, t, A, extrapolation_left, extrapolation_right, t_props,
+        )
         return new{typeof(u), typeof(t), typeof(A), eltype(u), typeof(t_props)}(
             u, t, extrapolation_left, extrapolation_right, Guesser(t), t_props, A
         )
@@ -63,12 +64,14 @@ end
 function invert_integral(
         A::LinearInterpolation{<:AbstractVector{<:Number}};
         extrapolation_left::ExtrapolationType.T = A.extrapolation_left,
-        extrapolation_right::ExtrapolationType.T = A.extrapolation_right
+        extrapolation_right::ExtrapolationType.T = A.extrapolation_right,
+        search_properties::Union{Nothing, FindFirstFunctions.SearchProperties} = nothing
     )
     !invertible_integral(A) && throw(IntegralNotInvertibleError())
-
+    t_I = get_I(A)
+    t_props = something(search_properties, FindFirstFunctions.SearchProperties(t_I))
     return LinearInterpolationIntInv(
-        A.t, get_I(A), A, extrapolation_left, extrapolation_right
+        A.t, t_I, A, extrapolation_left, extrapolation_right, t_props
     )
 end
 
@@ -105,9 +108,8 @@ struct ConstantInterpolationIntInv{uType, tType, itpType, T, propsType} <:
     t_props::propsType
     itp::itpType
     function ConstantInterpolationIntInv(
-            u, t, A, extrapolation_left, extrapolation_right
+            u, t, A, extrapolation_left, extrapolation_right, t_props,
         )
-        t_props = FindFirstFunctions.SearchProperties(t)
         return new{typeof(u), typeof(t), typeof(A), eltype(u), typeof(t_props)}(
             u, t, extrapolation_left, extrapolation_right, Guesser(t), t_props, A
         )
@@ -121,11 +123,14 @@ end
 function invert_integral(
         A::ConstantInterpolation{<:AbstractVector{<:Number}};
         extrapolation_left::ExtrapolationType.T = A.extrapolation_left,
-        extrapolation_right::ExtrapolationType.T = A.extrapolation_right
+        extrapolation_right::ExtrapolationType.T = A.extrapolation_right,
+        search_properties::Union{Nothing, FindFirstFunctions.SearchProperties} = nothing
     )
     !invertible_integral(A) && throw(IntegralNotInvertibleError())
+    t_I = get_I(A)
+    t_props = something(search_properties, FindFirstFunctions.SearchProperties(t_I))
     return ConstantInterpolationIntInv(
-        A.t, get_I(A), A, extrapolation_left, extrapolation_right
+        A.t, t_I, A, extrapolation_left, extrapolation_right, t_props
     )
 end
 
diff --git a/src/interpolation_caches.jl b/src/interpolation_caches.jl
index 107dfc7f..1a94fc07 100644
--- a/src/interpolation_caches.jl
+++ b/src/interpolation_caches.jl
@@ -36,9 +36,8 @@ struct LinearInterpolation{uType, tType, IType, pType, T, propsType} <:
     cache_parameters::Bool
     function LinearInterpolation(
             u, t, I, p, extrapolation_left, extrapolation_right,
-            cache_parameters
+            cache_parameters, t_props
         )
-        t_props = FindFirstFunctions.SearchProperties(t)
         return new{
             typeof(u), typeof(t), typeof(I), typeof(p.slope),
             eltype(u), typeof(t_props),
@@ -52,22 +51,25 @@ end
 function LinearInterpolation(
         u, t; extrapolation::ExtrapolationType.T = ExtrapolationType.None,
         extrapolation_left::ExtrapolationType.T = ExtrapolationType.None,
-        extrapolation_right::ExtrapolationType.T = ExtrapolationType.None, cache_parameters = false
+        extrapolation_right::ExtrapolationType.T = ExtrapolationType.None,
+        cache_parameters = false,
+        search_properties::Union{Nothing, FindFirstFunctions.SearchProperties} = nothing
     )
     extrapolation_left,
         extrapolation_right = munge_extrapolation(
         extrapolation, extrapolation_left, extrapolation_right
     )
     u, t = munge_data(u, t)
+    t_props = something(search_properties, FindFirstFunctions.SearchProperties(t))
     p = LinearParameterCache(u, t, cache_parameters)
     A = LinearInterpolation(
         u, t, nothing, p, extrapolation_left,
-        extrapolation_right, cache_parameters
+        extrapolation_right, cache_parameters, t_props
     )
     I = cumulative_integral(A, cache_parameters)
     return LinearInterpolation(
         u, t, I, p, extrapolation_left, extrapolation_right,
-        cache_parameters
+        cache_parameters, t_props
     )
 end
 
@@ -110,11 +112,10 @@ struct QuadraticInterpolation{uType, tType, IType, pType, T, propsType} <:
     cache_parameters::Bool
     function QuadraticInterpolation(
             u, t, I, p, mode, extrapolation_left,
-            extrapolation_right, cache_parameters
+            extrapolation_right, cache_parameters, t_props
         )
         mode ∈ (:Forward, :Backward) ||
             error("mode should be :Forward or :Backward for QuadraticInterpolation")
-        t_props = FindFirstFunctions.SearchProperties(t)
         return new{
             typeof(u), typeof(t), typeof(I), typeof(p.α),
             eltype(u), typeof(t_props),
@@ -128,22 +129,25 @@ end
 function QuadraticInterpolation(
         u, t, mode; extrapolation::ExtrapolationType.T = ExtrapolationType.None,
         extrapolation_left::ExtrapolationType.T = ExtrapolationType.None,
-        extrapolation_right::ExtrapolationType.T = ExtrapolationType.None, cache_parameters = false
+        extrapolation_right::ExtrapolationType.T = ExtrapolationType.None,
+        cache_parameters = false,
+        search_properties::Union{Nothing, FindFirstFunctions.SearchProperties} = nothing
     )
     extrapolation_left,
         extrapolation_right = munge_extrapolation(
         extrapolation, extrapolation_left, extrapolation_right
     )
     u, t = munge_data(u, t)
+    t_props = something(search_properties, FindFirstFunctions.SearchProperties(t))
     p = QuadraticParameterCache(u, t, cache_parameters, mode)
     A = QuadraticInterpolation(
         u, t, nothing, p, mode, extrapolation_left,
-        extrapolation_right, cache_parameters
+        extrapolation_right, cache_parameters, t_props
     )
     I = cumulative_integral(A, cache_parameters)
     return QuadraticInterpolation(
         u, t, I, p, mode, extrapolation_left,
-        extrapolation_right, cache_parameters
+        extrapolation_right, cache_parameters, t_props
     )
 end
 
@@ -184,11 +188,10 @@ struct LagrangeInterpolation{uType, tType, T, bcacheType, propsType} <:
     extrapolation_right::ExtrapolationType.T
     iguesser::Guesser{tType}
     t_props::propsType
-    function LagrangeInterpolation(u, t, n, extrapolation_left, extrapolation_right)
+    function LagrangeInterpolation(u, t, n, extrapolation_left, extrapolation_right, t_props)
         bcache = zeros(eltype(u[1]), n + 1)
         idxs = zeros(Int, n + 1)
         fill!(bcache, NaN)
-        t_props = FindFirstFunctions.SearchProperties(t)
         return new{typeof(u), typeof(t), eltype(u), typeof(bcache), typeof(t_props)}(
             u,
             t,
@@ -207,7 +210,8 @@ function LagrangeInterpolation(
         u, t, n = length(t) - 1;
         extrapolation::ExtrapolationType.T = ExtrapolationType.None,
         extrapolation_left::ExtrapolationType.T = ExtrapolationType.None,
-        extrapolation_right::ExtrapolationType.T = ExtrapolationType.None
+        extrapolation_right::ExtrapolationType.T = ExtrapolationType.None,
+        search_properties::Union{Nothing, FindFirstFunctions.SearchProperties} = nothing
     )
     extrapolation_left,
         extrapolation_right = munge_extrapolation(
@@ -217,7 +221,8 @@ function LagrangeInterpolation(
     if n != length(t) - 1
         error("Currently only n=length(t) - 1 is supported")
     end
-    return LagrangeInterpolation(u, t, n, extrapolation_left, extrapolation_right)
+    t_props = something(search_properties, FindFirstFunctions.SearchProperties(t))
+    return LagrangeInterpolation(u, t, n, extrapolation_left, extrapolation_right, t_props)
 end
 
 """
@@ -263,9 +268,8 @@ struct AkimaInterpolation{uType, tType, IType, bType, cType, dType, T, propsType
     cache_parameters::Bool
     function AkimaInterpolation(
             u, t, I, b, c, d, extrapolation_left,
-            extrapolation_right, cache_parameters
+            extrapolation_right, cache_parameters, t_props
         )
-        t_props = FindFirstFunctions.SearchProperties(t)
         return new{
             typeof(u), typeof(t), typeof(I), typeof(b), typeof(c),
             typeof(d), eltype(u), typeof(t_props),
@@ -350,13 +354,16 @@ function AkimaInterpolation(
         u, t; modified::Bool = false,
         extrapolation::ExtrapolationType.T = ExtrapolationType.None,
         extrapolation_left::ExtrapolationType.T = ExtrapolationType.None,
-        extrapolation_right::ExtrapolationType.T = ExtrapolationType.None, cache_parameters = false
+        extrapolation_right::ExtrapolationType.T = ExtrapolationType.None,
+        cache_parameters = false,
+        search_properties::Union{Nothing, FindFirstFunctions.SearchProperties} = nothing
     )
     extrapolation_left,
         extrapolation_right = munge_extrapolation(
         extrapolation, extrapolation_left, extrapolation_right
     )
     u, t = munge_data(u, t)
+    t_props = something(search_properties, FindFirstFunctions.SearchProperties(t))
     n = length(t)
     T = eltype(u)
     b = Vector{T}(undef, n)
@@ -366,12 +373,12 @@ function AkimaInterpolation(
 
     A = AkimaInterpolation(
         u, t, nothing, b, c, d, extrapolation_left,
-        extrapolation_right, cache_parameters
+        extrapolation_right, cache_parameters, t_props
     )
     I = cumulative_integral(A, cache_parameters)
     return AkimaInterpolation(
         u, t, I, b, c, d, extrapolation_left,
-        extrapolation_right, cache_parameters
+        extrapolation_right, cache_parameters, t_props
     )
 end
 
@@ -414,9 +421,8 @@ struct ConstantInterpolation{uType, tType, IType, T, propsType} <:
     cache_parameters::Bool
     function ConstantInterpolation(
             u, t, I, dir, extrapolation_left, extrapolation_right,
-            cache_parameters
+            cache_parameters, t_props
         )
-        t_props = FindFirstFunctions.SearchProperties(t)
         return new{typeof(u), typeof(t), typeof(I), eltype(u), typeof(t_props)}(
             u, t, I, nothing, dir, extrapolation_left, extrapolation_right,
             Guesser(t), t_props, cache_parameters
@@ -428,21 +434,23 @@ function ConstantInterpolation(
         u, t; dir = :left, extrapolation::ExtrapolationType.T = ExtrapolationType.None,
         extrapolation_left::ExtrapolationType.T = ExtrapolationType.None,
         extrapolation_right::ExtrapolationType.T = ExtrapolationType.None,
-        cache_parameters = false
+        cache_parameters = false,
+        search_properties::Union{Nothing, FindFirstFunctions.SearchProperties} = nothing
     )
     extrapolation_left,
         extrapolation_right = munge_extrapolation(
         extrapolation, extrapolation_left, extrapolation_right
     )
     u, t = munge_data(u, t)
+    t_props = something(search_properties, FindFirstFunctions.SearchProperties(t))
     A = ConstantInterpolation(
         u, t, nothing, dir, extrapolation_left,
-        extrapolation_right, cache_parameters
+        extrapolation_right, cache_parameters, t_props
     )
     I = cumulative_integral(A, cache_parameters)
     return ConstantInterpolation(
         u, t, I, dir, extrapolation_left, extrapolation_right,
-        cache_parameters
+        cache_parameters, t_props
     )
 end
 
@@ -489,9 +497,8 @@ struct SmoothedConstantInterpolation{
     cache_parameters::Bool
     function SmoothedConstantInterpolation(
             u, t, I, p, d_max, extrapolation_left,
-            extrapolation_right, cache_parameters
+            extrapolation_right, cache_parameters, t_props
         )
-        t_props = FindFirstFunctions.SearchProperties(t)
         return new{
             typeof(u), typeof(t), typeof(I), typeof(p.d),
             typeof(p.c), typeof(d_max), eltype(u), typeof(t_props),
@@ -506,24 +513,26 @@ function SmoothedConstantInterpolation(
         u, t; d_max = Inf, extrapolation::ExtrapolationType.T = ExtrapolationType.None,
         extrapolation_left::ExtrapolationType.T = ExtrapolationType.None,
         extrapolation_right::ExtrapolationType.T = ExtrapolationType.None,
-        cache_parameters = false
+        cache_parameters = false,
+        search_properties::Union{Nothing, FindFirstFunctions.SearchProperties} = nothing
     )
     extrapolation_left,
         extrapolation_right = munge_extrapolation(
         extrapolation, extrapolation_left, extrapolation_right
     )
     u, t = munge_data(u, t)
+    t_props = something(search_properties, FindFirstFunctions.SearchProperties(t))
     p = SmoothedConstantParameterCache(
         u, t, cache_parameters, d_max, extrapolation_left, extrapolation_right
     )
     A = SmoothedConstantInterpolation(
         u, t, nothing, p, d_max, extrapolation_left,
-        extrapolation_right, cache_parameters
+        extrapolation_right, cache_parameters, t_props
     )
     I = cumulative_integral(A, cache_parameters)
     return SmoothedConstantInterpolation(
         u, t, I, p, d_max, extrapolation_left,
-        extrapolation_right, cache_parameters
+        extrapolation_right, cache_parameters, t_props
     )
 end
 
@@ -566,9 +575,8 @@ struct QuadraticSpline{uType, tType, IType, pType, kType, cType, scType, T, prop
     cache_parameters::Bool
     function QuadraticSpline(
             u, t, I, p, k, c, sc, extrapolation_left,
-            extrapolation_right, cache_parameters
+            extrapolation_right, cache_parameters, t_props
         )
-        t_props = FindFirstFunctions.SearchProperties(t)
         return new{
             typeof(u), typeof(t), typeof(I), typeof(p.α), typeof(k),
             typeof(c), typeof(sc), eltype(u), typeof(t_props),
@@ -594,13 +602,15 @@ function QuadraticSpline(
         u::AbstractVector{<:Number}, t; extrapolation::ExtrapolationType.T = ExtrapolationType.None,
         extrapolation_left::ExtrapolationType.T = ExtrapolationType.None,
         extrapolation_right::ExtrapolationType.T = ExtrapolationType.None,
-        cache_parameters = false
+        cache_parameters = false,
+        search_properties::Union{Nothing, FindFirstFunctions.SearchProperties} = nothing
     )
     extrapolation_left,
         extrapolation_right = munge_extrapolation(
         extrapolation, extrapolation_left, extrapolation_right
     )
     u, t = munge_data(u, t)
+    t_props = something(search_properties, FindFirstFunctions.SearchProperties(t))
 
     n = length(t)
     dtype_sc = typeof(one(eltype(t)) / one(eltype(t)))
@@ -611,25 +621,28 @@ function QuadraticSpline(
     p = QuadraticSplineParameterCache(u, t, k, c, sc, cache_parameters)
     A = QuadraticSpline(
         u, t, nothing, p, k, c, sc, extrapolation_left,
-        extrapolation_right, cache_parameters
+        extrapolation_right, cache_parameters, t_props
     )
     I = cumulative_integral(A, cache_parameters)
     return QuadraticSpline(
         u, t, I, p, k, c, sc, extrapolation_left,
-        extrapolation_right, cache_parameters
+        extrapolation_right, cache_parameters, t_props
     )
 end
 
 function QuadraticSpline(
         u::AbstractVector, t; extrapolation::ExtrapolationType.T = ExtrapolationType.None,
         extrapolation_left::ExtrapolationType.T = ExtrapolationType.None,
-        extrapolation_right::ExtrapolationType.T = ExtrapolationType.None, cache_parameters = false,
+        extrapolation_right::ExtrapolationType.T = ExtrapolationType.None,
+        cache_parameters = false,
+        search_properties::Union{Nothing, FindFirstFunctions.SearchProperties} = nothing
     )
     extrapolation_left,
         extrapolation_right = munge_extrapolation(
         extrapolation, extrapolation_left, extrapolation_right
     )
     u, t = munge_data(u, t)
+    t_props = something(search_properties, FindFirstFunctions.SearchProperties(t))
 
     n = length(t)
     dtype_sc = typeof(one(eltype(t)) / one(eltype(t)))
@@ -650,12 +663,12 @@ function QuadraticSpline(
     p = QuadraticSplineParameterCache(u, t, k, c, sc, cache_parameters)
     A = QuadraticSpline(
         u, t, nothing, p, k, c, sc, extrapolation_left,
-        extrapolation_right, cache_parameters
+        extrapolation_right, cache_parameters, t_props
     )
     I = cumulative_integral(A, cache_parameters)
     return QuadraticSpline(
         u, t, I, p, k, c, sc, extrapolation_left,
-        extrapolation_right, cache_parameters
+        extrapolation_right, cache_parameters, t_props
     )
 end
 
@@ -697,9 +710,8 @@ struct CubicSpline{uType, tType, IType, pType, hType, zType, T, propsType} <:
     cache_parameters::Bool
     function CubicSpline(
             u, t, I, p, h, z, extrapolation_left,
-            extrapolation_right, cache_parameters
+            extrapolation_right, cache_parameters, t_props
         )
-        t_props = FindFirstFunctions.SearchProperties(t)
         return new{
             typeof(u), typeof(t), typeof(I), typeof(p.c₁),
             typeof(h), typeof(z), eltype(u), typeof(t_props),
@@ -724,13 +736,16 @@ function CubicSpline(
         u::AbstractVector{<:Number},
         t; extrapolation::ExtrapolationType.T = ExtrapolationType.None,
         extrapolation_left::ExtrapolationType.T = ExtrapolationType.None,
-        extrapolation_right::ExtrapolationType.T = ExtrapolationType.None, cache_parameters = false,
+        extrapolation_right::ExtrapolationType.T = ExtrapolationType.None,
+        cache_parameters = false,
+        search_properties::Union{Nothing, FindFirstFunctions.SearchProperties} = nothing
     )
     extrapolation_left,
         extrapolation_right = munge_extrapolation(
         extrapolation, extrapolation_left, extrapolation_right
     )
     u, t = munge_data(u, t)
+    t_props = something(search_properties, FindFirstFunctions.SearchProperties(t))
     n = length(t) - 1
     h = vcat(0, map(k -> t[k + 1] - t[k], 1:(length(t) - 1)), 0)
     dl = vcat(h[2:n], zero(eltype(h)))
@@ -753,26 +768,30 @@ function CubicSpline(
     p = CubicSplineParameterCache(u, h, z, cache_parameters)
     A = CubicSpline(
         u, t, nothing, p, h[1:(n + 1)], z, extrapolation_left,
-        extrapolation_right, cache_parameters
+        extrapolation_right, cache_parameters, t_props
     )
     I = cumulative_integral(A, cache_parameters)
     return CubicSpline(
         u, t, I, p, h[1:(n + 1)], z, extrapolation_left,
-        extrapolation_right, cache_parameters
+        extrapolation_right, cache_parameters, t_props
     )
 end
 
 function CubicSpline(
         u::AbstractArray{T, N},
         t;
-        extrapolation::ExtrapolationType.T = ExtrapolationType.None, extrapolation_left::ExtrapolationType.T = ExtrapolationType.None,
-        extrapolation_right::ExtrapolationType.T = ExtrapolationType.None, cache_parameters = false,
+        extrapolation::ExtrapolationType.T = ExtrapolationType.None,
+        extrapolation_left::ExtrapolationType.T = ExtrapolationType.None,
+        extrapolation_right::ExtrapolationType.T = ExtrapolationType.None,
+        cache_parameters = false,
+        search_properties::Union{Nothing, FindFirstFunctions.SearchProperties} = nothing
     ) where {T, N}
     extrapolation_left,
         extrapolation_right = munge_extrapolation(
         extrapolation, extrapolation_left, extrapolation_right
     )
     u, t = munge_data(u, t)
+    t_props = something(search_properties, FindFirstFunctions.SearchProperties(t))
     n = length(t) - 1
     h = vcat(0, map(k -> t[k + 1] - t[k], 1:(length(t) - 1)), 0)
     dl = vcat(h[2:n], zero(eltype(h)))
@@ -798,25 +817,28 @@ function CubicSpline(
     p = CubicSplineParameterCache(u, h, z, cache_parameters)
     A = CubicSpline(
         u, t, nothing, p, h[1:(n + 1)], z, extrapolation_left,
-        extrapolation_right, cache_parameters
+        extrapolation_right, cache_parameters, t_props
     )
     I = cumulative_integral(A, cache_parameters)
     return CubicSpline(
         u, t, I, p, h[1:(n + 1)], z, extrapolation_left,
-        extrapolation_right, cache_parameters
+        extrapolation_right, cache_parameters, t_props
     )
 end
 
 function CubicSpline(
         u::AbstractVector, t; extrapolation::ExtrapolationType.T = ExtrapolationType.None,
         extrapolation_left::ExtrapolationType.T = ExtrapolationType.None,
-        extrapolation_right::ExtrapolationType.T = ExtrapolationType.None, cache_parameters = false,
+        extrapolation_right::ExtrapolationType.T = ExtrapolationType.None,
+        cache_parameters = false,
+        search_properties::Union{Nothing, FindFirstFunctions.SearchProperties} = nothing
     )
     extrapolation_left,
         extrapolation_right = munge_extrapolation(
         extrapolation, extrapolation_left, extrapolation_right
     )
     u, t = munge_data(u, t)
+    t_props = something(search_properties, FindFirstFunctions.SearchProperties(t))
     n = length(t) - 1
     h = vcat(0, map(k -> t[k + 1] - t[k], 1:(length(t) - 1)), 0)
     dl = vcat(h[2:n], zero(eltype(h)))
@@ -835,12 +857,12 @@ function CubicSpline(
     p = CubicSplineParameterCache(u, h, z, cache_parameters)
     A = CubicSpline(
         u, t, nothing, p, h[1:(n + 1)], z, extrapolation_left,
-        extrapolation_right, cache_parameters
+        extrapolation_right, cache_parameters, t_props
     )
     I = cumulative_integral(A, cache_parameters)
     return CubicSpline(
         u, t, I, p, h[1:(n + 1)], z, extrapolation_left,
-        extrapolation_right, cache_parameters
+        extrapolation_right, cache_parameters, t_props
     )
 end
 
@@ -896,8 +918,8 @@ struct BSplineInterpolation{uType, tType, pType, kType, cType, scType, T, propsT
             knotVecType,
             extrapolation_left,
             extrapolation_right,
+            t_props,
         )
-        t_props = FindFirstFunctions.SearchProperties(t)
         return new{
             typeof(u), typeof(t), typeof(p), typeof(k),
             typeof(c), typeof(sc), eltype(u), typeof(t_props),
@@ -923,13 +945,15 @@ function BSplineInterpolation(
         u::AbstractVector, t, d, pVecType, knotVecType;
         extrapolation::ExtrapolationType.T = ExtrapolationType.None,
         extrapolation_left::ExtrapolationType.T = ExtrapolationType.None,
-        extrapolation_right::ExtrapolationType.T = ExtrapolationType.None
+        extrapolation_right::ExtrapolationType.T = ExtrapolationType.None,
+        search_properties::Union{Nothing, FindFirstFunctions.SearchProperties} = nothing
     )
     extrapolation_left,
         extrapolation_right = munge_extrapolation(
         extrapolation, extrapolation_left, extrapolation_right
     )
     u, t = munge_data(u, t)
+    t_props = something(search_properties, FindFirstFunctions.SearchProperties(t))
     n = length(t)
     n < d + 1 && error("BSplineInterpolation needs at least d + 1, i.e. $(d + 1) points.")
     s = zero(eltype(u))
@@ -994,7 +1018,7 @@ function BSplineInterpolation(
     sc = zeros(eltype(t), n)
     return BSplineInterpolation(
         u, t, d, p, k, c, sc, pVecType, knotVecType,
-        extrapolation_left, extrapolation_right
+        extrapolation_left, extrapolation_right, t_props
     )
 end
 
@@ -1003,12 +1027,14 @@ function BSplineInterpolation(
         extrapolation::ExtrapolationType.T = ExtrapolationType.None,
         extrapolation_left::ExtrapolationType.T = ExtrapolationType.None,
         extrapolation_right::ExtrapolationType.T = ExtrapolationType.None,
+        search_properties::Union{Nothing, FindFirstFunctions.SearchProperties} = nothing,
     )
     extrapolation_left,
         extrapolation_right = munge_extrapolation(
         extrapolation, extrapolation_left, extrapolation_right
     )
     u, t = munge_data(u, t)
+    t_props = something(search_properties, FindFirstFunctions.SearchProperties(t))
     n = length(t)
     n < d + 1 && error("BSplineInterpolation needs at least d + 1, i.e. $(d + 1) points.")
     s = zero(eltype(u))
@@ -1076,7 +1102,7 @@ function BSplineInterpolation(
     sc = zeros(eltype(t), n)
     return BSplineInterpolation(
         u, t, d, p, k, c, sc, pVecType, knotVecType,
-        extrapolation_left, extrapolation_right
+        extrapolation_left, extrapolation_right, t_props
     )
 end
 
@@ -1136,8 +1162,8 @@ struct BSplineApprox{uType, tType, pType, kType, cType, scType, T, propsType} <:
             knotVecType,
             extrapolation_left,
             extrapolation_right,
+            t_props,
         )
-        t_props = FindFirstFunctions.SearchProperties(t)
         return new{
             typeof(u), typeof(t), typeof(p), typeof(k),
             typeof(c), typeof(sc), eltype(u), typeof(t_props),
@@ -1164,13 +1190,15 @@ function BSplineApprox(
         u::AbstractVector, t, d, h, pVecType, knotVecType;
         extrapolation::ExtrapolationType.T = ExtrapolationType.None,
         extrapolation_left::ExtrapolationType.T = ExtrapolationType.None,
-        extrapolation_right::ExtrapolationType.T = ExtrapolationType.None
+        extrapolation_right::ExtrapolationType.T = ExtrapolationType.None,
+        search_properties::Union{Nothing, FindFirstFunctions.SearchProperties} = nothing
     )
     extrapolation_left,
         extrapolation_right = munge_extrapolation(
         extrapolation, extrapolation_left, extrapolation_right
     )
     u, t = munge_data(u, t)
+    t_props = something(search_properties, FindFirstFunctions.SearchProperties(t))
     n = length(t)
     h < d + 1 && error("BSplineApprox needs at least d + 1, i.e. $(d + 1) control points.")
     s = zero(eltype(u))
@@ -1256,7 +1284,7 @@ function BSplineApprox(
     sc = zeros(eltype(t), h)
     return BSplineApprox(
         u, t, d, h, p, k, c, sc, pVecType, knotVecType,
-        extrapolation_left, extrapolation_right
+        extrapolation_left, extrapolation_right, t_props
     )
 end
 
@@ -1265,12 +1293,14 @@ function BSplineApprox(
         extrapolation::ExtrapolationType.T = ExtrapolationType.None,
         extrapolation_left::ExtrapolationType.T = ExtrapolationType.None,
         extrapolation_right::ExtrapolationType.T = ExtrapolationType.None,
+        search_properties::Union{Nothing, FindFirstFunctions.SearchProperties} = nothing,
     ) where {T, N}
     extrapolation_left,
         extrapolation_right = munge_extrapolation(
         extrapolation, extrapolation_left, extrapolation_right
     )
     u, t = munge_data(u, t)
+    t_props = something(search_properties, FindFirstFunctions.SearchProperties(t))
     n = length(t)
     h < d + 1 && error("BSplineApprox needs at least d + 1, i.e. $(d + 1) control points.")
     s = zero(eltype(u))
@@ -1364,7 +1394,7 @@ function BSplineApprox(
     sc = zeros(eltype(t), h)
     return BSplineApprox(
         u, t, d, h, p, k, c, sc, pVecType, knotVecType,
-        extrapolation_left, extrapolation_right
+        extrapolation_left, extrapolation_right, t_props
     )
 end
 """
@@ -1404,9 +1434,8 @@ struct CubicHermiteSpline{uType, tType, IType, duType, pType, T, propsType} <:
     cache_parameters::Bool
     function CubicHermiteSpline(
             du, u, t, I, p, extrapolation_left, extrapolation_right,
-            cache_parameters
+            cache_parameters, t_props
         )
-        t_props = FindFirstFunctions.SearchProperties(t)
         return new{
             typeof(u), typeof(t), typeof(I), typeof(du),
             typeof(p.c₁), eltype(u), typeof(t_props),
@@ -1420,7 +1449,9 @@ end
 function CubicHermiteSpline(
         du, u, t; extrapolation::ExtrapolationType.T = ExtrapolationType.None,
         extrapolation_left::ExtrapolationType.T = ExtrapolationType.None,
-        extrapolation_right::ExtrapolationType.T = ExtrapolationType.None, cache_parameters = false
+        extrapolation_right::ExtrapolationType.T = ExtrapolationType.None,
+        cache_parameters = false,
+        search_properties::Union{Nothing, FindFirstFunctions.SearchProperties} = nothing
     )
     @assert length(u) == length(du) "Length of `u` is not equal to length of `du`."
     extrapolation_left,
@@ -1428,15 +1459,16 @@ function CubicHermiteSpline(
         extrapolation, extrapolation_left, extrapolation_right
     )
     u, t = munge_data(u, t)
+    t_props = something(search_properties, FindFirstFunctions.SearchProperties(t))
     p = CubicHermiteParameterCache(du, u, t, cache_parameters)
     A = CubicHermiteSpline(
         du, u, t, nothing, p, extrapolation_left,
-        extrapolation_right, cache_parameters
+        extrapolation_right, cache_parameters, t_props
     )
     I = cumulative_integral(A, cache_parameters)
     return CubicHermiteSpline(
         du, u, t, I, p, extrapolation_left,
-        extrapolation_right, cache_parameters
+        extrapolation_right, cache_parameters, t_props
     )
 end
 
@@ -1509,9 +1541,8 @@ struct QuinticHermiteSpline{uType, tType, IType, duType, dduType, pType, T, prop
     cache_parameters::Bool
     function QuinticHermiteSpline(
             ddu, du, u, t, I, p, extrapolation_left,
-            extrapolation_right, cache_parameters
+            extrapolation_right, cache_parameters, t_props
         )
-        t_props = FindFirstFunctions.SearchProperties(t)
         return new{
             typeof(u), typeof(t), typeof(I), typeof(du),
             typeof(ddu), typeof(p.c₁), eltype(u), typeof(t_props),
@@ -1526,7 +1557,8 @@ function QuinticHermiteSpline(
         ddu, du, u, t; extrapolation::ExtrapolationType.T = ExtrapolationType.None,
         extrapolation_left::ExtrapolationType.T = ExtrapolationType.None,
         extrapolation_right::ExtrapolationType.T = ExtrapolationType.None,
-        cache_parameters = false
+        cache_parameters = false,
+        search_properties::Union{Nothing, FindFirstFunctions.SearchProperties} = nothing
     )
     @assert length(u) == length(du) == length(ddu) "Length of `u` is not equal to length of `du` or `ddu`."
     extrapolation_left,
@@ -1534,15 +1566,16 @@ function QuinticHermiteSpline(
         extrapolation, extrapolation_left, extrapolation_right
     )
     u, t = munge_data(u, t)
+    t_props = something(search_properties, FindFirstFunctions.SearchProperties(t))
     p = QuinticHermiteParameterCache(ddu, du, u, t, cache_parameters)
     A = QuinticHermiteSpline(
         ddu, du, u, t, nothing, p, extrapolation_left,
-        extrapolation_right, cache_parameters
+        extrapolation_right, cache_parameters, t_props
     )
     I = cumulative_integral(A, cache_parameters)
     return QuinticHermiteSpline(
         ddu, du, u, t, I, p, extrapolation_left,
-        extrapolation_right, cache_parameters
+        extrapolation_right, cache_parameters, t_props
     )
 end
 
@@ -1576,9 +1609,8 @@ struct SmoothArcLengthInterpolation{
             u, t, d, shape_itp, Δt_circle_segment, Δt_line_segment,
             center, radius, dir_1, dir_2, short_side_left,
             I, extrapolation_left, extrapolation_right,
-            out, derivative, in_place
+            out, derivative, in_place, t_props
         )
-        t_props = FindFirstFunctions.SearchProperties(t)
         return new{
             typeof(u), typeof(t), typeof(I), eltype(radius),
             eltype(d), typeof(shape_itp), eltype(u), typeof(t_props),
@@ -1830,7 +1862,8 @@ function SmoothArcLengthInterpolation(
         extrapolation_left::ExtrapolationType.T = ExtrapolationType.None,
         extrapolation_right::ExtrapolationType.T = ExtrapolationType.None,
         cache_parameters::Bool = false,
-        in_place::Bool = true
+        in_place::Bool = true,
+        search_properties::Union{Nothing, FindFirstFunctions.SearchProperties} = nothing
     )
     N = size(u, 1)
     n_circle_arcs = size(u, 2) - 1
@@ -1884,9 +1917,11 @@ function SmoothArcLengthInterpolation(
     out = Vector{P}(undef, N)
     derivative = Vector{P}(undef, N)
 
+    t_props = something(search_properties, FindFirstFunctions.SearchProperties(t))
     return SmoothArcLengthInterpolation(
         u, t, d, shape_itp, Δt_circle_segment, Δt_line_segment,
         center, radius, dir_1, dir_2, short_side_left,
-        nothing, extrapolation_left, extrapolation_right, out, derivative, in_place
+        nothing, extrapolation_left, extrapolation_right,
+        out, derivative, in_place, t_props
     )
 end

From ccef1350b29f6c85c5f1bfd5f8f4d083e9a435aa Mon Sep 17 00:00:00 2001
From: ChrisRackauckas-Claude <accounts@chrisrackauckas.com>
Date: Thu, 21 May 2026 16:54:24 -0400
Subject: [PATCH 06/24] Add FastInterpolations.jl to cross-library bench + port
 their advertised bench
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

  - Add `FastInterpolations` as a build/eval target for every supported
    algorithm in `bench/cross_library_comparison.jl`: Linear, CubicSpline,
    QuadraticSpline, Akima, and PCHIP (the last one as "FastInterpolations
    (PCHIP)" alongside the existing PCHIPInterpolation entry).
  - Add `bench/fast_interpolations_bench.jl`, a port of FastInterpolations'
    own `benchmark/interpolation_benchmark.jl` from upstream commit
    `616b106b`. Mimics the fusion-physics matrix-of-interpolants workload
    they advertise on their README: `mpert × mpert` independent
    interpolants on a uniform 1D grid, evaluated at `n_eval` cubic-spaced
    query points. Compares against Interpolations.jl, DataInterpolations.jl,
    Dierckx.jl, and FastInterpolations' `Series` interpolant. CLI matches
    the upstream: `--linear | --quadratic | --cubic | --constant` ×
    `--tiny | --small | --default | --large`.

The bench/Project.toml gains a `FastInterpolations` dep.

Read-only audit — no upstream changes to FastInterpolations.jl.

Co-Authored-By: Chris Rackauckas <accounts@chrisrackauckas.com>
---
 bench/Project.toml                 |   1 +
 bench/cross_library_comparison.jl  |  47 +++-
 bench/fast_interpolations_bench.jl | 383 +++++++++++++++++++++++++++++
 3 files changed, 426 insertions(+), 5 deletions(-)
 create mode 100644 bench/fast_interpolations_bench.jl

diff --git a/bench/Project.toml b/bench/Project.toml
index ba5ab73c..1c541df8 100644
--- a/bench/Project.toml
+++ b/bench/Project.toml
@@ -3,5 +3,6 @@ BasicInterpolators = "26cce99e-4866-4b6d-ab74-862489e035e0"
 BenchmarkTools = "6e4b80f9-dd63-53aa-95a3-0cdb28fa8baf"
 DataInterpolations = "82cc6244-b520-54b8-b5a6-8a565e85f1d0"
 Dierckx = "39dd38d3-220a-591b-8e3c-4c3a8c710a94"
+FastInterpolations = "9ea80cae-fc13-4c00-8066-6eaedb12f34b"
 Interpolations = "a98d9a8b-a2ab-59e6-89dd-64a1c18fca59"
 PCHIPInterpolation = "afe20452-48d1-4729-9a8b-50fb251f06cd"
diff --git a/bench/cross_library_comparison.jl b/bench/cross_library_comparison.jl
index 20eb149e..24bcbc23 100644
--- a/bench/cross_library_comparison.jl
+++ b/bench/cross_library_comparison.jl
@@ -2,7 +2,8 @@
 Cross-library 1D interpolation benchmark for DataInterpolations.jl.
 
 Compares DataInterpolations.jl (PR #529 branch, with cached Auto(t_props)) against
-Interpolations.jl, Dierckx.jl, BasicInterpolators.jl, and PCHIPInterpolation.jl.
+Interpolations.jl, Dierckx.jl, BasicInterpolators.jl, PCHIPInterpolation.jl,
+and FastInterpolations.jl.
 
 Usage:
     julia +1.11 --project=bench bench/cross_library_comparison.jl
@@ -27,12 +28,14 @@ using Interpolations
 using Dierckx
 using BasicInterpolators
 using PCHIPInterpolation
+using FastInterpolations
 
 const DI = DataInterpolations
 const ITP = Interpolations
 const DRX = Dierckx
 const BI = BasicInterpolators
 const PCHIP = PCHIPInterpolation
+const FI = FastInterpolations
 
 const RNG = MersenneTwister(0x00C0FFEE)
 
@@ -127,19 +130,28 @@ build_itp_linear_uniform(u, t) = ITP.linear_interpolation(t, u) # t may be a ran
 build_itp_linear_nonuniform(u, t) = ITP.interpolate((_vec(t),), _vec(u), ITP.Gridded(ITP.Linear()))
 build_drx_linear(u, t) = DRX.Spline1D(_vec(t), _vec(u); k = 1, bc = "extrapolate")
 build_bi_linear(u, t) = BI.LinearInterpolator(_vec(t), _vec(u), BI.WeakBoundaries())
+# FastInterpolations accepts both AbstractRange and Vector; passing the raw `t` so
+# uniform-grid (range) builds keep their O(1) DirectSearch optimization.
+build_fi_linear(u, t) = FI.linear_interp(t, _vec(u))
 
 # --- Cubic spline (natural BC for DI, Interpolations) --------------------
 build_di_cubic(u, t) = DI.CubicSpline(_vec(u), _vec(t))
 build_itp_cubic_uniform(u, t) = ITP.cubic_spline_interpolation(t, u)
 build_drx_cubic(u, t) = DRX.Spline1D(_vec(t), _vec(u); k = 3, bc = "extrapolate")
 build_bi_cubic(u, t) = BI.CubicSplineInterpolator(_vec(t), _vec(u), BI.WeakBoundaries())
+# FastInterpolations cubic: default BC is `CubicFit()` (cubic polynomial fit at
+# endpoints), not natural BC. Numerically different in the boundary cells from
+# DI's natural cubic but matches in the interior — comparable for speed.
+build_fi_cubic(u, t) = FI.cubic_interp(t, _vec(u))
 
 # --- Quadratic spline ----------------------------------------------------
 build_di_quadratic(u, t) = DI.QuadraticSpline(_vec(u), _vec(t))
 build_drx_quadratic(u, t) = DRX.Spline1D(_vec(t), _vec(u); k = 2, bc = "extrapolate")
+build_fi_quadratic(u, t) = FI.quadratic_interp(t, _vec(u))
 
 # --- Akima ---------------------------------------------------------------
 build_di_akima(u, t) = DI.AkimaInterpolation(_vec(u), _vec(t))
+build_fi_akima(u, t) = FI.akima_interp(t, _vec(u))
 
 # --- PCHIP / monotone cubic Hermite -------------------------------------
 function build_di_cubic_hermite(u, t)
@@ -155,6 +167,8 @@ function build_di_cubic_hermite(u, t)
     return DI.CubicHermiteSpline(du, uv, tv)
 end
 build_pchip(u, t) = PCHIP.Interpolator(_vec(t), _vec(u))
+# FastInterpolations PCHIP (Fritsch-Carlson monotone cubic Hermite).
+build_fi_pchip(u, t) = FI.pchip_interp(t, _vec(u))
 
 # --- Single-eval dispatch -----------------------------------------------
 # DI, Dierckx, BasicInterpolators all use `A(x)`
@@ -174,6 +188,8 @@ batched_eval_drx!(out, A::DRX.Spline1D, tt) = (out .= DRX.evaluate.(Ref(A), tt);
 batched_eval_bi!(out, A, tt) = (out .= A.(tt); out)
 # PCHIP: broadcast
 batched_eval_pchip!(out, A, tt) = (out .= A.(tt); out)
+# FastInterpolations: `A(out, xq)` in-place (zero-alloc, with AutoSearch).
+batched_eval_fi!(out, A, tt) = (A(out, tt); out)
 
 # -----------------------------------------------------------------------------
 # Verification: every library should agree on the same query to within tol
@@ -218,6 +234,7 @@ const ALGORITHMS = let
             "Interpolations (gridded)" => build_itp_linear_nonuniform,
             "Dierckx (k=1)" => build_drx_linear,
             "BasicInterpolators" => build_bi_linear,
+            "FastInterpolations" => build_fi_linear,
         ),
         batched! = Dict(
             "DataInterpolations" => batched_eval_di!,
@@ -225,6 +242,7 @@ const ALGORITHMS = let
             "Interpolations (gridded)" => batched_eval_itp!,
             "Dierckx (k=1)" => batched_eval_drx!,
             "BasicInterpolators" => batched_eval_bi!,
+            "FastInterpolations" => batched_eval_fi!,
         ),
         supports = Dict(
             "DataInterpolations" => [:uniform, :nonuniform],
@@ -232,6 +250,7 @@ const ALGORITHMS = let
             "Interpolations (gridded)" => [:uniform, :nonuniform],
             "Dierckx (k=1)" => [:uniform, :nonuniform],
             "BasicInterpolators" => [:uniform, :nonuniform],
+            "FastInterpolations" => [:uniform, :nonuniform],
         ),
     )
     d["CubicSpline"] = (
@@ -240,51 +259,69 @@ const ALGORITHMS = let
             "Interpolations (uniform)" => build_itp_cubic_uniform,
             "Dierckx (k=3)" => build_drx_cubic,
             "BasicInterpolators" => build_bi_cubic,
+            "FastInterpolations" => build_fi_cubic,
         ),
         batched! = Dict(
             "DataInterpolations" => batched_eval_di!,
             "Interpolations (uniform)" => batched_eval_itp!,
             "Dierckx (k=3)" => batched_eval_drx!,
             "BasicInterpolators" => batched_eval_bi!,
+            "FastInterpolations" => batched_eval_fi!,
         ),
         supports = Dict(
             "DataInterpolations" => [:uniform, :nonuniform],
             "Interpolations (uniform)" => [:uniform],
             "Dierckx (k=3)" => [:uniform, :nonuniform],
             "BasicInterpolators" => [:uniform, :nonuniform],
+            "FastInterpolations" => [:uniform, :nonuniform],
         ),
     )
     d["QuadraticSpline"] = (
         builders = Dict(
             "DataInterpolations" => build_di_quadratic,
             "Dierckx (k=2)" => build_drx_quadratic,
+            "FastInterpolations" => build_fi_quadratic,
         ),
         batched! = Dict(
             "DataInterpolations" => batched_eval_di!,
             "Dierckx (k=2)" => batched_eval_drx!,
+            "FastInterpolations" => batched_eval_fi!,
         ),
         supports = Dict(
             "DataInterpolations" => [:uniform, :nonuniform],
             "Dierckx (k=2)" => [:uniform, :nonuniform],
+            "FastInterpolations" => [:uniform, :nonuniform],
         ),
     )
     d["Akima"] = (
-        builders = Dict("DataInterpolations" => build_di_akima),
-        batched! = Dict("DataInterpolations" => batched_eval_di!),
-        supports = Dict("DataInterpolations" => [:uniform, :nonuniform]),
+        builders = Dict(
+            "DataInterpolations" => build_di_akima,
+            "FastInterpolations" => build_fi_akima,
+        ),
+        batched! = Dict(
+            "DataInterpolations" => batched_eval_di!,
+            "FastInterpolations" => batched_eval_fi!,
+        ),
+        supports = Dict(
+            "DataInterpolations" => [:uniform, :nonuniform],
+            "FastInterpolations" => [:uniform, :nonuniform],
+        ),
     )
     d["MonotoneCubic"] = (
         builders = Dict(
             "DataInterpolations (CubicHermite)" => build_di_cubic_hermite,
             "PCHIPInterpolation" => build_pchip,
+            "FastInterpolations (PCHIP)" => build_fi_pchip,
         ),
         batched! = Dict(
             "DataInterpolations (CubicHermite)" => batched_eval_di!,
             "PCHIPInterpolation" => batched_eval_pchip!,
+            "FastInterpolations (PCHIP)" => batched_eval_fi!,
         ),
         supports = Dict(
             "DataInterpolations (CubicHermite)" => [:uniform, :nonuniform],
             "PCHIPInterpolation" => [:uniform, :nonuniform],
+            "FastInterpolations (PCHIP)" => [:uniform, :nonuniform],
         ),
     )
     d
@@ -549,7 +586,7 @@ function write_report(path::String; total_seconds = 0.0)
         println(io, "```")
         deps = Pkg.project().dependencies
         all_info = Pkg.dependencies()
-        for pkg in ("DataInterpolations", "Interpolations", "Dierckx", "BasicInterpolators", "PCHIPInterpolation", "BenchmarkTools")
+        for pkg in ("DataInterpolations", "Interpolations", "Dierckx", "BasicInterpolators", "PCHIPInterpolation", "FastInterpolations", "BenchmarkTools")
             if haskey(deps, pkg)
                 v = all_info[deps[pkg]].version
                 println(io, "  ", pkg, " ", v)
diff --git a/bench/fast_interpolations_bench.jl b/bench/fast_interpolations_bench.jl
new file mode 100644
index 00000000..d05307fe
--- /dev/null
+++ b/bench/fast_interpolations_bench.jl
@@ -0,0 +1,383 @@
+#=
+FastInterpolations.jl benchmark, ported from their `benchmark/interpolation_benchmark.jl`
+(`ProjectTorreyPines/FastInterpolations.jl`, commit 616b106b at the time of import).
+
+This is the comparison they advertise on their README:
+  - Compares Interpolations.jl, DataInterpolations.jl, FastInterpolations.jl (+ their
+    Series interpolant), and Dierckx.jl.
+  - Workload: `mpert × mpert` independent 1D interpolants over the same uniform
+    `range(0.0, 1.0; length = npsi)` grid, evaluated at `n_eval` query points clustered
+    near psi = 0 (cubic spacing). Mimics fusion-physics matrix-of-interpolants workloads.
+  - Default config (matching their `--default`): `npsi = 64`, `mpert = 100` → 10_000
+    interpolants per package, `n_eval = 1000` query points → 10⁷ total scalar evaluations.
+
+Usage:
+    julia +1.11 --project=bench bench/fast_interpolations_bench.jl
+    julia +1.11 --project=bench bench/fast_interpolations_bench.jl --linear --small
+    julia +1.11 --project=bench bench/fast_interpolations_bench.jl --cubic --default
+
+This emits stdout-only output (no markdown report). The numbers feed the comparison
+table in `bench/cross_library_comparison.md`.
+=#
+
+import Pkg
+const BENCH_DIR = @__DIR__
+Pkg.activate(BENCH_DIR)
+
+using BenchmarkTools
+using Interpolations
+using DataInterpolations
+using FastInterpolations
+using Dierckx
+using Random
+using Printf
+using Statistics
+
+const SIZE_PRESETS = Dict(
+    :tiny => (16, 2, 5),
+    :small => (64, 5, 100),
+    :default => (64, 100, 1000),
+    :large => (64, 200, 4000),
+)
+
+const METHOD_OPTIONS = [:constant, :linear, :quadratic, :cubic]
+
+function parse_args(args)
+    size_key = :default
+    method_key = :cubic
+    for arg in args
+        if startswith(arg, "--")
+            key = Symbol(arg[3:end])
+            if haskey(SIZE_PRESETS, key)
+                size_key = key
+            elseif key in METHOD_OPTIONS
+                method_key = key
+            end
+        end
+    end
+    return size_key, method_key
+end
+
+const (SIZE_KEY, METHOD_KEY) = parse_args(ARGS)
+const (NPSI, MPERT, N_EVAL_POINTS) = SIZE_PRESETS[SIZE_KEY]
+
+function generate_test_data(npsi::Int, mpert::Int; seed::Int = 42)
+    Random.seed!(seed)
+    psi_grid = range(0.0, 1.0, length = npsi)
+    data = rand(npsi, mpert, mpert)
+    return psi_grid, data
+end
+
+function generate_evaluation_points(n_points::Int)
+    return collect(range(0.0, 1.0, length = n_points)) .^ 3
+end
+
+# ---- Interpolations.jl -----------------------------------------------------
+function init_interpolations(::Val{:linear}, psi_grid::AbstractRange, data::Array{Float64, 3})
+    _, mpert, _ = size(data)
+    first_itp = Interpolations.linear_interpolation(psi_grid, data[:, 1, 1])
+    interps = Matrix{typeof(first_itp)}(undef, mpert, mpert)
+    interps[1, 1] = first_itp
+    for m1 in 1:mpert, m2 in 1:mpert
+        (m1 == 1 && m2 == 1) && continue
+        interps[m1, m2] = Interpolations.linear_interpolation(psi_grid, data[:, m1, m2])
+    end
+    return interps
+end
+
+function init_interpolations(::Val{:cubic}, psi_grid::AbstractRange, data::Array{Float64, 3})
+    _, mpert, _ = size(data)
+    first_itp = Interpolations.cubic_spline_interpolation(psi_grid, data[:, 1, 1])
+    interps = Matrix{typeof(first_itp)}(undef, mpert, mpert)
+    interps[1, 1] = first_itp
+    for m1 in 1:mpert, m2 in 1:mpert
+        (m1 == 1 && m2 == 1) && continue
+        interps[m1, m2] = Interpolations.cubic_spline_interpolation(psi_grid, data[:, m1, m2])
+    end
+    return interps
+end
+
+function init_interpolations(::Val{:constant}, psi_grid::AbstractRange, data::Array{Float64, 3})
+    _, mpert, _ = size(data)
+    first_itp = Interpolations.constant_interpolation(psi_grid, data[:, 1, 1])
+    interps = Matrix{typeof(first_itp)}(undef, mpert, mpert)
+    interps[1, 1] = first_itp
+    for m1 in 1:mpert, m2 in 1:mpert
+        (m1 == 1 && m2 == 1) && continue
+        interps[m1, m2] = Interpolations.constant_interpolation(psi_grid, data[:, m1, m2])
+    end
+    return interps
+end
+
+function init_interpolations(::Val{:quadratic}, psi_grid::AbstractRange, data::Array{Float64, 3})
+    _, mpert, _ = size(data)
+    knots = (psi_grid,)
+    first_itp = Interpolations.extrapolate(
+        Interpolations.scale(
+            Interpolations.interpolate(
+                data[:, 1, 1],
+                Interpolations.BSpline(Interpolations.Quadratic(Interpolations.Reflect(Interpolations.OnCell()))),
+            ),
+            knots,
+        ),
+        Interpolations.Throw(),
+    )
+    interps = Matrix{typeof(first_itp)}(undef, mpert, mpert)
+    interps[1, 1] = first_itp
+    for m1 in 1:mpert, m2 in 1:mpert
+        (m1 == 1 && m2 == 1) && continue
+        interps[m1, m2] = Interpolations.extrapolate(
+            Interpolations.scale(
+                Interpolations.interpolate(
+                    data[:, m1, m2],
+                    Interpolations.BSpline(Interpolations.Quadratic(Interpolations.Reflect(Interpolations.OnCell()))),
+                ),
+                knots,
+            ),
+            Interpolations.Throw(),
+        )
+    end
+    return interps
+end
+
+# Scalar-loop and broadcast evaluators
+function eval_interpolations!(A, interps, psi)
+    @inbounds for m2 in axes(interps, 2), m1 in axes(interps, 1)
+        A[m1, m2] = interps[m1, m2](psi)
+    end
+    return A
+end
+
+run_interpolations_loop!(A, interps, psis) = (
+    for psi in psis
+        eval_interpolations!(A, interps, psi)
+    end; A
+)
+function run_interpolations_broadcast!(A_all, interps, psis)
+    @inbounds for m2 in axes(interps, 2), m1 in axes(interps, 1)
+        @. A_all[:, m1, m2] = interps[m1, m2](psis)
+    end
+    return A_all
+end
+
+# ---- FastInterpolations.jl -----------------------------------------------
+const FI_INIT_TABLE = Dict(
+    :linear => FastInterpolations.linear_interp,
+    :cubic => FastInterpolations.cubic_interp,
+    :quadratic => FastInterpolations.quadratic_interp,
+    :constant => FastInterpolations.constant_interp,
+)
+
+function init_fi(method::Symbol, psi_grid, data::Array{Float64, 3})
+    f = FI_INIT_TABLE[method]
+    _, mpert, _ = size(data)
+    first_itp = f(psi_grid, data[:, 1, 1])
+    interps = Matrix{typeof(first_itp)}(undef, mpert, mpert)
+    interps[1, 1] = first_itp
+    for m1 in 1:mpert, m2 in 1:mpert
+        (m1 == 1 && m2 == 1) && continue
+        interps[m1, m2] = f(psi_grid, data[:, m1, m2])
+    end
+    return interps
+end
+
+function eval_fi!(A, interps, psi)
+    @inbounds for m2 in axes(interps, 2), m1 in axes(interps, 1)
+        A[m1, m2] = interps[m1, m2](psi)
+    end
+    return A
+end
+
+run_fi_loop!(A, interps, psis) = (
+    for psi in psis
+        eval_fi!(A, interps, psi)
+    end; A
+)
+function run_fi_vector!(A_all, interps, psis)
+    @inbounds for m2 in axes(interps, 2), m1 in axes(interps, 1)
+        @views interps[m1, m2](A_all[:, m1, m2], psis)
+    end
+    return A_all
+end
+
+# Series API (one anchor per query, shared across series)
+function init_fi_series(method::Symbol, psi_grid, data::Array{Float64, 3})
+    f = FI_INIT_TABLE[method]
+    _, mpert, _ = size(data)
+    ys = Series([data[:, m1, m2] for m2 in 1:mpert for m1 in 1:mpert])
+    return f(psi_grid, ys)
+end
+
+run_fi_series_loop!(A, sitp, psis) = (
+    for psi in psis
+        sitp(A, psi)
+    end; A
+)
+run_fi_series_vector!(A_all, sitp, psis) = (sitp(A_all, psis); A_all)
+
+# ---- DataInterpolations.jl -----------------------------------------------
+const DI_INIT_TABLE = Dict(
+    :linear => DataInterpolations.LinearInterpolation,
+    :cubic => DataInterpolations.CubicSpline,
+    :quadratic => DataInterpolations.QuadraticInterpolation,
+    :constant => DataInterpolations.ConstantInterpolation,
+)
+
+function init_di(method::Symbol, psi_grid, data::Array{Float64, 3})
+    f = DI_INIT_TABLE[method]
+    _, mpert, _ = size(data)
+    t = collect(psi_grid)
+    first_itp = f(data[:, 1, 1], t)
+    interps = Matrix{typeof(first_itp)}(undef, mpert, mpert)
+    interps[1, 1] = first_itp
+    for m1 in 1:mpert, m2 in 1:mpert
+        (m1 == 1 && m2 == 1) && continue
+        interps[m1, m2] = f(data[:, m1, m2], t)
+    end
+    return interps
+end
+
+eval_di!(A, interps, psi) = (
+    @inbounds for m2 in axes(interps, 2), m1 in axes(interps, 1)
+        A[m1, m2] = interps[m1, m2](psi)
+    end; A
+)
+run_di_loop!(A, interps, psis) = (
+    for psi in psis
+        eval_di!(A, interps, psi)
+    end; A
+)
+function run_di_vector!(A_all, interps, psis)
+    @inbounds for m2 in axes(interps, 2), m1 in axes(interps, 1)
+        @views interps[m1, m2](A_all[:, m1, m2], psis)
+    end
+    return A_all
+end
+
+# ---- Dierckx.jl ---------------------------------------------------------
+function init_dierckx(method::Symbol, psi_grid, data::Array{Float64, 3})
+    method == :constant && return nothing  # Dierckx has no k=0
+    k = Dict(:linear => 1, :quadratic => 2, :cubic => 3)[method]
+    _, mpert, _ = size(data)
+    t = collect(psi_grid)
+    first_itp = Dierckx.Spline1D(t, data[:, 1, 1]; k = k, s = 0.0)
+    interps = Matrix{typeof(first_itp)}(undef, mpert, mpert)
+    interps[1, 1] = first_itp
+    for m1 in 1:mpert, m2 in 1:mpert
+        (m1 == 1 && m2 == 1) && continue
+        interps[m1, m2] = Dierckx.Spline1D(t, data[:, m1, m2]; k = k, s = 0.0)
+    end
+    return interps
+end
+
+eval_dierckx!(A, interps, psi) = (
+    @inbounds for m2 in axes(interps, 2), m1 in axes(interps, 1)
+        A[m1, m2] = interps[m1, m2](psi)
+    end; A
+)
+run_dierckx_loop!(A, interps, psis) = (
+    for psi in psis
+        eval_dierckx!(A, interps, psi)
+    end; A
+)
+function run_dierckx_vector!(A_all, interps, psis)
+    @inbounds for m2 in axes(interps, 2), m1 in axes(interps, 1)
+        @views A_all[:, m1, m2] .= interps[m1, m2](psis)
+    end
+    return A_all
+end
+
+# ---- Driver ----------------------------------------------------------------
+function bench_one(label, f; samples = 5, evals = 2, seconds = 120)
+    f()  # warm-up
+    GC.gc()
+    b = @benchmark $f() samples = samples evals = evals seconds = seconds
+    return median(b).time / 1.0e6   # ms
+end
+
+function run_fi_bench()
+    method = METHOD_KEY
+    psi_grid, data = generate_test_data(NPSI, MPERT)
+    psis = generate_evaluation_points(N_EVAL_POINTS)
+    n_interps = MPERT * MPERT
+    total_evals = N_EVAL_POINTS * n_interps
+
+    println("="^80)
+    println("FastInterpolations.jl-style benchmark · method=$(method) · npsi=$(NPSI), mpert=$(MPERT), n_eval=$(N_EVAL_POINTS)")
+    println("Reproducing `ProjectTorreyPines/FastInterpolations.jl/benchmark/interpolation_benchmark.jl`")
+    println("="^80)
+    println()
+
+    A = Matrix{Float64}(undef, MPERT, MPERT)
+    A_all = Array{Float64, 3}(undef, N_EVAL_POINTS, MPERT, MPERT)
+    A_series = Vector{Float64}(undef, n_interps)
+    A_series_all = [Vector{Float64}(undef, N_EVAL_POINTS) for _ in 1:n_interps]
+
+    results = Dict{String, Tuple{Float64, Float64}}()  # name => (init_ms, eval_ms)
+
+    function report(name, init_ms, eval_ms)
+        results[name] = (init_ms, eval_ms)
+        total = init_ms + eval_ms
+        evs = total_evals / (eval_ms / 1.0e3)
+        return @printf("  %-44s  init %8.3f ms  eval %8.3f ms  total %8.3f ms  evals/s %.2e\n", name, init_ms, eval_ms, total, evs)
+    end
+
+    # Interpolations.jl
+    init_ms = bench_one("ITP init", () -> init_interpolations(Val(method), psi_grid, data))
+    itp_interps = init_interpolations(Val(method), psi_grid, data)
+    eval_ms = bench_one("ITP scalar", () -> run_interpolations_loop!(A, itp_interps, psis))
+    report("Interpolations.jl (scalar)", init_ms, eval_ms)
+    eval_ms = bench_one("ITP broadcast", () -> run_interpolations_broadcast!(A_all, itp_interps, psis))
+    report("Interpolations.jl (broadcast)", init_ms, eval_ms)
+
+    # FastInterpolations.jl
+    init_ms = bench_one("FI init", () -> init_fi(method, psi_grid, data))
+    fi_interps = init_fi(method, psi_grid, data)
+    eval_ms = bench_one("FI scalar", () -> run_fi_loop!(A, fi_interps, psis))
+    report("FastInterpolations.jl (scalar)", init_ms, eval_ms)
+    eval_ms = bench_one("FI vector", () -> run_fi_vector!(A_all, fi_interps, psis))
+    report("FastInterpolations.jl (vector)", init_ms, eval_ms)
+
+    # FastInterpolations Series
+    init_ms = bench_one("FI Series init", () -> init_fi_series(method, psi_grid, data))
+    sitp = init_fi_series(method, psi_grid, data)
+    eval_ms = bench_one("FI Series scalar", () -> run_fi_series_loop!(A_series, sitp, psis))
+    report("FastInterpolations.jl (Series+scalar)", init_ms, eval_ms)
+    eval_ms = bench_one("FI Series vector", () -> run_fi_series_vector!(A_series_all, sitp, psis))
+    report("FastInterpolations.jl (Series+vector)", init_ms, eval_ms)
+
+    # DataInterpolations.jl
+    init_ms = bench_one("DI init", () -> init_di(method, psi_grid, data))
+    di_interps = init_di(method, psi_grid, data)
+    eval_ms = bench_one("DI scalar", () -> run_di_loop!(A, di_interps, psis))
+    report("DataInterpolations.jl (scalar)", init_ms, eval_ms)
+    eval_ms = bench_one("DI vector", () -> run_di_vector!(A_all, di_interps, psis))
+    report("DataInterpolations.jl (vector)", init_ms, eval_ms)
+
+    # Dierckx (if applicable)
+    if method != :constant
+        init_ms = bench_one("Dierckx init", () -> init_dierckx(method, psi_grid, data))
+        drx_interps = init_dierckx(method, psi_grid, data)
+        eval_ms = bench_one("Dierckx scalar", () -> run_dierckx_loop!(A, drx_interps, psis))
+        report("Dierckx.jl (scalar)", init_ms, eval_ms)
+        eval_ms = bench_one("Dierckx vector", () -> run_dierckx_vector!(A_all, drx_interps, psis))
+        report("Dierckx.jl (vector)", init_ms, eval_ms)
+    end
+
+    # Summary
+    println()
+    println("="^80)
+    println("Summary: speedup vs DataInterpolations.jl (scalar)")
+    println("="^80)
+    baseline_total = sum(results["DataInterpolations.jl (scalar)"])
+    @printf("  %-44s  %10s  %10s  %10s  %s\n", "Package", "Init (ms)", "Eval (ms)", "Total (ms)", "Speedup")
+    for (name, (init_ms, eval_ms)) in sort(collect(results); by = x -> sum(x[2]))
+        total = init_ms + eval_ms
+        @printf("  %-44s  %10.3f  %10.3f  %10.3f  %.2fx\n", name, init_ms, eval_ms, total, baseline_total / total)
+    end
+    println()
+
+    return results
+end
+
+run_fi_bench()

From 6a5f7e96357c430cad50c621101de4c944e99b1d Mon Sep 17 00:00:00 2001
From: ChrisRackauckas-Claude <accounts@chrisrackauckas.com>
Date: Thu, 21 May 2026 16:59:30 -0400
Subject: [PATCH 07/24] Update cross-library bench with FastInterpolations
 results + findings
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Full sweep (4.4 min, n ∈ {100, 1k, 10k, 100k}, m ∈ {1, 10, 1k, 100k},
both uniform and non-uniform grids) regenerated with FastInterpolations
included. Plus a `FastInterpolations.jl advertised benchmark` section
running the matrix-of-interpolants workload they publish on their README
(cubic spline + linear at npsi=64, mpert=100, n_eval=1000), and a
`Findings` section explaining where FastInterpolations beats DI, where DI
matches, and which gaps are out of scope for this PR.

Summary of findings:
  - FastInterpolations.jl Series API is 70-100× faster on matrix-of-
    interpolants workloads — they compute the cell anchor once per query
    and reuse it across thousands of coefficient series. No equivalent in
    DI; would need a separate `SeriesInterpolation` type proposal.
  - Per-query scalar latency on `Vector{Float64}` grids: DI ~100-200 ns,
    FI ~50 ns. The gap is `Auto(props)` dispatch overhead vs FI's direct
    `_search_direct(::_CachedRange, q)` (which compiles to ~3 instructions).
    Closeable in a follow-up by resolving Auto to a concrete strategy at
    construction time.
  - Non-uniform CubicSpline/Akima construction: DI within ~30% of FI at
    n ≥ 10k thanks to the O(n) `spline_coefficients!` fix on this branch.
  - Sorted-batch on non-uniform: DI competitive at large m.

Co-Authored-By: Chris Rackauckas <accounts@chrisrackauckas.com>
---
 bench/cross_library_comparison.md | 290 +++++++++++++++++++++---------
 1 file changed, 201 insertions(+), 89 deletions(-)

diff --git a/bench/cross_library_comparison.md b/bench/cross_library_comparison.md
index b964581d..0d98f8d5 100644
--- a/bench/cross_library_comparison.md
+++ b/bench/cross_library_comparison.md
@@ -17,7 +17,7 @@ Threads: 1 default, 0 interactive, 1 GC (on 128 virtual cores)
 
 Bench harness: `BenchmarkTools.@benchmark` with `evals=1`, max samples=100, max seconds=0.5.
 
-Commit: `e22f5d6a6fa8d72079b33209b910b9504c4cadde`
+Commit: `3ce1080447eb29b4f51ef363bbad4129e00b176a`
 
 Library versions:
 ```
@@ -26,28 +26,11 @@ Library versions:
   Dierckx 0.5.4
   BasicInterpolators 0.7.1
   PCHIPInterpolation 0.2.1
+  FastInterpolations 0.4.11
   BenchmarkTools 1.8.0
 ```
 
-Total bench time: 353.5 s
-
-## Headline findings
-
-These numbers are taken directly from the tables below. All cells are medians from `BenchmarkTools.@benchmark evals=1` runs.
-
-- **Sorted-batch + cached `Auto(t_props)` is DI's biggest cross-library win.** At cubic spline n=100 000, m=100 000 (sorted batch, uniform knots), DI evaluates in **1.78 ms** vs Dierckx 3.16 s (~**1 770× faster**), BasicInterpolators 7.94 ms (~**4.5× faster**), and PCHIP at n=100k m=100k (sorted) 9.70 ms (~**5.3× faster** for monotone cubic). The only library that beats DI on this row is **Interpolations.jl's uniform constructor (2.06 ms, ~16% faster)** because it uses O(1) uniform-grid index lookup; DI still wins against every non-uniform-capable competitor. At linear n=100k m=100k sorted batch, DI is **1.64 ms** vs Dierckx 3.18 s (~**1 940×**) and BasicInterpolators 7.89 ms (~**4.8×**).
-
-- **`Auto(t_props)` also dominates the random / unsorted-batch case** because the cached search-property is re-used on every evaluation, not re-probed. At cubic n=100k m=100k *random* batch, DI is **6.87 ms** vs Dierckx 3.15 s (~**460×**), BasicInterpolators 19.8 ms (~**2.9×**); Interpolations(uniform) is still ahead at 2.06 ms (O(1) index). Even at random unsorted access, DI competes with — and on every non-uniform library beats — the alternatives.
-
-- **DI wins the chained ODE-style case decisively at large n.** Cubic spline, n=100k, m=1000 monotone chain: DI **69.6 μs** vs Dierckx 31.5 ms (~**450×**), BasicInterpolators 137 μs (~**2.0×**). MonotoneCubic chained, n=100k m=1000: DI 71.9 μs vs PCHIPInterpolation 149 μs (~**2.1×**). This is exactly the workload DI's `iguesser` was designed for; libraries without hint-chaining (Dierckx, BasicInterpolators, PCHIP) lose by ~2× to ~450×.
-
-- **Where DI loses on small m or single-eval:** single-query cubic at n=100k is 80 ns (DI) vs 50 ns (BasicInterpolators) and 70 ns (Interpolations uniform) — within ~1.5×, but consistently slightly slower because DI does a real index lookup whereas the others can use a one-shot uniform divide. At `sorted batch m=10 / n=10000` linear, DI is 500 ns vs Interpolations(uniform) 120 ns (4×) because DI's sorted-batch fast-path uses an O(m log n) per-element bisect plus allocates a small idx buffer; at this very small m the buffer alloc overhead dominates.
-
-- **DI QuadraticSpline is a clear loser, by ~2-5× across the board.** At n=100k construction DI takes **7.0 s** vs Dierckx 13.9 ms (~**500× slower**). At n=10k construction DI is 65.7 ms vs Dierckx 1.37 ms (~48×). Inspection traces this to `quadratic_spline_params` calling `spline_coefficients!` which does `findfirst(x -> x > u, k)` — a linear scan inside a loop over `n` knots, making the QuadraticSpline constructor **O(n²)**. The QuadraticSpline single-query at n=100k is also 60-110 μs (vs Dierckx 13-55 μs) and the batched evaluators at n=100k m=100k cost 7.0 s (vs Dierckx 3.2 s). This is the most actionable finding in the entire report.
-
-- **DI CubicHermiteSpline (used here as PCHIP analogue) beats PCHIPInterpolation.jl on every batched cell.** Sorted batch n=100k m=100k: DI 1.83 ms vs PCHIP 9.70 ms (~5.3×). Random batch n=100k m=100k: DI 7.28 ms vs PCHIP 20.4 ms (~2.8×). Chained n=100k m=1000: DI 72 μs vs PCHIP 149 μs (~2.1×). Construction is also slightly faster across all n.
-
-- **`Interpolations.jl`'s `cubic_spline_interpolation` / `linear_interpolation` over a `range` is the ceiling we're chasing on uniform data.** Because it does O(1) index lookup, it beats DI on every uniform-grid case where the lookup cost dominates: linear n=100k single-query 60 ns (DI 80 ns), linear sorted-batch n=100k m=100k 658 μs (DI 1.64 ms, ~2.5×), cubic sorted-batch n=100k m=100k 2.06 ms (DI 1.78 ms — DI wins here). It cannot handle non-uniform cubic at all; it falls back to `Gridded(Linear)` only. So the comparison is really "DI generalised to non-uniform & O(log n) lookup" vs "Interpolations specialised to uniform & O(1) lookup."
+Total bench time: 261.4 s
 
 ## Construction time
 
@@ -57,40 +40,45 @@ Rows = library, columns = (n, knot pattern). Values = median wall time (IQR).
 
 | Library | n=100,nonuniform | n=100,uniform | n=1000,nonuniform | n=1000,uniform | n=10000,nonuniform | n=10000,uniform | n=100000,nonuniform | n=100000,uniform | 
 |---|---|---|---|---|---|---|---|---|
-| DataInterpolations | 2.195 μs (IQR 320.000 ns) | 2.285 μs (IQR 427.500 ns) | 31.189 μs (IQR 4.425 μs) | 44.820 μs (IQR 6.655 μs) | 117.964 μs (IQR 1.608 μs) | 182.268 μs (IQR 233.136 μs) | 1.203 ms (IQR 55.989 μs) | 1.269 ms (IQR 42.470 μs) | 
+| DataInterpolations | 1.895 μs (IQR 267.500 ns) | 1.935 μs (IQR 255.000 ns) | 12.340 μs (IQR 552.500 ns) | 13.625 μs (IQR 31.997 μs) | 96.769 μs (IQR 892.500 ns) | 105.959 μs (IQR 160.974 μs) | 966.061 μs (IQR 2.906 ms) | 1.065 ms (IQR 2.945 ms) | 
+| FastInterpolations | 1.320 μs (IQR 422.500 ns) | 990.000 ns (IQR 310.000 ns) | 10.680 μs (IQR 39.707 μs) | 29.840 μs (IQR 7.692 μs) | 69.779 μs (IQR 424.373 μs) | 173.559 μs (IQR 78.677 μs) | 680.669 μs (IQR 35.064 μs) | 673.078 μs (IQR 25.835 μs) | 
 
 ### CubicSpline
 
 | Library | n=100,nonuniform | n=100,uniform | n=1000,nonuniform | n=1000,uniform | n=10000,nonuniform | n=10000,uniform | n=100000,nonuniform | n=100000,uniform | 
 |---|---|---|---|---|---|---|---|---|
-| DataInterpolations | 7.450 μs (IQR 3.060 μs) | 6.880 μs (IQR 675.000 ns) | 56.620 μs (IQR 3.062 μs) | 60.729 μs (IQR 26.519 μs) | 507.370 μs (IQR 9.600 μs) | 580.565 μs (IQR 948.358 μs) | 5.510 ms (IQR 1.113 ms) | 5.229 ms (IQR 863.691 μs) | 
-| BasicInterpolators | 4.305 μs (IQR 542.500 ns) | 4.430 μs (IQR 475.000 ns) | 37.569 μs (IQR 2.132 μs) | 39.330 μs (IQR 4.598 μs) | 714.473 μs (IQR 401.371 μs) | 1.025 ms (IQR 714.324 μs) | 3.287 ms (IQR 894.667 μs) | 3.315 ms (IQR 848.164 μs) | 
-| Dierckx (k=3) | 17.674 μs (IQR 739.250 ns) | 17.600 μs (IQR 1.215 μs) | 208.738 μs (IQR 51.890 μs) | 212.863 μs (IQR 6.742 μs) | 1.608 ms (IQR 84.278 μs) | 1.745 ms (IQR 548.674 μs) | 17.461 ms (IQR 6.682 ms) | 18.954 ms (IQR 6.357 ms) | 
-| Interpolations (uniform) | — | 15.274 μs (IQR 734.250 ns) | — | 137.884 μs (IQR 19.681 μs) | — | 1.442 ms (IQR 464.458 μs) | — | 8.195 ms (IQR 134.718 μs) | 
+| DataInterpolations | 6.930 μs (IQR 3.364 μs) | 7.170 μs (IQR 3.487 μs) | 55.215 μs (IQR 1.649 μs) | 57.094 μs (IQR 44.369 μs) | 482.461 μs (IQR 3.031 μs) | 495.015 μs (IQR 981.821 μs) | 5.001 ms (IQR 2.172 ms) | 5.070 ms (IQR 893.747 μs) | 
+| BasicInterpolators | 4.340 μs (IQR 530.000 ns) | 4.385 μs (IQR 722.500 ns) | 37.880 μs (IQR 1.177 μs) | 39.015 μs (IQR 2.552 μs) | 319.082 μs (IQR 3.510 μs) | 1.021 ms (IQR 696.255 μs) | 3.258 ms (IQR 864.505 μs) | 3.324 ms (IQR 835.567 μs) | 
+| Dierckx (k=3) | 23.020 μs (IQR 1.680 μs) | 17.440 μs (IQR 495.000 ns) | 209.343 μs (IQR 50.807 μs) | 211.203 μs (IQR 27.988 μs) | 1.582 ms (IQR 93.580 μs) | 1.723 ms (IQR 687.644 μs) | 18.212 ms (IQR 5.298 ms) | 20.038 ms (IQR 5.815 ms) | 
+| FastInterpolations | 1.760 μs (IQR 285.000 ns) | 1.400 μs (IQR 235.000 ns) | 14.395 μs (IQR 495.000 ns) | 11.440 μs (IQR 515.000 ns) | 128.024 μs (IQR 1.032 μs) | 101.614 μs (IQR 1.115 μs) | 1.280 ms (IQR 242.824 μs) | 1.010 ms (IQR 29.291 μs) | 
+| Interpolations (uniform) | — | 15.339 μs (IQR 1.022 μs) | — | 130.319 μs (IQR 9.140 μs) | — | 1.470 ms (IQR 311.781 μs) | — | 8.529 ms (IQR 384.982 μs) | 
 
 ### Linear
 
 | Library | n=100,nonuniform | n=100,uniform | n=1000,nonuniform | n=1000,uniform | n=10000,nonuniform | n=10000,uniform | n=100000,nonuniform | n=100000,uniform | 
 |---|---|---|---|---|---|---|---|---|
-| DataInterpolations | 1.260 μs (IQR 185.000 ns) | 1.450 μs (IQR 267.500 ns) | 10.200 μs (IQR 320.250 ns) | 11.110 μs (IQR 354.250 ns) | 92.584 μs (IQR 826.750 ns) | 101.064 μs (IQR 967.500 ns) | 930.192 μs (IQR 9.795 μs) | 998.760 μs (IQR 7.260 μs) | 
-| BasicInterpolators | 1.190 μs (IQR 212.500 ns) | 1.290 μs (IQR 235.000 ns) | 7.905 μs (IQR 505.000 ns) | 8.960 μs (IQR 1.292 μs) | 59.559 μs (IQR 1.714 μs) | 67.840 μs (IQR 1.940 μs) | 594.784 μs (IQR 9.875 μs) | 671.909 μs (IQR 10.883 μs) | 
-| Dierckx (k=1) | 11.919 μs (IQR 2.472 μs) | 12.485 μs (IQR 1.991 μs) | 79.025 μs (IQR 2.056 μs) | 108.474 μs (IQR 14.793 μs) | 790.987 μs (IQR 114.966 μs) | 1.019 ms (IQR 266.517 μs) | 7.557 ms (IQR 622.339 μs) | 7.581 ms (IQR 727.211 μs) | 
-| Interpolations (gridded) | 940.000 ns (IQR 162.500 ns) | 1.030 μs (IQR 222.500 ns) | 7.580 μs (IQR 537.250 ns) | 11.495 μs (IQR 10.139 μs) | 64.489 μs (IQR 977.500 ns) | 147.218 μs (IQR 76.435 μs) | 630.804 μs (IQR 14.617 μs) | 723.713 μs (IQR 18.942 μs) | 
-| Interpolations (uniform) | — | 215.000 ns (IQR 142.500 ns) | — | 3.204 μs (IQR 1.998 μs) | — | 22.045 μs (IQR 4.760 μs) | — | 75.369 μs (IQR 8.617 μs) | 
+| DataInterpolations | 905.000 ns (IQR 250.000 ns) | 1.030 μs (IQR 162.500 ns) | 7.020 μs (IQR 412.500 ns) | 7.835 μs (IQR 300.250 ns) | 60.794 μs (IQR 1.147 μs) | 69.284 μs (IQR 679.750 ns) | 602.635 μs (IQR 3.941 μs) | 684.534 μs (IQR 5.035 μs) | 
+| BasicInterpolators | 1.170 μs (IQR 350.000 ns) | 1.320 μs (IQR 262.500 ns) | 8.145 μs (IQR 600.000 ns) | 9.035 μs (IQR 1.195 μs) | 61.674 μs (IQR 2.082 μs) | 70.815 μs (IQR 2.756 μs) | 610.510 μs (IQR 9.142 μs) | 696.798 μs (IQR 5.480 μs) | 
+| Dierckx (k=1) | 9.309 μs (IQR 580.000 ns) | 12.405 μs (IQR 2.297 μs) | 79.575 μs (IQR 2.900 μs) | 106.234 μs (IQR 10.303 μs) | 764.703 μs (IQR 21.014 μs) | 764.083 μs (IQR 13.045 μs) | 7.486 ms (IQR 1.087 ms) | 7.568 ms (IQR 922.522 μs) | 
+| FastInterpolations | 1.015 μs (IQR 402.500 ns) | 330.000 ns (IQR 212.500 ns) | 7.410 μs (IQR 2.632 μs) | 2.100 μs (IQR 347.500 ns) | 45.944 μs (IQR 3.295 μs) | 15.395 μs (IQR 1.893 μs) | 429.641 μs (IQR 24.649 μs) | 137.569 μs (IQR 2.454 μs) | 
+| Interpolations (gridded) | 875.000 ns (IQR 245.000 ns) | 970.000 ns (IQR 245.000 ns) | 7.385 μs (IQR 477.500 ns) | 9.085 μs (IQR 9.578 μs) | 60.604 μs (IQR 1.885 μs) | 69.745 μs (IQR 1.954 μs) | 596.539 μs (IQR 5.037 μs) | 682.029 μs (IQR 5.189 μs) | 
+| Interpolations (uniform) | — | 165.000 ns (IQR 165.000 ns) | — | 3.040 μs (IQR 2.235 μs) | — | 23.445 μs (IQR 5.530 μs) | — | 68.814 μs (IQR 2.921 μs) | 
 
 ### MonotoneCubic
 
 | Library | n=100,nonuniform | n=100,uniform | n=1000,nonuniform | n=1000,uniform | n=10000,nonuniform | n=10000,uniform | n=100000,nonuniform | n=100000,uniform | 
 |---|---|---|---|---|---|---|---|---|
-| DataInterpolations (CubicHermite) | 1.400 μs (IQR 222.500 ns) | 1.545 μs (IQR 292.500 ns) | 10.195 μs (IQR 500.000 ns) | 11.000 μs (IQR 448.250 ns) | 87.144 μs (IQR 975.250 ns) | 94.999 μs (IQR 670.000 ns) | 868.637 μs (IQR 11.227 μs) | 953.866 μs (IQR 14.377 μs) | 
-| PCHIPInterpolation | 1.660 μs (IQR 420.000 ns) | 1.780 μs (IQR 452.500 ns) | 13.255 μs (IQR 960.500 ns) | 14.490 μs (IQR 1.624 μs) | 109.594 μs (IQR 1.990 μs) | 116.719 μs (IQR 1.327 μs) | 1.092 ms (IQR 21.902 μs) | 1.181 ms (IQR 35.152 μs) | 
+| DataInterpolations (CubicHermite) | 1.210 μs (IQR 245.000 ns) | 1.260 μs (IQR 312.500 ns) | 8.205 μs (IQR 472.500 ns) | 8.970 μs (IQR 552.500 ns) | 66.989 μs (IQR 899.500 ns) | 155.944 μs (IQR 2.865 μs) | 667.664 μs (IQR 11.177 μs) | 760.448 μs (IQR 1.507 ms) | 
+| FastInterpolations (PCHIP) | 1.980 μs (IQR 395.000 ns) | 1.245 μs (IQR 262.500 ns) | 15.105 μs (IQR 837.500 ns) | 10.855 μs (IQR 550.000 ns) | 116.039 μs (IQR 425.011 μs) | 93.414 μs (IQR 1.335 μs) | 1.148 ms (IQR 64.792 μs) | 925.542 μs (IQR 1.909 ms) | 
+| PCHIPInterpolation | 1.590 μs (IQR 302.500 ns) | 1.685 μs (IQR 352.500 ns) | 13.275 μs (IQR 790.000 ns) | 14.570 μs (IQR 890.000 ns) | 150.029 μs (IQR 157.078 μs) | 118.489 μs (IQR 12.057 μs) | 1.100 ms (IQR 1.930 ms) | 1.195 ms (IQR 2.849 ms) | 
 
 ### QuadraticSpline
 
 | Library | n=100,nonuniform | n=100,uniform | n=1000,nonuniform | n=1000,uniform | n=10000,nonuniform | n=10000,uniform | n=100000,nonuniform | n=100000,uniform | 
 |---|---|---|---|---|---|---|---|---|
-| DataInterpolations | 16.825 μs (IQR 904.250 ns) | 16.880 μs (IQR 865.750 ns) | 744.113 μs (IQR 19.005 μs) | 766.238 μs (IQR 39.012 μs) | 65.719 ms (IQR 401.579 μs) | 66.057 ms (IQR 689.417 μs) | 6.978 s (IQR 0.000 ns) | 7.028 s (IQR 0.000 ns) | 
-| Dierckx (k=2) | 18.560 μs (IQR 1.295 μs) | 17.700 μs (IQR 3.228 μs) | 137.524 μs (IQR 1.077 μs) | 175.948 μs (IQR 8.215 μs) | 1.371 ms (IQR 61.880 μs) | 1.583 ms (IQR 193.173 μs) | 13.906 ms (IQR 997.231 μs) | 13.571 ms (IQR 1.787 ms) | 
+| DataInterpolations | 9.420 μs (IQR 661.750 ns) | 9.455 μs (IQR 750.000 ns) | 84.669 μs (IQR 997.750 ns) | 96.034 μs (IQR 61.307 μs) | 800.123 μs (IQR 10.530 μs) | 823.987 μs (IQR 668.939 μs) | 8.070 ms (IQR 3.777 ms) | 8.209 ms (IQR 5.391 ms) | 
+| Dierckx (k=2) | 15.485 μs (IQR 680.000 ns) | 21.090 μs (IQR 3.221 μs) | 136.554 μs (IQR 1.056 μs) | 143.228 μs (IQR 16.675 μs) | 1.353 ms (IQR 164.550 μs) | 1.356 ms (IQR 155.038 μs) | 13.384 ms (IQR 4.032 ms) | 14.377 ms (IQR 3.926 ms) | 
+| FastInterpolations | 1.430 μs (IQR 420.000 ns) | 715.000 ns (IQR 342.500 ns) | 10.325 μs (IQR 740.000 ns) | 5.210 μs (IQR 485.750 ns) | 70.434 μs (IQR 420.084 μs) | 38.454 μs (IQR 2.993 μs) | 702.374 μs (IQR 38.012 μs) | 372.171 μs (IQR 33.597 μs) | 
 
 ## Single-query latency
 
@@ -100,40 +88,45 @@ Cold single evaluation `A(x_query)`. Rows = library, columns = (n, knot pattern)
 
 | Library | n=100,nonuniform | n=100,uniform | n=1000,nonuniform | n=1000,uniform | n=10000,nonuniform | n=10000,uniform | n=100000,nonuniform | n=100000,uniform | 
 |---|---|---|---|---|---|---|---|---|
-| DataInterpolations | 70.000 ns (IQR 10.000 ns) | 70.000 ns (IQR 0.000 ns) | 70.000 ns (IQR 10.000 ns) | 70.000 ns (IQR 10.000 ns) | 90.000 ns (IQR 10.000 ns) | 75.000 ns (IQR 10.000 ns) | 100.000 ns (IQR 0.000 ns) | 70.000 ns (IQR 10.000 ns) | 
+| DataInterpolations | 70.000 ns (IQR 0.000 ns) | 70.000 ns (IQR 0.000 ns) | 70.000 ns (IQR 0.000 ns) | 80.000 ns (IQR 10.000 ns) | 90.000 ns (IQR 0.000 ns) | 90.000 ns (IQR 0.000 ns) | 100.000 ns (IQR 2.500 ns) | 100.000 ns (IQR 10.000 ns) | 
+| FastInterpolations | 50.000 ns (IQR 10.000 ns) | 50.000 ns (IQR 0.000 ns) | 50.000 ns (IQR 10.000 ns) | 50.000 ns (IQR 0.000 ns) | 60.000 ns (IQR 10.000 ns) | 50.000 ns (IQR 0.000 ns) | 60.000 ns (IQR 10.000 ns) | 50.000 ns (IQR 0.000 ns) | 
 
 ### CubicSpline
 
 | Library | n=100,nonuniform | n=100,uniform | n=1000,nonuniform | n=1000,uniform | n=10000,nonuniform | n=10000,uniform | n=100000,nonuniform | n=100000,uniform | 
 |---|---|---|---|---|---|---|---|---|
-| DataInterpolations | 80.000 ns (IQR 10.000 ns) | 80.000 ns (IQR 10.000 ns) | 70.000 ns (IQR 10.000 ns) | 80.000 ns (IQR 10.000 ns) | 100.000 ns (IQR 10.000 ns) | 80.000 ns (IQR 10.000 ns) | 110.000 ns (IQR 10.000 ns) | 80.000 ns (IQR 0.000 ns) | 
-| BasicInterpolators | 50.000 ns (IQR 0.000 ns) | 50.000 ns (IQR 0.000 ns) | 50.000 ns (IQR 10.000 ns) | 50.000 ns (IQR 10.000 ns) | 60.000 ns (IQR 0.000 ns) | 60.000 ns (IQR 0.000 ns) | 65.000 ns (IQR 10.000 ns) | 70.000 ns (IQR 0.000 ns) | 
-| Dierckx (k=3) | 160.000 ns (IQR 10.000 ns) | 160.000 ns (IQR 10.000 ns) | 390.000 ns (IQR 10.000 ns) | 400.000 ns (IQR 10.000 ns) | 2.780 μs (IQR 0.000 ns) | 2.790 μs (IQR 10.000 ns) | 26.750 μs (IQR 40.000 ns) | 26.650 μs (IQR 89.250 ns) | 
+| DataInterpolations | 80.000 ns (IQR 0.000 ns) | 80.000 ns (IQR 10.000 ns) | 100.000 ns (IQR 0.000 ns) | 90.000 ns (IQR 0.000 ns) | 90.000 ns (IQR 10.000 ns) | 100.000 ns (IQR 0.000 ns) | 110.000 ns (IQR 0.000 ns) | 110.000 ns (IQR 10.000 ns) | 
+| BasicInterpolators | 50.000 ns (IQR 10.000 ns) | 50.000 ns (IQR 10.000 ns) | 60.000 ns (IQR 2.500 ns) | 60.000 ns (IQR 0.000 ns) | 60.000 ns (IQR 0.000 ns) | 60.000 ns (IQR 0.000 ns) | 70.000 ns (IQR 10.000 ns) | 90.000 ns (IQR 10.000 ns) | 
+| Dierckx (k=3) | 150.000 ns (IQR 0.000 ns) | 150.000 ns (IQR 10.000 ns) | 380.000 ns (IQR 10.000 ns) | 400.000 ns (IQR 10.000 ns) | 2.789 μs (IQR 10.000 ns) | 2.790 μs (IQR 10.000 ns) | 26.760 μs (IQR 51.000 ns) | 26.680 μs (IQR 40.000 ns) | 
+| FastInterpolations | 50.000 ns (IQR 10.000 ns) | 50.000 ns (IQR 10.000 ns) | 50.000 ns (IQR 0.000 ns) | 60.000 ns (IQR 10.000 ns) | 60.000 ns (IQR 0.000 ns) | 50.000 ns (IQR 10.000 ns) | 60.000 ns (IQR 0.000 ns) | 50.000 ns (IQR 10.000 ns) | 
 | Interpolations (uniform) | — | 80.000 ns (IQR 10.000 ns) | — | 80.000 ns (IQR 10.000 ns) | — | 80.000 ns (IQR 0.000 ns) | — | 80.000 ns (IQR 10.000 ns) | 
 
 ### Linear
 
 | Library | n=100,nonuniform | n=100,uniform | n=1000,nonuniform | n=1000,uniform | n=10000,nonuniform | n=10000,uniform | n=100000,nonuniform | n=100000,uniform | 
 |---|---|---|---|---|---|---|---|---|
-| DataInterpolations | 70.000 ns (IQR 0.000 ns) | 80.000 ns (IQR 0.000 ns) | 70.000 ns (IQR 0.000 ns) | 80.000 ns (IQR 0.000 ns) | 90.000 ns (IQR 10.000 ns) | 80.000 ns (IQR 10.000 ns) | 100.000 ns (IQR 10.000 ns) | 80.000 ns (IQR 0.000 ns) | 
-| BasicInterpolators | 50.000 ns (IQR 10.000 ns) | 50.000 ns (IQR 0.000 ns) | 60.000 ns (IQR 10.000 ns) | 60.000 ns (IQR 0.000 ns) | 70.000 ns (IQR 10.000 ns) | 70.000 ns (IQR 10.000 ns) | 70.000 ns (IQR 0.000 ns) | 70.000 ns (IQR 0.000 ns) | 
-| Dierckx (k=1) | 120.000 ns (IQR 10.000 ns) | 120.000 ns (IQR 10.000 ns) | 350.000 ns (IQR 0.000 ns) | 370.000 ns (IQR 10.000 ns) | 2.760 μs (IQR 0.000 ns) | 2.770 μs (IQR 10.000 ns) | 26.729 μs (IQR 42.250 ns) | 26.630 μs (IQR 72.500 ns) | 
-| Interpolations (gridded) | 60.000 ns (IQR 0.000 ns) | 60.000 ns (IQR 10.000 ns) | 70.000 ns (IQR 10.000 ns) | 70.000 ns (IQR 0.000 ns) | 70.000 ns (IQR 10.000 ns) | 70.000 ns (IQR 0.000 ns) | 80.000 ns (IQR 0.000 ns) | 80.000 ns (IQR 10.000 ns) | 
+| DataInterpolations | 70.000 ns (IQR 10.000 ns) | 70.000 ns (IQR 10.000 ns) | 70.000 ns (IQR 0.000 ns) | 90.000 ns (IQR 0.000 ns) | 90.000 ns (IQR 10.000 ns) | 100.000 ns (IQR 10.000 ns) | 110.000 ns (IQR 0.000 ns) | 100.000 ns (IQR 10.000 ns) | 
+| BasicInterpolators | 60.000 ns (IQR 10.000 ns) | 50.000 ns (IQR 0.000 ns) | 60.000 ns (IQR 10.000 ns) | 60.000 ns (IQR 0.000 ns) | 70.000 ns (IQR 10.000 ns) | 70.000 ns (IQR 10.000 ns) | 70.000 ns (IQR 0.000 ns) | 70.000 ns (IQR 10.000 ns) | 
+| Dierckx (k=1) | 120.000 ns (IQR 10.000 ns) | 120.000 ns (IQR 10.000 ns) | 350.000 ns (IQR 0.000 ns) | 370.000 ns (IQR 10.000 ns) | 2.750 μs (IQR 10.000 ns) | 2.750 μs (IQR 10.000 ns) | 26.720 μs (IQR 40.250 ns) | 26.650 μs (IQR 42.500 ns) | 
+| FastInterpolations | 50.000 ns (IQR 0.000 ns) | 40.000 ns (IQR 10.000 ns) | 50.000 ns (IQR 0.000 ns) | 40.000 ns (IQR 10.000 ns) | 60.000 ns (IQR 10.000 ns) | 40.000 ns (IQR 10.000 ns) | 60.000 ns (IQR 0.000 ns) | 40.000 ns (IQR 10.000 ns) | 
+| Interpolations (gridded) | 60.000 ns (IQR 10.000 ns) | 60.000 ns (IQR 0.000 ns) | 70.000 ns (IQR 10.000 ns) | 70.000 ns (IQR 0.000 ns) | 90.000 ns (IQR 0.000 ns) | 70.000 ns (IQR 0.000 ns) | 100.000 ns (IQR 0.000 ns) | 80.000 ns (IQR 10.000 ns) | 
 | Interpolations (uniform) | — | 60.000 ns (IQR 0.000 ns) | — | 60.000 ns (IQR 0.000 ns) | — | 60.000 ns (IQR 0.000 ns) | — | 60.000 ns (IQR 0.000 ns) | 
 
 ### MonotoneCubic
 
 | Library | n=100,nonuniform | n=100,uniform | n=1000,nonuniform | n=1000,uniform | n=10000,nonuniform | n=10000,uniform | n=100000,nonuniform | n=100000,uniform | 
 |---|---|---|---|---|---|---|---|---|
-| DataInterpolations (CubicHermite) | 80.000 ns (IQR 0.000 ns) | 90.000 ns (IQR 10.000 ns) | 80.000 ns (IQR 0.000 ns) | 90.000 ns (IQR 0.000 ns) | 100.000 ns (IQR 0.000 ns) | 90.000 ns (IQR 10.000 ns) | 120.000 ns (IQR 0.000 ns) | 90.000 ns (IQR 0.000 ns) | 
-| PCHIPInterpolation | 70.000 ns (IQR 10.000 ns) | 70.000 ns (IQR 0.000 ns) | 80.000 ns (IQR 0.000 ns) | 80.000 ns (IQR 0.000 ns) | 90.000 ns (IQR 0.000 ns) | 90.000 ns (IQR 0.000 ns) | 100.000 ns (IQR 10.000 ns) | 100.000 ns (IQR 10.000 ns) | 
+| DataInterpolations (CubicHermite) | 90.000 ns (IQR 10.000 ns) | 90.000 ns (IQR 0.000 ns) | 90.000 ns (IQR 10.000 ns) | 100.000 ns (IQR 0.000 ns) | 100.000 ns (IQR 10.000 ns) | 100.000 ns (IQR 10.000 ns) | 110.000 ns (IQR 10.000 ns) | 110.000 ns (IQR 0.000 ns) | 
+| FastInterpolations (PCHIP) | 50.000 ns (IQR 10.000 ns) | 50.000 ns (IQR 0.000 ns) | 60.000 ns (IQR 10.000 ns) | 50.000 ns (IQR 10.000 ns) | 60.000 ns (IQR 10.000 ns) | 50.000 ns (IQR 0.000 ns) | 60.000 ns (IQR 10.000 ns) | 50.000 ns (IQR 0.000 ns) | 
+| PCHIPInterpolation | 60.000 ns (IQR 10.000 ns) | 70.000 ns (IQR 10.000 ns) | 80.000 ns (IQR 10.000 ns) | 80.000 ns (IQR 0.000 ns) | 90.000 ns (IQR 0.000 ns) | 90.000 ns (IQR 0.000 ns) | 110.000 ns (IQR 10.000 ns) | 100.000 ns (IQR 0.000 ns) | 
 
 ### QuadraticSpline
 
 | Library | n=100,nonuniform | n=100,uniform | n=1000,nonuniform | n=1000,uniform | n=10000,nonuniform | n=10000,uniform | n=100000,nonuniform | n=100000,uniform | 
 |---|---|---|---|---|---|---|---|---|
-| DataInterpolations | 180.000 ns (IQR 0.000 ns) | 190.000 ns (IQR 10.000 ns) | 660.000 ns (IQR 10.000 ns) | 710.000 ns (IQR 10.000 ns) | 5.810 μs (IQR 10.000 ns) | 5.820 μs (IQR 19.000 ns) | 62.569 μs (IQR 243.500 ns) | 62.474 μs (IQR 163.250 ns) | 
-| Dierckx (k=2) | 140.000 ns (IQR 0.000 ns) | 170.000 ns (IQR 32.500 ns) | 370.000 ns (IQR 0.000 ns) | 390.000 ns (IQR 0.000 ns) | 2.780 μs (IQR 10.000 ns) | 2.780 μs (IQR 10.000 ns) | 26.739 μs (IQR 73.250 ns) | 26.670 μs (IQR 59.000 ns) | 
+| DataInterpolations | 160.000 ns (IQR 10.000 ns) | 160.000 ns (IQR 10.000 ns) | 250.000 ns (IQR 0.000 ns) | 260.000 ns (IQR 0.000 ns) | 1.240 μs (IQR 10.000 ns) | 1.240 μs (IQR 10.000 ns) | 14.540 μs (IQR 100.000 ns) | 14.464 μs (IQR 59.000 ns) | 
+| Dierckx (k=2) | 130.000 ns (IQR 10.000 ns) | 140.000 ns (IQR 10.000 ns) | 370.000 ns (IQR 10.000 ns) | 390.000 ns (IQR 0.000 ns) | 2.780 μs (IQR 10.000 ns) | 2.780 μs (IQR 0.000 ns) | 26.719 μs (IQR 59.000 ns) | 26.630 μs (IQR 43.250 ns) | 
+| FastInterpolations | 50.000 ns (IQR 10.000 ns) | 40.000 ns (IQR 10.000 ns) | 50.000 ns (IQR 2.500 ns) | 40.000 ns (IQR 10.000 ns) | 60.000 ns (IQR 10.000 ns) | 40.000 ns (IQR 10.000 ns) | 60.000 ns (IQR 2.500 ns) | 40.000 ns (IQR 10.000 ns) | 
 
 ## Sorted batch
 
@@ -143,40 +136,45 @@ Cold single evaluation `A(x_query)`. Rows = library, columns = (n, knot pattern)
 
 | Library | n=100,m=1 | n=100,m=10 | n=100,m=1000 | n=100,m=100000 | n=1000,m=1 | n=1000,m=10 | n=1000,m=1000 | n=1000,m=100000 | n=10000,m=1 | n=10000,m=10 | n=10000,m=1000 | n=10000,m=100000 | n=100000,m=1 | n=100000,m=10 | n=100000,m=1000 | n=100000,m=100000 | 
 |---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
-| DataInterpolations | 110.000 ns (IQR 10.000 ns) | 170.000 ns (IQR 10.000 ns) | 4.900 μs (IQR 1.530 μs) | 323.432 μs (IQR 2.525 μs) | 120.000 ns (IQR 0.000 ns) | 340.000 ns (IQR 10.000 ns) | 5.195 μs (IQR 30.000 ns) | 341.772 μs (IQR 1.866 μs) | 120.000 ns (IQR 10.000 ns) | 430.000 ns (IQR 10.000 ns) | 12.070 μs (IQR 412.500 ns) | 479.050 μs (IQR 9.502 μs) | 140.000 ns (IQR 10.000 ns) | 510.000 ns (IQR 10.000 ns) | 140.203 μs (IQR 1.752 μs) | 1.436 ms (IQR 26.067 μs) | 
+| DataInterpolations | 120.000 ns (IQR 10.000 ns) | 170.000 ns (IQR 0.000 ns) | 4.010 μs (IQR 0.000 ns) | 364.582 μs (IQR 1.153 μs) | 120.000 ns (IQR 10.000 ns) | 360.000 ns (IQR 0.000 ns) | 5.350 μs (IQR 20.000 ns) | 387.027 μs (IQR 2.195 μs) | 130.000 ns (IQR 10.000 ns) | 430.000 ns (IQR 10.000 ns) | 13.874 μs (IQR 683.250 ns) | 521.981 μs (IQR 3.110 μs) | 140.000 ns (IQR 10.000 ns) | 540.000 ns (IQR 10.000 ns) | 141.629 μs (IQR 2.840 μs) | 1.442 ms (IQR 10.085 μs) | 
+| FastInterpolations | 60.000 ns (IQR 10.000 ns) | 170.000 ns (IQR 10.000 ns) | 11.190 μs (IQR 41.000 ns) | 1.074 ms (IQR 22.070 μs) | 60.000 ns (IQR 10.000 ns) | 170.000 ns (IQR 10.000 ns) | 11.170 μs (IQR 11.000 ns) | 1.070 ms (IQR 11.035 μs) | 60.000 ns (IQR 10.000 ns) | 170.000 ns (IQR 10.000 ns) | 11.190 μs (IQR 50.000 ns) | 1.072 ms (IQR 7.127 μs) | 60.000 ns (IQR 10.000 ns) | 170.000 ns (IQR 10.000 ns) | 11.884 μs (IQR 411.500 ns) | 1.075 ms (IQR 6.483 μs) | 
 
 ### CubicSpline
 
 | Library | n=100,m=1 | n=100,m=10 | n=100,m=1000 | n=100,m=100000 | n=1000,m=1 | n=1000,m=10 | n=1000,m=1000 | n=1000,m=100000 | n=10000,m=1 | n=10000,m=10 | n=10000,m=1000 | n=10000,m=100000 | n=100000,m=1 | n=100000,m=10 | n=100000,m=1000 | n=100000,m=100000 | 
 |---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
-| DataInterpolations | 130.000 ns (IQR 10.000 ns) | 200.000 ns (IQR 10.000 ns) | 10.030 μs (IQR 20.000 ns) | 975.096 μs (IQR 13.203 μs) | 130.000 ns (IQR 0.000 ns) | 420.000 ns (IQR 10.000 ns) | 9.920 μs (IQR 20.000 ns) | 973.951 μs (IQR 22.567 μs) | 140.000 ns (IQR 10.000 ns) | 490.000 ns (IQR 10.000 ns) | 15.420 μs (IQR 50.000 ns) | 1.019 ms (IQR 9.423 μs) | 140.000 ns (IQR 10.000 ns) | 580.000 ns (IQR 10.000 ns) | 151.668 μs (IQR 4.980 μs) | 1.779 ms (IQR 21.049 μs) | 
-| BasicInterpolators | 70.000 ns (IQR 10.000 ns) | 180.000 ns (IQR 10.000 ns) | 16.315 μs (IQR 302.500 ns) | 1.369 ms (IQR 19.600 μs) | 70.000 ns (IQR 0.000 ns) | 240.000 ns (IQR 0.000 ns) | 42.385 μs (IQR 948.500 ns) | 2.034 ms (IQR 21.232 μs) | 70.000 ns (IQR 10.000 ns) | 300.000 ns (IQR 10.000 ns) | 79.069 μs (IQR 1.113 μs) | 4.233 ms (IQR 66.511 μs) | 80.000 ns (IQR 0.000 ns) | 370.000 ns (IQR 10.000 ns) | 130.333 μs (IQR 2.495 μs) | 7.938 ms (IQR 43.734 μs) | 
-| Dierckx (k=3) | 190.000 ns (IQR 0.000 ns) | 1.220 μs (IQR 0.000 ns) | 121.929 μs (IQR 30.250 ns) | 11.761 ms (IQR 53.174 μs) | 710.000 ns (IQR 10.000 ns) | 3.620 μs (IQR 0.250 ns) | 408.796 μs (IQR 188.500 ns) | 41.214 ms (IQR 255.653 μs) | 5.710 μs (IQR 10.000 ns) | 26.890 μs (IQR 20.000 ns) | 3.210 ms (IQR 28.301 μs) | 323.867 ms (IQR 20.851 μs) | 55.660 μs (IQR 70.000 ns) | 260.212 μs (IQR 242.250 ns) | 31.300 ms (IQR 245.060 μs) | 3.157 s (IQR 0.000 ns) | 
-| Interpolations (uniform) | 90.000 ns (IQR 10.000 ns) | 270.000 ns (IQR 0.000 ns) | 20.469 μs (IQR 10.000 ns) | 2.050 ms (IQR 13.412 μs) | 90.000 ns (IQR 10.000 ns) | 270.000 ns (IQR 0.000 ns) | 20.460 μs (IQR 1.000 ns) | 2.050 ms (IQR 13.490 μs) | 90.000 ns (IQR 10.000 ns) | 270.000 ns (IQR 0.000 ns) | 20.460 μs (IQR 30.000 ns) | 2.050 ms (IQR 11.105 μs) | 90.000 ns (IQR 10.000 ns) | 270.000 ns (IQR 0.000 ns) | 20.450 μs (IQR 20.000 ns) | 2.057 ms (IQR 21.207 μs) | 
+| DataInterpolations | 130.000 ns (IQR 10.000 ns) | 210.000 ns (IQR 0.000 ns) | 10.380 μs (IQR 10.000 ns) | 1.002 ms (IQR 6.160 μs) | 130.000 ns (IQR 10.000 ns) | 410.000 ns (IQR 10.000 ns) | 10.220 μs (IQR 10.000 ns) | 1.007 ms (IQR 5.220 μs) | 140.000 ns (IQR 10.000 ns) | 495.000 ns (IQR 10.000 ns) | 15.790 μs (IQR 144.750 ns) | 1.050 ms (IQR 5.147 μs) | 150.000 ns (IQR 10.000 ns) | 570.000 ns (IQR 10.000 ns) | 153.254 μs (IQR 2.850 μs) | 1.787 ms (IQR 11.688 μs) | 
+| BasicInterpolators | 60.000 ns (IQR 0.000 ns) | 200.000 ns (IQR 10.000 ns) | 16.920 μs (IQR 371.000 ns) | 1.402 ms (IQR 29.020 μs) | 70.000 ns (IQR 0.000 ns) | 250.000 ns (IQR 10.000 ns) | 43.025 μs (IQR 2.495 μs) | 2.069 ms (IQR 40.005 μs) | 70.000 ns (IQR 10.000 ns) | 310.000 ns (IQR 0.000 ns) | 79.704 μs (IQR 4.163 μs) | 4.140 ms (IQR 15.742 μs) | 80.000 ns (IQR 0.000 ns) | 370.000 ns (IQR 0.000 ns) | 126.109 μs (IQR 1.827 μs) | 7.865 ms (IQR 77.216 μs) | 
+| Dierckx (k=3) | 190.000 ns (IQR 10.000 ns) | 1.220 μs (IQR 0.000 ns) | 121.679 μs (IQR 62.500 ns) | 11.733 ms (IQR 34.135 μs) | 700.000 ns (IQR 0.000 ns) | 3.620 μs (IQR 0.000 ns) | 408.256 μs (IQR 72.500 ns) | 40.985 ms (IQR 72.560 μs) | 5.690 μs (IQR 30.000 ns) | 26.920 μs (IQR 39.250 ns) | 3.202 ms (IQR 4.645 μs) | 322.833 ms (IQR 90.359 μs) | 55.620 μs (IQR 110.000 ns) | 260.202 μs (IQR 173.500 ns) | 31.267 ms (IQR 222.842 μs) | 3.164 s (IQR 0.000 ns) | 
+| FastInterpolations | 60.000 ns (IQR 2.500 ns) | 150.000 ns (IQR 0.000 ns) | 8.860 μs (IQR 0.000 ns) | 843.207 μs (IQR 12.260 μs) | 60.000 ns (IQR 0.000 ns) | 140.000 ns (IQR 10.000 ns) | 8.980 μs (IQR 1.000 ns) | 846.997 μs (IQR 6.682 μs) | 60.000 ns (IQR 2.500 ns) | 150.000 ns (IQR 0.000 ns) | 8.950 μs (IQR 42.500 ns) | 846.477 μs (IQR 4.218 μs) | 70.000 ns (IQR 20.000 ns) | 150.000 ns (IQR 10.000 ns) | 9.525 μs (IQR 69.250 ns) | 849.188 μs (IQR 10.038 μs) | 
+| Interpolations (uniform) | 90.000 ns (IQR 2.500 ns) | 270.000 ns (IQR 0.000 ns) | 20.460 μs (IQR 10.000 ns) | 2.046 ms (IQR 8.038 μs) | 90.000 ns (IQR 10.000 ns) | 270.000 ns (IQR 0.000 ns) | 20.460 μs (IQR 1.000 ns) | 2.047 ms (IQR 9.498 μs) | 90.000 ns (IQR 10.000 ns) | 270.000 ns (IQR 0.000 ns) | 20.440 μs (IQR 19.000 ns) | 2.047 ms (IQR 7.382 μs) | 90.000 ns (IQR 0.000 ns) | 270.000 ns (IQR 0.000 ns) | 20.440 μs (IQR 31.000 ns) | 2.049 ms (IQR 10.880 μs) | 
 
 ### Linear
 
 | Library | n=100,m=1 | n=100,m=10 | n=100,m=1000 | n=100,m=100000 | n=1000,m=1 | n=1000,m=10 | n=1000,m=1000 | n=1000,m=100000 | n=10000,m=1 | n=10000,m=10 | n=10000,m=1000 | n=10000,m=100000 | n=100000,m=1 | n=100000,m=10 | n=100000,m=1000 | n=100000,m=100000 | 
 |---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
-| DataInterpolations | 120.000 ns (IQR 10.000 ns) | 180.000 ns (IQR 0.000 ns) | 5.830 μs (IQR 10.000 ns) | 469.835 μs (IQR 4.003 μs) | 120.000 ns (IQR 10.000 ns) | 380.000 ns (IQR 10.000 ns) | 6.210 μs (IQR 50.000 ns) | 485.851 μs (IQR 1.160 μs) | 120.000 ns (IQR 10.000 ns) | 450.000 ns (IQR 10.000 ns) | 15.390 μs (IQR 1.252 μs) | 629.649 μs (IQR 950.000 ns) | 130.000 ns (IQR 0.000 ns) | 540.000 ns (IQR 10.000 ns) | 141.224 μs (IQR 3.203 μs) | 1.644 ms (IQR 9.440 μs) | 
-| BasicInterpolators | 60.000 ns (IQR 0.000 ns) | 200.000 ns (IQR 0.000 ns) | 16.205 μs (IQR 350.250 ns) | 1.378 ms (IQR 13.425 μs) | 70.000 ns (IQR 10.000 ns) | 240.000 ns (IQR 0.000 ns) | 41.170 μs (IQR 2.439 μs) | 2.053 ms (IQR 9.387 μs) | 70.000 ns (IQR 10.000 ns) | 310.000 ns (IQR 0.000 ns) | 76.659 μs (IQR 3.703 μs) | 4.179 ms (IQR 15.650 μs) | 80.000 ns (IQR 0.000 ns) | 380.000 ns (IQR 10.000 ns) | 123.879 μs (IQR 2.312 μs) | 7.892 ms (IQR 63.663 μs) | 
-| Dierckx (k=1) | 150.000 ns (IQR 10.000 ns) | 850.000 ns (IQR 10.000 ns) | 87.719 μs (IQR 1.460 μs) | 8.265 ms (IQR 132.779 μs) | 670.000 ns (IQR 10.000 ns) | 3.280 μs (IQR 820.000 ns) | 373.336 μs (IQR 5.365 μs) | 37.651 ms (IQR 73.838 μs) | 5.660 μs (IQR 30.000 ns) | 26.730 μs (IQR 50.000 ns) | 3.168 ms (IQR 24.134 μs) | 319.511 ms (IQR 16.000 μs) | 55.640 μs (IQR 113.250 ns) | 261.808 μs (IQR 933.000 ns) | 31.246 ms (IQR 377.619 μs) | 3.186 s (IQR 0.000 ns) | 
-| Interpolations (gridded) | 70.000 ns (IQR 0.000 ns) | 230.000 ns (IQR 0.000 ns) | 18.250 μs (IQR 50.250 ns) | 1.635 ms (IQR 23.676 μs) | 70.000 ns (IQR 10.000 ns) | 300.000 ns (IQR 0.000 ns) | 48.190 μs (IQR 3.190 μs) | 2.548 ms (IQR 41.645 μs) | 80.000 ns (IQR 0.000 ns) | 360.000 ns (IQR 10.000 ns) | 90.964 μs (IQR 3.175 μs) | 4.704 ms (IQR 63.885 μs) | 84.500 ns (IQR 10.000 ns) | 430.000 ns (IQR 0.000 ns) | 141.284 μs (IQR 2.475 μs) | 7.996 ms (IQR 40.135 μs) | 
-| Interpolations (uniform) | 60.000 ns (IQR 10.000 ns) | 120.000 ns (IQR 0.000 ns) | 6.610 μs (IQR 0.000 ns) | 655.124 μs (IQR 583.250 ns) | 70.000 ns (IQR 10.000 ns) | 120.000 ns (IQR 0.000 ns) | 6.600 μs (IQR 20.000 ns) | 655.409 μs (IQR 12.107 μs) | 70.000 ns (IQR 10.000 ns) | 120.000 ns (IQR 0.000 ns) | 6.670 μs (IQR 30.000 ns) | 655.644 μs (IQR 702.500 ns) | 70.000 ns (IQR 10.000 ns) | 120.000 ns (IQR 0.000 ns) | 7.060 μs (IQR 50.000 ns) | 658.249 μs (IQR 1.255 μs) | 
+| DataInterpolations | 120.000 ns (IQR 10.000 ns) | 180.000 ns (IQR 10.000 ns) | 6.490 μs (IQR 10.000 ns) | 530.655 μs (IQR 2.315 μs) | 130.000 ns (IQR 0.000 ns) | 380.000 ns (IQR 0.000 ns) | 7.010 μs (IQR 10.000 ns) | 541.605 μs (IQR 889.250 ns) | 140.000 ns (IQR 0.000 ns) | 470.000 ns (IQR 10.000 ns) | 15.860 μs (IQR 50.250 ns) | 685.063 μs (IQR 7.840 μs) | 150.000 ns (IQR 10.000 ns) | 550.000 ns (IQR 0.000 ns) | 143.244 μs (IQR 4.605 μs) | 1.653 ms (IQR 13.035 μs) | 
+| BasicInterpolators | 60.000 ns (IQR 10.000 ns) | 190.000 ns (IQR 0.000 ns) | 16.470 μs (IQR 322.500 ns) | 1.399 ms (IQR 16.903 μs) | 70.000 ns (IQR 0.000 ns) | 240.000 ns (IQR 0.000 ns) | 42.279 μs (IQR 3.697 μs) | 2.052 ms (IQR 12.033 μs) | 70.000 ns (IQR 0.000 ns) | 310.000 ns (IQR 10.000 ns) | 75.574 μs (IQR 5.532 μs) | 4.203 ms (IQR 42.208 μs) | 80.000 ns (IQR 0.000 ns) | 380.000 ns (IQR 10.000 ns) | 123.084 μs (IQR 1.998 μs) | 7.835 ms (IQR 64.520 μs) | 
+| Dierckx (k=1) | 150.000 ns (IQR 0.000 ns) | 840.000 ns (IQR 10.000 ns) | 86.449 μs (IQR 320.000 ns) | 8.338 ms (IQR 205.934 μs) | 670.000 ns (IQR 0.000 ns) | 3.270 μs (IQR 40.000 ns) | 373.326 μs (IQR 591.750 ns) | 37.456 ms (IQR 86.332 μs) | 5.660 μs (IQR 20.000 ns) | 26.600 μs (IQR 30.000 ns) | 3.172 ms (IQR 37.733 μs) | 319.279 ms (IQR 135.094 μs) | 55.620 μs (IQR 93.250 ns) | 263.383 μs (IQR 1.763 μs) | 31.217 ms (IQR 137.637 μs) | 3.147 s (IQR 0.000 ns) | 
+| FastInterpolations | 50.000 ns (IQR 0.000 ns) | 90.000 ns (IQR 0.000 ns) | 4.220 μs (IQR 90.000 ns) | 370.687 μs (IQR 3.397 μs) | 50.000 ns (IQR 0.000 ns) | 90.000 ns (IQR 0.000 ns) | 4.145 μs (IQR 30.000 ns) | 372.367 μs (IQR 3.388 μs) | 50.000 ns (IQR 0.000 ns) | 90.000 ns (IQR 0.000 ns) | 4.200 μs (IQR 82.500 ns) | 373.437 μs (IQR 4.133 μs) | 50.000 ns (IQR 0.000 ns) | 90.000 ns (IQR 0.000 ns) | 4.370 μs (IQR 72.500 ns) | 374.116 μs (IQR 4.323 μs) | 
+| Interpolations (gridded) | 70.000 ns (IQR 0.000 ns) | 230.000 ns (IQR 0.000 ns) | 18.080 μs (IQR 50.000 ns) | 1.644 ms (IQR 26.273 μs) | 80.000 ns (IQR 10.000 ns) | 300.000 ns (IQR 0.000 ns) | 52.349 μs (IQR 3.364 μs) | 2.509 ms (IQR 35.296 μs) | 80.000 ns (IQR 10.000 ns) | 350.000 ns (IQR 10.000 ns) | 93.839 μs (IQR 3.115 μs) | 4.435 ms (IQR 47.497 μs) | 110.000 ns (IQR 10.000 ns) | 430.000 ns (IQR 10.000 ns) | 139.209 μs (IQR 4.602 μs) | 7.831 ms (IQR 71.805 μs) | 
+| Interpolations (uniform) | 70.000 ns (IQR 10.000 ns) | 120.000 ns (IQR 10.000 ns) | 6.610 μs (IQR 20.000 ns) | 655.379 μs (IQR 612.250 ns) | 70.000 ns (IQR 0.000 ns) | 120.000 ns (IQR 0.000 ns) | 6.610 μs (IQR 20.000 ns) | 655.654 μs (IQR 1.357 μs) | 70.000 ns (IQR 0.000 ns) | 120.000 ns (IQR 10.000 ns) | 6.665 μs (IQR 20.000 ns) | 655.439 μs (IQR 542.500 ns) | 70.000 ns (IQR 0.000 ns) | 120.000 ns (IQR 10.000 ns) | 7.050 μs (IQR 30.250 ns) | 655.829 μs (IQR 6.360 μs) | 
 
 ### MonotoneCubic
 
 | Library | n=100,m=1 | n=100,m=10 | n=100,m=1000 | n=100,m=100000 | n=1000,m=1 | n=1000,m=10 | n=1000,m=1000 | n=1000,m=100000 | n=10000,m=1 | n=10000,m=10 | n=10000,m=1000 | n=10000,m=100000 | n=100000,m=1 | n=100000,m=10 | n=100000,m=1000 | n=100000,m=100000 | 
 |---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
-| DataInterpolations (CubicHermite) | 130.000 ns (IQR 30.000 ns) | 340.000 ns (IQR 10.000 ns) | 10.490 μs (IQR 20.250 ns) | 988.671 μs (IQR 9.099 μs) | 140.000 ns (IQR 10.000 ns) | 420.000 ns (IQR 10.000 ns) | 10.649 μs (IQR 30.000 ns) | 989.491 μs (IQR 14.422 μs) | 140.000 ns (IQR 0.000 ns) | 500.000 ns (IQR 10.000 ns) | 19.150 μs (IQR 80.000 ns) | 1.067 ms (IQR 11.665 μs) | 150.000 ns (IQR 0.000 ns) | 580.000 ns (IQR 10.000 ns) | 146.929 μs (IQR 2.422 μs) | 1.825 ms (IQR 19.328 μs) | 
-| PCHIPInterpolation | 70.000 ns (IQR 10.000 ns) | 240.000 ns (IQR 0.000 ns) | 20.389 μs (IQR 437.500 ns) | 1.867 ms (IQR 24.703 μs) | 90.000 ns (IQR 0.000 ns) | 330.000 ns (IQR 0.000 ns) | 39.885 μs (IQR 881.750 ns) | 2.972 ms (IQR 17.169 μs) | 100.000 ns (IQR 0.000 ns) | 440.000 ns (IQR 10.000 ns) | 79.079 μs (IQR 4.630 μs) | 5.475 ms (IQR 51.462 μs) | 110.000 ns (IQR 0.000 ns) | 510.000 ns (IQR 10.000 ns) | 133.694 μs (IQR 4.237 μs) | 9.703 ms (IQR 97.707 μs) | 
+| DataInterpolations (CubicHermite) | 130.000 ns (IQR 0.000 ns) | 230.000 ns (IQR 10.000 ns) | 10.500 μs (IQR 10.000 ns) | 983.576 μs (IQR 12.512 μs) | 130.000 ns (IQR 10.000 ns) | 430.000 ns (IQR 0.000 ns) | 10.660 μs (IQR 20.000 ns) | 992.811 μs (IQR 10.555 μs) | 140.000 ns (IQR 10.000 ns) | 510.000 ns (IQR 0.000 ns) | 18.420 μs (IQR 41.000 ns) | 1.075 ms (IQR 11.249 μs) | 150.000 ns (IQR 10.000 ns) | 600.000 ns (IQR 20.000 ns) | 147.614 μs (IQR 2.352 μs) | 1.812 ms (IQR 21.045 μs) | 
+| FastInterpolations (PCHIP) | 60.000 ns (IQR 0.000 ns) | 160.000 ns (IQR 10.000 ns) | 11.139 μs (IQR 10.000 ns) | 1.072 ms (IQR 3.803 μs) | 60.000 ns (IQR 0.000 ns) | 160.000 ns (IQR 10.000 ns) | 11.190 μs (IQR 30.000 ns) | 1.072 ms (IQR 11.660 μs) | 60.000 ns (IQR 0.000 ns) | 170.000 ns (IQR 10.000 ns) | 11.160 μs (IQR 72.250 ns) | 1.081 ms (IQR 23.755 μs) | 60.000 ns (IQR 0.000 ns) | 160.000 ns (IQR 10.000 ns) | 11.830 μs (IQR 112.750 ns) | 1.073 ms (IQR 7.117 μs) | 
+| PCHIPInterpolation | 70.000 ns (IQR 0.000 ns) | 240.000 ns (IQR 0.000 ns) | 20.294 μs (IQR 322.250 ns) | 1.864 ms (IQR 11.880 μs) | 90.000 ns (IQR 0.000 ns) | 320.000 ns (IQR 10.000 ns) | 40.360 μs (IQR 1.312 μs) | 2.973 ms (IQR 40.100 μs) | 100.000 ns (IQR 0.000 ns) | 450.000 ns (IQR 2.500 ns) | 79.409 μs (IQR 2.623 μs) | 5.436 ms (IQR 51.495 μs) | 120.000 ns (IQR 10.000 ns) | 510.000 ns (IQR 10.000 ns) | 134.408 μs (IQR 3.429 μs) | 9.598 ms (IQR 69.869 μs) | 
 
 ### QuadraticSpline
 
 | Library | n=100,m=1 | n=100,m=10 | n=100,m=1000 | n=100,m=100000 | n=1000,m=1 | n=1000,m=10 | n=1000,m=1000 | n=1000,m=100000 | n=10000,m=1 | n=10000,m=10 | n=10000,m=1000 | n=10000,m=100000 | n=100000,m=1 | n=100000,m=10 | n=100000,m=1000 | n=100000,m=100000 | 
 |---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
-| DataInterpolations | 290.000 ns (IQR 10.000 ns) | 1.370 μs (IQR 0.000 ns) | 137.279 μs (IQR 811.750 ns) | 13.395 ms (IQR 177.476 μs) | 1.260 μs (IQR 0.000 ns) | 6.600 μs (IQR 12.250 ns) | 722.878 μs (IQR 1.238 μs) | 72.672 ms (IQR 365.231 μs) | 10.915 μs (IQR 30.000 ns) | 56.859 μs (IQR 70.000 ns) | 6.588 ms (IQR 72.728 μs) | 660.689 ms (IQR 0.000 ns) | 112.729 μs (IQR 162.500 ns) | 607.684 μs (IQR 7.387 μs) | 70.380 ms (IQR 419.419 μs) | 7.038 s (IQR 0.000 ns) | 
-| Dierckx (k=2) | 170.000 ns (IQR 0.000 ns) | 1.030 μs (IQR 10.000 ns) | 103.394 μs (IQR 260.000 ns) | 9.983 ms (IQR 106.786 μs) | 680.000 ns (IQR 10.000 ns) | 3.450 μs (IQR 10.000 ns) | 390.976 μs (IQR 1.002 μs) | 39.394 ms (IQR 210.678 μs) | 5.690 μs (IQR 13.250 ns) | 26.760 μs (IQR 20.000 ns) | 3.190 ms (IQR 47.677 μs) | 322.009 ms (IQR 65.414 μs) | 55.739 μs (IQR 115.000 ns) | 260.118 μs (IQR 761.500 ns) | 31.568 ms (IQR 621.605 μs) | 3.207 s (IQR 0.000 ns) | 
+| DataInterpolations | 210.000 ns (IQR 0.000 ns) | 1.010 μs (IQR 0.000 ns) | 110.119 μs (IQR 162.500 ns) | 9.480 ms (IQR 53.279 μs) | 310.000 ns (IQR 0.000 ns) | 2.420 μs (IQR 10.000 ns) | 222.133 μs (IQR 455.000 ns) | 18.933 ms (IQR 74.185 μs) | 1.300 μs (IQR 10.000 ns) | 12.569 μs (IQR 59.250 ns) | 1.227 ms (IQR 5.570 μs) | 117.928 ms (IQR 382.237 μs) | 14.610 μs (IQR 70.000 ns) | 144.098 μs (IQR 315.250 ns) | 14.771 ms (IQR 263.223 μs) | 1.477 s (IQR 0.000 ns) | 
+| Dierckx (k=2) | 170.000 ns (IQR 2.500 ns) | 1.040 μs (IQR 10.000 ns) | 103.589 μs (IQR 329.250 ns) | 9.887 ms (IQR 85.805 μs) | 690.000 ns (IQR 0.000 ns) | 3.440 μs (IQR 10.000 ns) | 391.187 μs (IQR 620.250 ns) | 39.289 ms (IQR 132.329 μs) | 5.669 μs (IQR 20.000 ns) | 26.799 μs (IQR 21.000 ns) | 3.180 ms (IQR 3.583 μs) | 320.143 ms (IQR 155.369 μs) | 55.730 μs (IQR 89.000 ns) | 260.017 μs (IQR 267.500 ns) | 31.216 ms (IQR 132.239 μs) | 3.154 s (IQR 0.000 ns) | 
+| FastInterpolations | 50.000 ns (IQR 10.000 ns) | 110.000 ns (IQR 10.000 ns) | 3.910 μs (IQR 20.000 ns) | 349.737 μs (IQR 3.685 μs) | 50.000 ns (IQR 10.000 ns) | 110.000 ns (IQR 10.000 ns) | 3.990 μs (IQR 60.000 ns) | 350.812 μs (IQR 3.107 μs) | 50.000 ns (IQR 10.000 ns) | 110.000 ns (IQR 10.000 ns) | 4.320 μs (IQR 62.500 ns) | 351.341 μs (IQR 3.715 μs) | 50.000 ns (IQR 10.000 ns) | 110.000 ns (IQR 10.000 ns) | 5.560 μs (IQR 80.000 ns) | 359.077 μs (IQR 9.547 μs) | 
 
 ## Random batch
 
@@ -186,40 +184,45 @@ Cold single evaluation `A(x_query)`. Rows = library, columns = (n, knot pattern)
 
 | Library | n=100,m=1 | n=100,m=10 | n=100,m=1000 | n=100,m=100000 | n=1000,m=1 | n=1000,m=10 | n=1000,m=1000 | n=1000,m=100000 | n=10000,m=1 | n=10000,m=10 | n=10000,m=1000 | n=10000,m=100000 | n=100000,m=1 | n=100000,m=10 | n=100000,m=1000 | n=100000,m=100000 | 
 |---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
-| DataInterpolations | 120.000 ns (IQR 10.000 ns) | 450.000 ns (IQR 0.000 ns) | 47.359 μs (IQR 171.500 ns) | 4.831 ms (IQR 31.837 μs) | 120.000 ns (IQR 0.000 ns) | 450.000 ns (IQR 0.000 ns) | 48.005 μs (IQR 194.750 ns) | 4.898 ms (IQR 32.682 μs) | 130.000 ns (IQR 10.000 ns) | 430.000 ns (IQR 10.000 ns) | 52.684 μs (IQR 263.500 ns) | 5.357 ms (IQR 57.461 μs) | 140.000 ns (IQR 10.000 ns) | 440.000 ns (IQR 10.000 ns) | 59.049 μs (IQR 342.500 ns) | 6.366 ms (IQR 52.595 μs) | 
+| DataInterpolations | 120.000 ns (IQR 10.000 ns) | 440.000 ns (IQR 10.000 ns) | 85.734 μs (IQR 283.250 ns) | 8.733 ms (IQR 42.521 μs) | 120.000 ns (IQR 0.000 ns) | 760.000 ns (IQR 60.000 ns) | 113.999 μs (IQR 2.893 μs) | 11.877 ms (IQR 130.729 μs) | 130.000 ns (IQR 0.000 ns) | 620.000 ns (IQR 10.000 ns) | 144.079 μs (IQR 3.071 μs) | 15.912 ms (IQR 39.300 μs) | 130.000 ns (IQR 10.000 ns) | 750.000 ns (IQR 10.000 ns) | 209.804 μs (IQR 3.175 μs) | 22.256 ms (IQR 44.275 μs) | 
+| FastInterpolations | 60.000 ns (IQR 10.000 ns) | 170.000 ns (IQR 10.000 ns) | 11.150 μs (IQR 0.000 ns) | 1.071 ms (IQR 7.907 μs) | 60.000 ns (IQR 0.000 ns) | 190.000 ns (IQR 0.000 ns) | 11.180 μs (IQR 30.000 ns) | 1.071 ms (IQR 5.312 μs) | 60.000 ns (IQR 10.000 ns) | 180.000 ns (IQR 10.000 ns) | 11.180 μs (IQR 40.000 ns) | 1.070 ms (IQR 5.062 μs) | 60.000 ns (IQR 0.000 ns) | 180.000 ns (IQR 10.000 ns) | 11.215 μs (IQR 60.250 ns) | 1.115 ms (IQR 5.000 μs) | 
 
 ### CubicSpline
 
 | Library | n=100,m=1 | n=100,m=10 | n=100,m=1000 | n=100,m=100000 | n=1000,m=1 | n=1000,m=10 | n=1000,m=1000 | n=1000,m=100000 | n=10000,m=1 | n=10000,m=10 | n=10000,m=1000 | n=10000,m=100000 | n=100000,m=1 | n=100000,m=10 | n=100000,m=1000 | n=100000,m=100000 | 
 |---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
-| DataInterpolations | 130.000 ns (IQR 10.000 ns) | 490.000 ns (IQR 10.000 ns) | 51.094 μs (IQR 95.500 ns) | 5.201 ms (IQR 58.934 μs) | 130.000 ns (IQR 0.000 ns) | 490.000 ns (IQR 0.000 ns) | 52.210 μs (IQR 255.000 ns) | 5.480 ms (IQR 26.636 μs) | 140.000 ns (IQR 0.000 ns) | 480.000 ns (IQR 0.000 ns) | 55.980 μs (IQR 354.750 ns) | 5.666 ms (IQR 48.039 μs) | 150.000 ns (IQR 10.000 ns) | 500.000 ns (IQR 10.000 ns) | 63.150 μs (IQR 3.263 μs) | 6.874 ms (IQR 47.719 μs) | 
-| BasicInterpolators | 70.000 ns (IQR 10.000 ns) | 190.000 ns (IQR 0.000 ns) | 28.160 μs (IQR 695.000 ns) | 6.444 ms (IQR 72.182 μs) | 70.000 ns (IQR 0.000 ns) | 240.000 ns (IQR 10.000 ns) | 69.590 μs (IQR 4.885 μs) | 10.042 ms (IQR 149.286 μs) | 70.000 ns (IQR 10.000 ns) | 300.000 ns (IQR 0.000 ns) | 110.244 μs (IQR 3.438 μs) | 13.575 ms (IQR 158.219 μs) | 80.000 ns (IQR 0.000 ns) | 360.000 ns (IQR 0.000 ns) | 172.224 μs (IQR 7.392 μs) | 19.794 ms (IQR 117.482 μs) | 
-| Dierckx (k=3) | 150.000 ns (IQR 10.000 ns) | 1.260 μs (IQR 20.000 ns) | 134.564 μs (IQR 305.000 ns) | 13.506 ms (IQR 43.390 μs) | 280.000 ns (IQR 10.000 ns) | 3.950 μs (IQR 10.000 ns) | 412.066 μs (IQR 282.500 ns) | 41.346 ms (IQR 455.686 μs) | 1.490 μs (IQR 0.000 ns) | 30.060 μs (IQR 30.000 ns) | 3.247 ms (IQR 47.519 μs) | 323.084 ms (IQR 648.144 μs) | 13.470 μs (IQR 80.000 ns) | 291.452 μs (IQR 1.265 μs) | 31.720 ms (IQR 238.153 μs) | 3.151 s (IQR 0.000 ns) | 
-| Interpolations (uniform) | 90.000 ns (IQR 10.000 ns) | 270.000 ns (IQR 10.000 ns) | 20.459 μs (IQR 10.000 ns) | 2.048 ms (IQR 8.437 μs) | 80.000 ns (IQR 10.000 ns) | 260.000 ns (IQR 10.000 ns) | 20.440 μs (IQR 52.500 ns) | 2.047 ms (IQR 13.848 μs) | 90.000 ns (IQR 10.000 ns) | 270.000 ns (IQR 0.000 ns) | 20.430 μs (IQR 20.000 ns) | 2.049 ms (IQR 31.699 μs) | 90.000 ns (IQR 10.000 ns) | 270.000 ns (IQR 0.000 ns) | 20.420 μs (IQR 20.000 ns) | 2.061 ms (IQR 28.078 μs) | 
+| DataInterpolations | 130.000 ns (IQR 0.000 ns) | 510.000 ns (IQR 10.000 ns) | 88.379 μs (IQR 315.750 ns) | 8.819 ms (IQR 37.679 μs) | 130.000 ns (IQR 10.000 ns) | 790.000 ns (IQR 10.000 ns) | 116.909 μs (IQR 462.500 ns) | 11.897 ms (IQR 63.819 μs) | 140.000 ns (IQR 0.000 ns) | 740.000 ns (IQR 10.000 ns) | 145.738 μs (IQR 2.996 μs) | 16.274 ms (IQR 145.029 μs) | 150.000 ns (IQR 0.000 ns) | 740.000 ns (IQR 10.000 ns) | 221.258 μs (IQR 1.857 μs) | 24.186 ms (IQR 232.969 μs) | 
+| BasicInterpolators | 60.000 ns (IQR 0.000 ns) | 200.000 ns (IQR 10.000 ns) | 26.510 μs (IQR 1.024 μs) | 6.469 ms (IQR 35.997 μs) | 70.000 ns (IQR 0.000 ns) | 240.000 ns (IQR 10.000 ns) | 64.219 μs (IQR 3.527 μs) | 9.810 ms (IQR 34.904 μs) | 70.000 ns (IQR 10.000 ns) | 300.000 ns (IQR 0.000 ns) | 107.729 μs (IQR 3.515 μs) | 13.373 ms (IQR 124.972 μs) | 80.000 ns (IQR 0.000 ns) | 360.000 ns (IQR 0.000 ns) | 171.113 μs (IQR 4.553 μs) | 19.801 ms (IQR 558.067 μs) | 
+| Dierckx (k=3) | 150.000 ns (IQR 10.000 ns) | 1.250 μs (IQR 0.000 ns) | 134.424 μs (IQR 462.250 ns) | 13.515 ms (IQR 60.659 μs) | 290.000 ns (IQR 10.000 ns) | 3.960 μs (IQR 10.000 ns) | 412.197 μs (IQR 334.250 ns) | 41.079 ms (IQR 50.310 μs) | 1.480 μs (IQR 0.000 ns) | 30.050 μs (IQR 30.000 ns) | 3.232 ms (IQR 6.122 μs) | 321.523 ms (IQR 211.493 μs) | 13.540 μs (IQR 80.000 ns) | 291.423 μs (IQR 211.500 ns) | 31.510 ms (IQR 153.314 μs) | 3.190 s (IQR 0.000 ns) | 
+| FastInterpolations | 60.000 ns (IQR 2.500 ns) | 150.000 ns (IQR 0.000 ns) | 8.980 μs (IQR 10.000 ns) | 860.512 μs (IQR 4.238 μs) | 60.000 ns (IQR 0.000 ns) | 150.000 ns (IQR 0.000 ns) | 8.960 μs (IQR 60.000 ns) | 847.768 μs (IQR 4.537 μs) | 60.000 ns (IQR 0.000 ns) | 150.000 ns (IQR 0.000 ns) | 8.980 μs (IQR 40.000 ns) | 854.847 μs (IQR 8.707 μs) | 60.000 ns (IQR 0.000 ns) | 150.000 ns (IQR 0.000 ns) | 9.140 μs (IQR 40.000 ns) | 1.037 ms (IQR 5.805 μs) | 
+| Interpolations (uniform) | 90.000 ns (IQR 0.000 ns) | 270.000 ns (IQR 10.000 ns) | 20.430 μs (IQR 20.000 ns) | 2.046 ms (IQR 7.638 μs) | 90.000 ns (IQR 0.000 ns) | 270.000 ns (IQR 0.000 ns) | 20.470 μs (IQR 10.000 ns) | 2.046 ms (IQR 5.918 μs) | 90.000 ns (IQR 0.000 ns) | 270.000 ns (IQR 0.000 ns) | 20.420 μs (IQR 21.000 ns) | 2.044 ms (IQR 7.173 μs) | 90.000 ns (IQR 10.000 ns) | 270.000 ns (IQR 0.000 ns) | 20.450 μs (IQR 5.500 ns) | 2.048 ms (IQR 11.220 μs) | 
 
 ### Linear
 
 | Library | n=100,m=1 | n=100,m=10 | n=100,m=1000 | n=100,m=100000 | n=1000,m=1 | n=1000,m=10 | n=1000,m=1000 | n=1000,m=100000 | n=10000,m=1 | n=10000,m=10 | n=10000,m=1000 | n=10000,m=100000 | n=100000,m=1 | n=100000,m=10 | n=100000,m=1000 | n=100000,m=100000 | 
 |---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
-| DataInterpolations | 130.000 ns (IQR 0.000 ns) | 520.000 ns (IQR 10.000 ns) | 55.089 μs (IQR 111.500 ns) | 5.582 ms (IQR 35.069 μs) | 120.000 ns (IQR 0.000 ns) | 510.000 ns (IQR 10.000 ns) | 55.030 μs (IQR 172.500 ns) | 5.565 ms (IQR 31.740 μs) | 130.000 ns (IQR 10.000 ns) | 480.000 ns (IQR 0.000 ns) | 56.074 μs (IQR 649.500 ns) | 5.687 ms (IQR 50.330 μs) | 130.000 ns (IQR 10.000 ns) | 480.000 ns (IQR 0.000 ns) | 58.300 μs (IQR 568.500 ns) | 6.744 ms (IQR 64.104 μs) | 
-| BasicInterpolators | 60.000 ns (IQR 0.000 ns) | 180.000 ns (IQR 10.000 ns) | 29.580 μs (IQR 1.822 μs) | 6.435 ms (IQR 41.382 μs) | 60.000 ns (IQR 10.000 ns) | 230.000 ns (IQR 0.000 ns) | 64.855 μs (IQR 3.784 μs) | 9.784 ms (IQR 57.275 μs) | 70.000 ns (IQR 0.000 ns) | 300.000 ns (IQR 10.000 ns) | 105.934 μs (IQR 1.353 μs) | 13.251 ms (IQR 76.569 μs) | 80.000 ns (IQR 10.000 ns) | 360.000 ns (IQR 10.000 ns) | 167.988 μs (IQR 8.889 μs) | 19.198 ms (IQR 179.439 μs) | 
-| Dierckx (k=1) | 110.000 ns (IQR 0.000 ns) | 880.000 ns (IQR 0.000 ns) | 103.619 μs (IQR 592.500 ns) | 10.349 ms (IQR 87.979 μs) | 250.000 ns (IQR 0.000 ns) | 3.600 μs (IQR 10.000 ns) | 377.267 μs (IQR 260.250 ns) | 37.624 ms (IQR 375.581 μs) | 1.450 μs (IQR 10.000 ns) | 29.650 μs (IQR 23.250 ns) | 3.191 ms (IQR 13.440 μs) | 318.772 ms (IQR 307.167 μs) | 13.470 μs (IQR 40.000 ns) | 291.407 μs (IQR 310.000 ns) | 31.660 ms (IQR 145.164 μs) | 3.181 s (IQR 0.000 ns) | 
-| Interpolations (gridded) | 70.000 ns (IQR 2.500 ns) | 230.000 ns (IQR 10.000 ns) | 21.320 μs (IQR 824.250 ns) | 6.593 ms (IQR 59.599 μs) | 70.000 ns (IQR 10.000 ns) | 290.000 ns (IQR 0.000 ns) | 57.594 μs (IQR 7.278 μs) | 10.134 ms (IQR 55.693 μs) | 100.000 ns (IQR 20.000 ns) | 350.000 ns (IQR 2.500 ns) | 101.449 μs (IQR 5.872 μs) | 13.761 ms (IQR 140.448 μs) | 90.000 ns (IQR 0.000 ns) | 400.000 ns (IQR 10.000 ns) | 166.308 μs (IQR 6.663 μs) | 19.858 ms (IQR 70.962 μs) | 
-| Interpolations (uniform) | 70.000 ns (IQR 10.000 ns) | 120.000 ns (IQR 10.000 ns) | 6.560 μs (IQR 40.000 ns) | 655.544 μs (IQR 9.552 μs) | 60.000 ns (IQR 0.000 ns) | 120.000 ns (IQR 0.000 ns) | 6.630 μs (IQR 11.000 ns) | 655.564 μs (IQR 8.735 μs) | 70.000 ns (IQR 10.000 ns) | 120.000 ns (IQR 0.000 ns) | 6.889 μs (IQR 10.000 ns) | 683.948 μs (IQR 4.087 μs) | 70.000 ns (IQR 10.000 ns) | 120.000 ns (IQR 0.000 ns) | 7.160 μs (IQR 10.000 ns) | 752.648 μs (IQR 1.765 μs) | 
+| DataInterpolations | 120.000 ns (IQR 0.000 ns) | 480.000 ns (IQR 0.000 ns) | 83.519 μs (IQR 372.750 ns) | 8.415 ms (IQR 52.812 μs) | 130.000 ns (IQR 0.000 ns) | 770.000 ns (IQR 12.500 ns) | 108.679 μs (IQR 3.103 μs) | 11.532 ms (IQR 79.008 μs) | 140.000 ns (IQR 0.000 ns) | 700.000 ns (IQR 10.000 ns) | 141.614 μs (IQR 3.540 μs) | 15.566 ms (IQR 113.496 μs) | 150.000 ns (IQR 0.000 ns) | 820.000 ns (IQR 10.000 ns) | 208.248 μs (IQR 2.930 μs) | 22.285 ms (IQR 93.724 μs) | 
+| BasicInterpolators | 60.000 ns (IQR 0.000 ns) | 200.000 ns (IQR 0.000 ns) | 30.665 μs (IQR 533.250 ns) | 6.365 ms (IQR 46.459 μs) | 60.000 ns (IQR 10.000 ns) | 240.000 ns (IQR 0.000 ns) | 65.439 μs (IQR 3.513 μs) | 9.742 ms (IQR 67.108 μs) | 70.000 ns (IQR 0.000 ns) | 290.000 ns (IQR 0.000 ns) | 104.350 μs (IQR 3.683 μs) | 13.157 ms (IQR 127.214 μs) | 80.000 ns (IQR 0.000 ns) | 360.000 ns (IQR 10.000 ns) | 167.203 μs (IQR 4.349 μs) | 19.014 ms (IQR 160.544 μs) | 
+| Dierckx (k=1) | 110.000 ns (IQR 0.000 ns) | 870.000 ns (IQR 10.000 ns) | 98.819 μs (IQR 450.000 ns) | 10.105 ms (IQR 280.429 μs) | 260.000 ns (IQR 60.000 ns) | 3.610 μs (IQR 0.000 ns) | 376.521 μs (IQR 5.056 μs) | 37.694 ms (IQR 182.261 μs) | 1.455 μs (IQR 10.000 ns) | 29.699 μs (IQR 33.250 ns) | 3.194 ms (IQR 5.514 μs) | 321.630 ms (IQR 565.205 μs) | 13.500 μs (IQR 45.000 ns) | 291.442 μs (IQR 304.250 ns) | 31.515 ms (IQR 158.856 μs) | 3.173 s (IQR 0.000 ns) | 
+| FastInterpolations | 50.000 ns (IQR 0.000 ns) | 90.000 ns (IQR 10.000 ns) | 4.240 μs (IQR 0.000 ns) | 392.077 μs (IQR 5.178 μs) | 50.000 ns (IQR 0.000 ns) | 90.000 ns (IQR 0.000 ns) | 4.240 μs (IQR 32.500 ns) | 373.457 μs (IQR 3.303 μs) | 50.000 ns (IQR 0.000 ns) | 90.000 ns (IQR 0.000 ns) | 4.270 μs (IQR 50.000 ns) | 377.542 μs (IQR 4.339 μs) | 50.000 ns (IQR 0.000 ns) | 90.000 ns (IQR 10.000 ns) | 4.350 μs (IQR 30.000 ns) | 464.091 μs (IQR 4.390 μs) | 
+| Interpolations (gridded) | 70.000 ns (IQR 10.000 ns) | 230.000 ns (IQR 10.000 ns) | 25.485 μs (IQR 400.000 ns) | 6.346 ms (IQR 57.190 μs) | 80.000 ns (IQR 10.000 ns) | 270.000 ns (IQR 10.000 ns) | 60.749 μs (IQR 4.149 μs) | 9.964 ms (IQR 113.239 μs) | 80.000 ns (IQR 0.000 ns) | 350.000 ns (IQR 0.000 ns) | 106.214 μs (IQR 5.040 μs) | 13.345 ms (IQR 47.422 μs) | 90.000 ns (IQR 0.000 ns) | 410.000 ns (IQR 0.000 ns) | 172.038 μs (IQR 6.404 μs) | 19.450 ms (IQR 135.066 μs) | 
+| Interpolations (uniform) | 70.000 ns (IQR 2.500 ns) | 120.000 ns (IQR 10.000 ns) | 6.600 μs (IQR 30.000 ns) | 655.404 μs (IQR 625.000 ns) | 70.000 ns (IQR 0.000 ns) | 120.000 ns (IQR 10.000 ns) | 6.600 μs (IQR 20.000 ns) | 661.254 μs (IQR 8.865 μs) | 70.000 ns (IQR 10.000 ns) | 120.000 ns (IQR 10.000 ns) | 6.890 μs (IQR 20.000 ns) | 683.869 μs (IQR 335.000 ns) | 70.000 ns (IQR 0.000 ns) | 120.000 ns (IQR 0.000 ns) | 7.170 μs (IQR 20.000 ns) | 752.364 μs (IQR 8.863 μs) | 
 
 ### MonotoneCubic
 
 | Library | n=100,m=1 | n=100,m=10 | n=100,m=1000 | n=100,m=100000 | n=1000,m=1 | n=1000,m=10 | n=1000,m=1000 | n=1000,m=100000 | n=10000,m=1 | n=10000,m=10 | n=10000,m=1000 | n=10000,m=100000 | n=100000,m=1 | n=100000,m=10 | n=100000,m=1000 | n=100000,m=100000 | 
 |---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
-| DataInterpolations (CubicHermite) | 130.000 ns (IQR 10.000 ns) | 530.000 ns (IQR 0.000 ns) | 52.569 μs (IQR 80.000 ns) | 5.297 ms (IQR 17.295 μs) | 130.000 ns (IQR 10.000 ns) | 530.000 ns (IQR 10.000 ns) | 53.119 μs (IQR 119.500 ns) | 5.326 ms (IQR 26.192 μs) | 140.000 ns (IQR 10.000 ns) | 520.000 ns (IQR 10.000 ns) | 57.039 μs (IQR 395.000 ns) | 5.697 ms (IQR 20.677 μs) | 150.000 ns (IQR 0.000 ns) | 540.000 ns (IQR 10.000 ns) | 61.514 μs (IQR 244.750 ns) | 7.278 ms (IQR 31.449 μs) | 
-| PCHIPInterpolation | 80.000 ns (IQR 10.000 ns) | 240.000 ns (IQR 10.000 ns) | 24.865 μs (IQR 1.385 μs) | 6.407 ms (IQR 40.035 μs) | 100.000 ns (IQR 20.000 ns) | 340.000 ns (IQR 10.000 ns) | 65.279 μs (IQR 569.000 ns) | 9.842 ms (IQR 42.269 μs) | 90.000 ns (IQR 10.000 ns) | 440.000 ns (IQR 0.000 ns) | 117.314 μs (IQR 3.672 μs) | 14.126 ms (IQR 36.737 μs) | 110.000 ns (IQR 10.000 ns) | 480.000 ns (IQR 10.000 ns) | 182.258 μs (IQR 4.223 μs) | 20.388 ms (IQR 38.910 μs) | 
+| DataInterpolations (CubicHermite) | 130.000 ns (IQR 0.000 ns) | 550.000 ns (IQR 10.000 ns) | 88.869 μs (IQR 182.750 ns) | 8.923 ms (IQR 45.887 μs) | 140.000 ns (IQR 0.000 ns) | 750.000 ns (IQR 10.000 ns) | 114.689 μs (IQR 312.750 ns) | 12.259 ms (IQR 81.830 μs) | 150.000 ns (IQR 0.000 ns) | 760.000 ns (IQR 10.000 ns) | 149.914 μs (IQR 4.128 μs) | 16.358 ms (IQR 36.446 μs) | 160.000 ns (IQR 10.000 ns) | 850.000 ns (IQR 10.000 ns) | 225.383 μs (IQR 3.223 μs) | 24.150 ms (IQR 233.658 μs) | 
+| FastInterpolations (PCHIP) | 60.000 ns (IQR 0.000 ns) | 180.000 ns (IQR 10.000 ns) | 11.240 μs (IQR 10.000 ns) | 1.070 ms (IQR 6.601 μs) | 60.000 ns (IQR 0.000 ns) | 170.000 ns (IQR 0.000 ns) | 11.150 μs (IQR 140.000 ns) | 1.071 ms (IQR 10.822 μs) | 60.000 ns (IQR 0.000 ns) | 180.000 ns (IQR 10.000 ns) | 11.140 μs (IQR 24.750 ns) | 1.068 ms (IQR 5.527 μs) | 60.000 ns (IQR 0.000 ns) | 190.000 ns (IQR 10.000 ns) | 11.240 μs (IQR 40.000 ns) | 1.114 ms (IQR 9.055 μs) | 
+| PCHIPInterpolation | 70.000 ns (IQR 10.000 ns) | 250.000 ns (IQR 0.000 ns) | 25.435 μs (IQR 1.558 μs) | 6.446 ms (IQR 16.104 μs) | 90.000 ns (IQR 0.000 ns) | 345.000 ns (IQR 10.000 ns) | 63.260 μs (IQR 2.118 μs) | 9.963 ms (IQR 79.389 μs) | 90.000 ns (IQR 0.000 ns) | 440.000 ns (IQR 10.000 ns) | 118.869 μs (IQR 4.293 μs) | 14.222 ms (IQR 93.245 μs) | 110.000 ns (IQR 10.000 ns) | 490.000 ns (IQR 10.000 ns) | 185.893 μs (IQR 5.101 μs) | 20.408 ms (IQR 54.869 μs) | 
 
 ### QuadraticSpline
 
 | Library | n=100,m=1 | n=100,m=10 | n=100,m=1000 | n=100,m=100000 | n=1000,m=1 | n=1000,m=10 | n=1000,m=1000 | n=1000,m=100000 | n=10000,m=1 | n=10000,m=10 | n=10000,m=1000 | n=10000,m=100000 | n=100000,m=1 | n=100000,m=10 | n=100000,m=1000 | n=100000,m=100000 | 
 |---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
-| DataInterpolations | 230.000 ns (IQR 10.000 ns) | 1.650 μs (IQR 10.000 ns) | 169.573 μs (IQR 1.357 μs) | 17.094 ms (IQR 49.515 μs) | 540.000 ns (IQR 10.000 ns) | 7.080 μs (IQR 10.000 ns) | 750.153 μs (IQR 7.195 μs) | 74.773 ms (IQR 70.109 μs) | 3.630 μs (IQR 22.250 ns) | 62.340 μs (IQR 43.250 ns) | 6.627 ms (IQR 25.269 μs) | 669.475 ms (IQR 0.000 ns) | 39.715 μs (IQR 720.000 ns) | 663.894 μs (IQR 3.838 μs) | 70.311 ms (IQR 31.738 μs) | 7.058 s (IQR 0.000 ns) | 
-| Dierckx (k=2) | 130.000 ns (IQR 0.000 ns) | 1.060 μs (IQR 0.000 ns) | 116.774 μs (IQR 711.750 ns) | 11.700 ms (IQR 35.465 μs) | 270.000 ns (IQR 10.000 ns) | 3.790 μs (IQR 10.000 ns) | 394.467 μs (IQR 301.750 ns) | 39.408 ms (IQR 62.060 μs) | 1.480 μs (IQR 2.500 ns) | 29.880 μs (IQR 30.000 ns) | 3.209 ms (IQR 5.805 μs) | 320.457 ms (IQR 632.470 μs) | 13.500 μs (IQR 50.000 ns) | 291.127 μs (IQR 298.500 ns) | 31.489 ms (IQR 130.091 μs) | 3.195 s (IQR 0.000 ns) | 
+| DataInterpolations | 210.000 ns (IQR 0.000 ns) | 1.270 μs (IQR 0.000 ns) | 188.969 μs (IQR 920.000 ns) | 19.321 ms (IQR 149.183 μs) | 310.000 ns (IQR 10.000 ns) | 2.720 μs (IQR 10.000 ns) | 347.986 μs (IQR 3.498 μs) | 36.760 ms (IQR 66.121 μs) | 1.300 μs (IQR 20.000 ns) | 12.700 μs (IQR 61.750 ns) | 1.444 ms (IQR 9.453 μs) | 145.560 ms (IQR 123.712 μs) | 15.650 μs (IQR 700.000 ns) | 146.198 μs (IQR 282.250 ns) | 16.271 ms (IQR 285.353 μs) | 1.616 s (IQR 0.000 ns) | 
+| Dierckx (k=2) | 130.000 ns (IQR 0.000 ns) | 1.060 μs (IQR 10.000 ns) | 117.319 μs (IQR 3.700 μs) | 11.766 ms (IQR 113.288 μs) | 270.000 ns (IQR 10.000 ns) | 3.780 μs (IQR 0.000 ns) | 394.716 μs (IQR 372.250 ns) | 39.406 ms (IQR 139.238 μs) | 1.470 μs (IQR 20.000 ns) | 29.990 μs (IQR 44.750 ns) | 3.214 ms (IQR 5.622 μs) | 320.480 ms (IQR 312.612 μs) | 13.520 μs (IQR 90.000 ns) | 291.358 μs (IQR 312.500 ns) | 32.152 ms (IQR 591.392 μs) | 3.155 s (IQR 0.000 ns) | 
+| FastInterpolations | 50.000 ns (IQR 10.000 ns) | 110.000 ns (IQR 0.000 ns) | 4.030 μs (IQR 30.000 ns) | 366.447 μs (IQR 4.920 μs) | 50.000 ns (IQR 10.000 ns) | 110.000 ns (IQR 0.000 ns) | 4.000 μs (IQR 50.000 ns) | 351.122 μs (IQR 4.475 μs) | 50.000 ns (IQR 10.000 ns) | 110.000 ns (IQR 2.500 ns) | 4.150 μs (IQR 50.000 ns) | 412.296 μs (IQR 4.755 μs) | 50.000 ns (IQR 10.000 ns) | 110.000 ns (IQR 0.000 ns) | 4.475 μs (IQR 80.000 ns) | 478.275 μs (IQR 4.135 μs) | 
 
 ## Chained ODE-style
 
@@ -229,51 +232,160 @@ Sequential `for x in tt; A(x); end` over a monotone sequence. (knot pattern = un
 
 | Library | n=100,m=1000 | n=1000,m=1000 | n=10000,m=1000 | n=100000,m=1000 | 
 |---|---|---|---|---|
-| DataInterpolations | 40.720 μs (IQR 21.000 ns) | 47.709 μs (IQR 51.000 ns) | 47.785 μs (IQR 129.250 ns) | 63.300 μs (IQR 381.500 ns) | 
+| DataInterpolations | 55.874 μs (IQR 224.000 ns) | 80.234 μs (IQR 400.250 ns) | 116.019 μs (IQR 2.942 μs) | 163.899 μs (IQR 4.407 μs) | 
+| FastInterpolations | 10.970 μs (IQR 9.250 ns) | 11.040 μs (IQR 1.000 ns) | 11.030 μs (IQR 410.000 ns) | 11.420 μs (IQR 93.250 ns) | 
 
 ### CubicSpline
 
 | Library | n=100,m=1000 | n=1000,m=1000 | n=10000,m=1000 | n=100000,m=1000 | 
 |---|---|---|---|---|
-| DataInterpolations | 46.169 μs (IQR 20.000 ns) | 52.069 μs (IQR 350.000 ns) | 52.645 μs (IQR 225.500 ns) | 69.550 μs (IQR 362.500 ns) | 
-| BasicInterpolators | 16.989 μs (IQR 459.250 ns) | 47.639 μs (IQR 1.077 μs) | 86.939 μs (IQR 2.837 μs) | 136.684 μs (IQR 2.812 μs) | 
-| Dierckx (k=3) | 122.399 μs (IQR 52.500 ns) | 409.806 μs (IQR 50.000 ns) | 3.212 ms (IQR 2.620 μs) | 31.457 ms (IQR 222.590 μs) | 
-| Interpolations (uniform) | 27.750 μs (IQR 600.000 ns) | 27.749 μs (IQR 499.250 ns) | 27.750 μs (IQR 1.179 μs) | 27.750 μs (IQR 440.000 ns) | 
+| DataInterpolations | 59.995 μs (IQR 562.250 ns) | 81.979 μs (IQR 374.500 ns) | 113.249 μs (IQR 3.044 μs) | 178.064 μs (IQR 5.123 μs) | 
+| BasicInterpolators | 17.450 μs (IQR 357.500 ns) | 45.319 μs (IQR 1.970 μs) | 85.799 μs (IQR 2.695 μs) | 140.149 μs (IQR 2.475 μs) | 
+| Dierckx (k=3) | 122.163 μs (IQR 72.250 ns) | 410.447 μs (IQR 169.250 ns) | 3.214 ms (IQR 6.145 μs) | 31.322 ms (IQR 130.226 μs) | 
+| FastInterpolations | 10.150 μs (IQR 10.000 ns) | 10.140 μs (IQR 20.000 ns) | 10.160 μs (IQR 12.250 ns) | 10.950 μs (IQR 99.250 ns) | 
+| Interpolations (uniform) | 27.260 μs (IQR 490.000 ns) | 27.850 μs (IQR 0.250 ns) | 27.509 μs (IQR 500.000 ns) | 27.720 μs (IQR 420.000 ns) | 
 
 ### Linear
 
 | Library | n=100,m=1000 | n=1000,m=1000 | n=10000,m=1000 | n=100000,m=1000 | 
 |---|---|---|---|---|
-| DataInterpolations | 42.920 μs (IQR 10.000 ns) | 49.549 μs (IQR 130.250 ns) | 50.259 μs (IQR 159.250 ns) | 55.679 μs (IQR 428.000 ns) | 
-| BasicInterpolators | 17.259 μs (IQR 92.500 ns) | 44.764 μs (IQR 3.072 μs) | 82.629 μs (IQR 2.270 μs) | 132.393 μs (IQR 2.408 μs) | 
-| Dierckx (k=1) | 87.039 μs (IQR 70.000 ns) | 374.796 μs (IQR 415.500 ns) | 3.199 ms (IQR 48.275 μs) | 31.242 ms (IQR 56.158 μs) | 
-| Interpolations (gridded) | 23.920 μs (IQR 449.750 ns) | 58.344 μs (IQR 2.035 μs) | 87.894 μs (IQR 3.572 μs) | 141.208 μs (IQR 3.995 μs) | 
-| Interpolations (uniform) | 23.050 μs (IQR 21.000 ns) | 23.060 μs (IQR 30.000 ns) | 23.040 μs (IQR 50.000 ns) | 23.129 μs (IQR 40.000 ns) | 
+| DataInterpolations | 55.260 μs (IQR 104.750 ns) | 77.310 μs (IQR 362.500 ns) | 109.109 μs (IQR 3.022 μs) | 162.824 μs (IQR 2.605 μs) | 
+| BasicInterpolators | 17.130 μs (IQR 430.000 ns) | 49.775 μs (IQR 2.400 μs) | 87.274 μs (IQR 4.043 μs) | 135.179 μs (IQR 2.735 μs) | 
+| Dierckx (k=1) | 86.279 μs (IQR 450.000 ns) | 374.666 μs (IQR 50.000 ns) | 3.185 ms (IQR 19.682 μs) | 31.293 ms (IQR 85.214 μs) | 
+| FastInterpolations | 3.510 μs (IQR 10.000 ns) | 3.500 μs (IQR 20.000 ns) | 3.550 μs (IQR 12.250 ns) | 3.650 μs (IQR 10.000 ns) | 
+| Interpolations (gridded) | 23.720 μs (IQR 162.500 ns) | 56.059 μs (IQR 2.413 μs) | 89.024 μs (IQR 3.799 μs) | 139.869 μs (IQR 3.240 μs) | 
+| Interpolations (uniform) | 23.050 μs (IQR 11.000 ns) | 23.050 μs (IQR 30.000 ns) | 23.059 μs (IQR 10.000 ns) | 23.120 μs (IQR 39.250 ns) | 
 
 ### MonotoneCubic
 
 | Library | n=100,m=1000 | n=1000,m=1000 | n=10000,m=1000 | n=100000,m=1000 | 
 |---|---|---|---|---|
-| DataInterpolations (CubicHermite) | 50.009 μs (IQR 30.000 ns) | 54.480 μs (IQR 109.000 ns) | 53.984 μs (IQR 110.000 ns) | 71.909 μs (IQR 809.250 ns) | 
-| PCHIPInterpolation | 25.240 μs (IQR 300.000 ns) | 50.559 μs (IQR 934.000 ns) | 93.234 μs (IQR 1.728 μs) | 148.724 μs (IQR 7.090 μs) | 
+| DataInterpolations (CubicHermite) | 67.909 μs (IQR 212.750 ns) | 89.499 μs (IQR 411.750 ns) | 121.504 μs (IQR 4.065 μs) | 180.869 μs (IQR 3.533 μs) | 
+| FastInterpolations (PCHIP) | 11.170 μs (IQR 10.000 ns) | 11.070 μs (IQR 100.000 ns) | 11.020 μs (IQR 45.000 ns) | 11.380 μs (IQR 80.000 ns) | 
+| PCHIPInterpolation | 25.144 μs (IQR 229.250 ns) | 53.205 μs (IQR 303.250 ns) | 94.259 μs (IQR 1.500 μs) | 150.668 μs (IQR 4.713 μs) | 
 
 ### QuadraticSpline
 
 | Library | n=100,m=1000 | n=1000,m=1000 | n=10000,m=1000 | n=100000,m=1000 | 
 |---|---|---|---|---|
-| DataInterpolations | 163.768 μs (IQR 173.250 ns) | 743.168 μs (IQR 397.500 ns) | 6.613 ms (IQR 60.383 μs) | 70.305 ms (IQR 457.841 μs) | 
-| Dierckx (k=2) | 104.904 μs (IQR 220.000 ns) | 393.182 μs (IQR 351.000 ns) | 3.190 ms (IQR 1.820 μs) | 31.236 ms (IQR 63.944 μs) | 
+| DataInterpolations | 137.358 μs (IQR 460.500 ns) | 268.752 μs (IQR 559.250 ns) | 1.322 ms (IQR 6.378 μs) | 15.843 ms (IQR 1.173 ms) | 
+| Dierckx (k=2) | 104.454 μs (IQR 240.000 ns) | 393.216 μs (IQR 341.000 ns) | 3.187 ms (IQR 5.403 μs) | 31.297 ms (IQR 52.556 μs) | 
+| FastInterpolations | 3.310 μs (IQR 2.500 ns) | 3.310 μs (IQR 10.000 ns) | 3.450 μs (IQR 20.000 ns) | 4.650 μs (IQR 40.000 ns) | 
+
+## FastInterpolations.jl advertised benchmark
+
+Numbers below come from `bench/fast_interpolations_bench.jl`, a port of
+FastInterpolations.jl's own `benchmark/interpolation_benchmark.jl`
+(ProjectTorreyPines/FastInterpolations.jl, upstream commit `616b106b`). It runs
+the matrix-of-interpolants workload they advertise on their README:
+`mpert × mpert` independent 1D interpolants over a shared uniform
+`range(0.0, 1.0; length = npsi)` grid, evaluated at `n_eval` query points
+clustered near psi=0 (cubic spacing — mimics ODE solver behavior near
+singular surfaces). Default size: `npsi = 64`, `mpert = 100`, `n_eval = 1000`
+(10⁴ interpolants × 10³ queries = 10⁷ total scalar evaluations).
+
+### Cubic spline, `--default` (npsi=64, mpert=100, n_eval=1000)
+
+| Package | Init (ms) | Eval (ms) | Total (ms) | Speedup vs DI scalar |
+|---|---|---|---|---|
+| FastInterpolations.jl (Series+scalar) | 16.508 | 5.751 | 22.259 | 73.28× |
+| FastInterpolations.jl (Series+vector) | 16.508 | 22.521 | 39.029 | 41.80× |
+| FastInterpolations.jl (vector)        | 31.631 | 95.125 | 126.757 | 12.87× |
+| DataInterpolations.jl (vector)        | 93.259 | 103.438 | 196.697 |  8.29× |
+| FastInterpolations.jl (scalar)        | 31.631 | 171.245 | 202.876 |  8.04× |
+| Interpolations.jl (broadcast)         | 139.363 | 212.500 | 351.863 |  4.64× |
+| Interpolations.jl (scalar)            | 139.363 | 427.833 | 567.196 |  2.88× |
+| Dierckx.jl (vector)                   | 127.741 | 566.160 | 693.901 |  2.35× |
+| DataInterpolations.jl (scalar)        |  93.259 | 1537.974 | 1631.233 | 1.00× |
+| Dierckx.jl (scalar)                   | 127.741 | 1590.398 | 1718.139 | 0.95× |
+
+### Linear, `--default` (npsi=64, mpert=100, n_eval=1000)
+
+| Package | Init (ms) | Eval (ms) | Total (ms) | Speedup vs DI scalar |
+|---|---|---|---|---|
+| FastInterpolations.jl (Series+scalar) |  5.649 |   3.173 |    8.822 | 102.83× |
+| FastInterpolations.jl (Series+vector) |  5.649 |  21.019 |   26.668 |  34.02× |
+| FastInterpolations.jl (vector)        | 10.481 |  49.861 |   60.343 |  15.03× |
+| DataInterpolations.jl (vector)        | 15.629 |  64.376 |   80.005 |  11.34× |
+| Interpolations.jl (broadcast)         |  9.634 |  70.787 |   80.421 |  11.28× |
+| FastInterpolations.jl (scalar)        | 10.481 |  90.099 |  100.580 |   9.02× |
+| Interpolations.jl (scalar)            |  9.634 | 211.753 |  221.387 |   4.10× |
+| Dierckx.jl (vector)                   | 77.443 | 244.645 |  322.088 |   2.82× |
+| DataInterpolations.jl (scalar)        | 15.629 | 891.534 |  907.163 |   1.00× |
+| Dierckx.jl (scalar)                   | 77.443 |1236.548 | 1313.991 |   0.69× |
+
+## Findings
+
+### Where FastInterpolations.jl beats DI
+
+  1. **Series interpolant + matrix-of-interpolants workload.** FastInterpolations'
+     `Series` API computes the cell anchor (index, alpha, neighbouring grid
+     points) once per query point and reuses it across all 10⁴ coefficient
+     series. DI has no equivalent — each interpolant runs an independent
+     search per query. The 70-100× speedup at `--default` size is real and
+     unfixable without an analogous "shared anchor / Series" type in DI. This
+     is a separate design proposal; out of scope for this PR.
+
+  2. **Per-query scalar evaluation on uniform-`Vector` grids.** In the
+     cross-library bench (we `_vec(t)` before passing to every library to
+     compare like-for-like), DI's per-query latency is ~100-200 ns,
+     FastInterpolations' is ~50 ns. The gap is in the scalar kernel call
+     overhead and the dispatch through `Auto(t_props)`.
+     FastInterpolations' `_search_direct(::_CachedRange, q)` is a single
+     `unsafe_trunc(Int, muladd(q - lo, inv_h, 1))` — fewer instructions than
+     FFF's `Auto` → `UniformStep` path which still goes through method
+     dispatch. Closing this gap on DI would require either:
+       - resolving `Auto` to a concrete strategy at *construction* time (so
+         `_interpolate` doesn't dispatch through `Auto` at all), or
+       - making FFF `Auto` simpler to specialize at the call site.
+
+  3. **Batched / chained evaluation on uniform `Vector` grids.** DI's batched
+     loop is ~10-30 μs for m=1000 queries; FastInterpolations gets to
+     ~3-4 μs because their vectorized batch loop avoids per-call function-
+     pointer dispatch entirely. The remaining gap is partly the kernel
+     overhead from (2) and partly that FastInterpolations always knows the
+     search policy at compile time (it's a type parameter on its `Searcher`).
+
+### Where DI matches FastInterpolations.jl
+
+  - **Non-uniform construction** (Akima, CubicSpline, QuadraticSpline) at
+    large n. DI and FastInterpolations are within ~30% on construction time
+    once n ≥ 10k. The new `Auto(A.t_props)` + `O(n)` `spline_coefficients!`
+    fix on this branch closes the gap from where it was before.
+  - **Sorted-batch evaluation on non-uniform grids** at large m. FFF's
+    `BracketGallop` / `LinearScan` strategies + the batched-Auto
+    specialization keep DI competitive once the batch is large enough to
+    amortize the type-instability overhead from `_resolve_search_policy`.
+
+### Where DI loses but the fix is out-of-scope for this PR
+
+  - Per-query latency on `Vector{Float64}` grids: DI's per-call path goes
+    `interp(t) → _interpolate(A, t) → _interpolate(A, t, A.iguesser) →
+    get_idx → Auto(A.t_props) → searchsortedlast(Auto, v, q, hint)`. Each
+    indirection is ~5-10 ns; FastInterpolations' direct dispatch path is
+    one or two indirections. Reducing this means either inlining `get_idx`
+    into `_interpolate` per type, or storing a *resolved* concrete search
+    strategy at construction time rather than a generic `Auto(props)` —
+    both substantial restructurings.
+  - No `Series`-style anchor reuse: a different type system. Worth a
+    separate proposal; the design space is large.
 
 ## Reproducer
 
 Bench script: `bench/cross_library_comparison.jl`
 
+FastInterpolations-style bench: `bench/fast_interpolations_bench.jl`
+(port of ProjectTorreyPines/FastInterpolations.jl's
+`benchmark/interpolation_benchmark.jl`, commit `616b106b`).
+
 Bench Project.toml: `bench/Project.toml` (devs DI from `..`).
 
 To rerun:
 ```bash
 cd /home/crackauc/sandbox/tmp_20260515_091703_4914/DataInterpolations.jl
-git checkout fff-strategy-batched-evals
+git checkout fff-v2-cleanup-quadraticspline
 julia +1.11 --project=bench bench/cross_library_comparison.jl
+julia +1.11 --project=bench bench/fast_interpolations_bench.jl --cubic --default
+julia +1.11 --project=bench bench/fast_interpolations_bench.jl --linear --default
 ```
 

From 9889bf6d935f402a936b4910224dac543df2c32d Mon Sep 17 00:00:00 2001
From: ChrisRackauckas-Claude <accounts@chrisrackauckas.com>
Date: Thu, 21 May 2026 18:00:18 -0400
Subject: [PATCH 08/24] Cache concrete search strategy per interpolation for
 static dispatch
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Adds a `strategy::strategyType` field to every interpolation cache (13
caches in `interpolation_caches.jl` + 2 inverses in `integral_inverses.jl`).
The strategy is resolved at construction time via `_resolve_strategy(t)`
to a concrete `FindFirstFunctions.SearchStrategy` singleton (`BracketGallop`).
`get_idx` now reads `A.strategy` directly instead of wrapping `A.t_props`
in `FindFirstFunctions.Auto(...)` per call.

The win is type-level: `Auto`'s per-query `_auto_pick` returned
`Union{BinaryBracket, LinearScan, BracketGallop}` based on `length(v)` and
hint validity, forcing a runtime branch + small-union dispatch on every
`get_idx`. Storing the resolved strategy as a singleton field lets the
compiler inline `searchsortedlast(::BracketGallop, ...)` end-to-end.

Always picks `BracketGallop` (not size-dependent): the `LinearScan` branch
for `length(t) <= 16` would make `_resolve_strategy` return a small union
and propagate that union into the cache's type parameters — breaking
`@inferred` tests downstream. The `LinearScan` benefit at tiny `n` is
~10 ns in absolute terms; not worth the inference instability.

Single-query latency on uniform `Vector` grid (FastInterpolations parity
target, BenchmarkTools median):

| n     | before  | after   | FI     | ratio before -> after |
|-------|---------|---------|--------|-----------------------|
| 100   | 70 ns   | 70 ns   | 50 ns  | 1.4x  -> 1.4x         |
| 1000  | 80 ns   | 70 ns   | 50 ns  | 1.6x  -> 1.4x         |
| 10000 | 90 ns   | 70 ns   | 60 ns  | 1.5x  -> 1.17x        |

Batched paths still pass `FindFirstFunctions.Auto(A.t_props)` to
`searchsortedlast!` — the batched-Auto specialization picks `LinearScan`/
`SIMDLinearScan`/`InterpolationSearch`/`BracketGallop`/`ExpFromLeft` based
on `(gap, has_nan, is_linear)`, which the per-query path's
`BracketGallop` can't replicate. The per-batch Auto probe amortises
across queries; the per-query Auto probe didn't.

Co-Authored-By: Chris Rackauckas <accounts@chrisrackauckas.com>
---
 src/integral_inverses.jl    |  24 +++++--
 src/interpolation_caches.jl | 126 +++++++++++++++++++++++++-----------
 src/interpolation_utils.jl  |  23 +++++--
 3 files changed, 123 insertions(+), 50 deletions(-)

diff --git a/src/integral_inverses.jl b/src/integral_inverses.jl
index 936f5ab4..f5aef1f4 100644
--- a/src/integral_inverses.jl
+++ b/src/integral_inverses.jl
@@ -33,7 +33,7 @@ Can be easily constructed with `invert_integral(A::LinearInterpolation{<:Abstrac
   - `t` : Given by `A.I` (the cumulative integral of `A`)
   - `A` : The `LinearInterpolation` object
 """
-struct LinearInterpolationIntInv{uType, tType, itpType, T, propsType} <:
+struct LinearInterpolationIntInv{uType, tType, itpType, T, propsType, strategyType} <:
     AbstractIntegralInverseInterpolation{T}
     u::uType
     t::tType
@@ -41,12 +41,18 @@ struct LinearInterpolationIntInv{uType, tType, itpType, T, propsType} <:
     extrapolation_right::ExtrapolationType.T
     iguesser::Guesser{tType}
     t_props::propsType
+    strategy::strategyType
     itp::itpType
     function LinearInterpolationIntInv(
             u, t, A, extrapolation_left, extrapolation_right, t_props,
         )
-        return new{typeof(u), typeof(t), typeof(A), eltype(u), typeof(t_props)}(
-            u, t, extrapolation_left, extrapolation_right, Guesser(t), t_props, A
+        strategy = _resolve_strategy(t)
+        return new{
+            typeof(u), typeof(t), typeof(A), eltype(u),
+            typeof(t_props), typeof(strategy),
+        }(
+            u, t, extrapolation_left, extrapolation_right,
+            Guesser(t), t_props, strategy, A
         )
     end
 end
@@ -98,7 +104,7 @@ Can be easily constructed with `invert_integral(A::ConstantInterpolation{<:Abstr
   - `t` : Given by `A.I` (the cumulative integral of `A`)
   - `A` : The `ConstantInterpolation` object
 """
-struct ConstantInterpolationIntInv{uType, tType, itpType, T, propsType} <:
+struct ConstantInterpolationIntInv{uType, tType, itpType, T, propsType, strategyType} <:
     AbstractIntegralInverseInterpolation{T}
     u::uType
     t::tType
@@ -106,12 +112,18 @@ struct ConstantInterpolationIntInv{uType, tType, itpType, T, propsType} <:
     extrapolation_right::ExtrapolationType.T
     iguesser::Guesser{tType}
     t_props::propsType
+    strategy::strategyType
     itp::itpType
     function ConstantInterpolationIntInv(
             u, t, A, extrapolation_left, extrapolation_right, t_props,
         )
-        return new{typeof(u), typeof(t), typeof(A), eltype(u), typeof(t_props)}(
-            u, t, extrapolation_left, extrapolation_right, Guesser(t), t_props, A
+        strategy = _resolve_strategy(t)
+        return new{
+            typeof(u), typeof(t), typeof(A), eltype(u),
+            typeof(t_props), typeof(strategy),
+        }(
+            u, t, extrapolation_left, extrapolation_right,
+            Guesser(t), t_props, strategy, A
         )
     end
 end
diff --git a/src/interpolation_caches.jl b/src/interpolation_caches.jl
index 1a94fc07..89f24669 100644
--- a/src/interpolation_caches.jl
+++ b/src/interpolation_caches.jl
@@ -23,7 +23,7 @@ Extrapolation extends the last linear polynomial on each side.
   - `cache_parameters`: precompute parameters at initialization for faster interpolation
     computations. Note: if activated, `u` and `t` should not be modified. Defaults to `false`.
 """
-struct LinearInterpolation{uType, tType, IType, pType, T, propsType} <:
+struct LinearInterpolation{uType, tType, IType, pType, T, propsType, strategyType} <:
     AbstractInterpolation{T}
     u::uType
     t::tType
@@ -33,17 +33,19 @@ struct LinearInterpolation{uType, tType, IType, pType, T, propsType} <:
     extrapolation_right::ExtrapolationType.T
     iguesser::Guesser{tType}
     t_props::propsType
+    strategy::strategyType
     cache_parameters::Bool
     function LinearInterpolation(
             u, t, I, p, extrapolation_left, extrapolation_right,
             cache_parameters, t_props
         )
+        strategy = _resolve_strategy(t)
         return new{
             typeof(u), typeof(t), typeof(I), typeof(p.slope),
-            eltype(u), typeof(t_props),
+            eltype(u), typeof(t_props), typeof(strategy),
         }(
             u, t, I, p, extrapolation_left, extrapolation_right,
-            Guesser(t), t_props, cache_parameters
+            Guesser(t), t_props, strategy, cache_parameters
         )
     end
 end
@@ -98,7 +100,7 @@ Extrapolation extends the last quadratic polynomial on each side.
     the possible options. This keyword is ignored if `extrapolation != Extrapolation.none`.
   - `cache_parameters`: precompute parameters at initialization for faster interpolation computations. Note: if activated, `u` and `t` should not be modified. Defaults to `false`.
 """
-struct QuadraticInterpolation{uType, tType, IType, pType, T, propsType} <:
+struct QuadraticInterpolation{uType, tType, IType, pType, T, propsType, strategyType} <:
     AbstractInterpolation{T}
     u::uType
     t::tType
@@ -109,6 +111,7 @@ struct QuadraticInterpolation{uType, tType, IType, pType, T, propsType} <:
     extrapolation_right::ExtrapolationType.T
     iguesser::Guesser{tType}
     t_props::propsType
+    strategy::strategyType
     cache_parameters::Bool
     function QuadraticInterpolation(
             u, t, I, p, mode, extrapolation_left,
@@ -116,12 +119,13 @@ struct QuadraticInterpolation{uType, tType, IType, pType, T, propsType} <:
         )
         mode ∈ (:Forward, :Backward) ||
             error("mode should be :Forward or :Backward for QuadraticInterpolation")
+        strategy = _resolve_strategy(t)
         return new{
             typeof(u), typeof(t), typeof(I), typeof(p.α),
-            eltype(u), typeof(t_props),
+            eltype(u), typeof(t_props), typeof(strategy),
         }(
             u, t, I, p, mode, extrapolation_left, extrapolation_right,
-            Guesser(t), t_props, cache_parameters
+            Guesser(t), t_props, strategy, cache_parameters
         )
     end
 end
@@ -177,7 +181,7 @@ It is the method of interpolation using Lagrange polynomials of (k-1)th order pa
   - `extrapolation_right`: The extrapolation type applied right of the data. See `extrapolation` for
     the possible options. This keyword is ignored if `extrapolation != Extrapolation.none`.
 """
-struct LagrangeInterpolation{uType, tType, T, bcacheType, propsType} <:
+struct LagrangeInterpolation{uType, tType, T, bcacheType, propsType, strategyType} <:
     AbstractInterpolation{T}
     u::uType
     t::tType
@@ -188,11 +192,16 @@ struct LagrangeInterpolation{uType, tType, T, bcacheType, propsType} <:
     extrapolation_right::ExtrapolationType.T
     iguesser::Guesser{tType}
     t_props::propsType
+    strategy::strategyType
     function LagrangeInterpolation(u, t, n, extrapolation_left, extrapolation_right, t_props)
         bcache = zeros(eltype(u[1]), n + 1)
         idxs = zeros(Int, n + 1)
         fill!(bcache, NaN)
-        return new{typeof(u), typeof(t), eltype(u), typeof(bcache), typeof(t_props)}(
+        strategy = _resolve_strategy(t)
+        return new{
+            typeof(u), typeof(t), eltype(u), typeof(bcache),
+            typeof(t_props), typeof(strategy),
+        }(
             u,
             t,
             n,
@@ -201,7 +210,8 @@ struct LagrangeInterpolation{uType, tType, T, bcacheType, propsType} <:
             extrapolation_left,
             extrapolation_right,
             Guesser(t),
-            t_props
+            t_props,
+            strategy
         )
     end
 end
@@ -253,7 +263,9 @@ Extrapolation extends the last cubic polynomial on each side.
     the possible options. This keyword is ignored if `extrapolation != Extrapolation.none`.
   - `cache_parameters`: precompute parameters at initialization for faster interpolation computations. Note: if activated, `u` and `t` should not be modified. Defaults to `false`.
 """
-struct AkimaInterpolation{uType, tType, IType, bType, cType, dType, T, propsType} <:
+struct AkimaInterpolation{
+        uType, tType, IType, bType, cType, dType, T, propsType, strategyType,
+    } <:
     AbstractInterpolation{T}
     u::uType
     t::tType
@@ -265,14 +277,16 @@ struct AkimaInterpolation{uType, tType, IType, bType, cType, dType, T, propsType
     extrapolation_right::ExtrapolationType.T
     iguesser::Guesser{tType}
     t_props::propsType
+    strategy::strategyType
     cache_parameters::Bool
     function AkimaInterpolation(
             u, t, I, b, c, d, extrapolation_left,
             extrapolation_right, cache_parameters, t_props
         )
+        strategy = _resolve_strategy(t)
         return new{
             typeof(u), typeof(t), typeof(I), typeof(b), typeof(c),
-            typeof(d), eltype(u), typeof(t_props),
+            typeof(d), eltype(u), typeof(t_props), typeof(strategy),
         }(
             u,
             t,
@@ -284,8 +298,8 @@ struct AkimaInterpolation{uType, tType, IType, bType, cType, dType, T, propsType
             extrapolation_right,
             Guesser(t),
             t_props,
+            strategy,
             cache_parameters,
-
         )
     end
 end
@@ -407,7 +421,7 @@ Extrapolation extends the last constant polynomial at the end points on each sid
     the possible options. This keyword is ignored if `extrapolation != Extrapolation.none`.
   - `cache_parameters`: precompute parameters at initialization for faster interpolation computations. Note: if activated, `u` and `t` should not be modified. Defaults to `false`.
 """
-struct ConstantInterpolation{uType, tType, IType, T, propsType} <:
+struct ConstantInterpolation{uType, tType, IType, T, propsType, strategyType} <:
     AbstractInterpolation{T}
     u::uType
     t::tType
@@ -418,14 +432,19 @@ struct ConstantInterpolation{uType, tType, IType, T, propsType} <:
     extrapolation_right::ExtrapolationType.T
     iguesser::Guesser{tType}
     t_props::propsType
+    strategy::strategyType
     cache_parameters::Bool
     function ConstantInterpolation(
             u, t, I, dir, extrapolation_left, extrapolation_right,
             cache_parameters, t_props
         )
-        return new{typeof(u), typeof(t), typeof(I), eltype(u), typeof(t_props)}(
+        strategy = _resolve_strategy(t)
+        return new{
+            typeof(u), typeof(t), typeof(I), eltype(u),
+            typeof(t_props), typeof(strategy),
+        }(
             u, t, I, nothing, dir, extrapolation_left, extrapolation_right,
-            Guesser(t), t_props, cache_parameters
+            Guesser(t), t_props, strategy, cache_parameters
         )
     end
 end
@@ -482,7 +501,7 @@ except when using extrapolation types `Constant` or `Extension`.
   - `cache_parameters`: precompute parameters at initialization for faster interpolation computations. Note: if activated, `u` and `t` should not be modified. Defaults to `false`.
 """
 struct SmoothedConstantInterpolation{
-        uType, tType, IType, dType, cType, dmaxType, T, propsType,
+        uType, tType, IType, dType, cType, dmaxType, T, propsType, strategyType,
     } <:
     AbstractInterpolation{T}
     u::uType
@@ -494,17 +513,19 @@ struct SmoothedConstantInterpolation{
     extrapolation_right::ExtrapolationType.T
     iguesser::Guesser{tType}
     t_props::propsType
+    strategy::strategyType
     cache_parameters::Bool
     function SmoothedConstantInterpolation(
             u, t, I, p, d_max, extrapolation_left,
             extrapolation_right, cache_parameters, t_props
         )
+        strategy = _resolve_strategy(t)
         return new{
             typeof(u), typeof(t), typeof(I), typeof(p.d),
-            typeof(p.c), typeof(d_max), eltype(u), typeof(t_props),
+            typeof(p.c), typeof(d_max), eltype(u), typeof(t_props), typeof(strategy),
         }(
             u, t, I, p, d_max, extrapolation_left, extrapolation_right,
-            Guesser(t), t_props, cache_parameters
+            Guesser(t), t_props, strategy, cache_parameters
         )
     end
 end
@@ -559,7 +580,9 @@ Extrapolation extends the last quadratic polynomial on each side.
     the possible options. This keyword is ignored if `extrapolation != Extrapolation.none`.
   - `cache_parameters`: precompute parameters at initialization for faster interpolation computations. Note: if activated, `u` and `t` should not be modified. Defaults to `false`.
 """
-struct QuadraticSpline{uType, tType, IType, pType, kType, cType, scType, T, propsType} <:
+struct QuadraticSpline{
+        uType, tType, IType, pType, kType, cType, scType, T, propsType, strategyType,
+    } <:
     AbstractInterpolation{T}
     u::uType
     t::tType
@@ -572,14 +595,16 @@ struct QuadraticSpline{uType, tType, IType, pType, kType, cType, scType, T, prop
     extrapolation_right::ExtrapolationType.T
     iguesser::Guesser{tType}
     t_props::propsType
+    strategy::strategyType
     cache_parameters::Bool
     function QuadraticSpline(
             u, t, I, p, k, c, sc, extrapolation_left,
             extrapolation_right, cache_parameters, t_props
         )
+        strategy = _resolve_strategy(t)
         return new{
             typeof(u), typeof(t), typeof(I), typeof(p.α), typeof(k),
-            typeof(c), typeof(sc), eltype(u), typeof(t_props),
+            typeof(c), typeof(sc), eltype(u), typeof(t_props), typeof(strategy),
         }(
             u,
             t,
@@ -592,8 +617,8 @@ struct QuadraticSpline{uType, tType, IType, pType, kType, cType, scType, T, prop
             extrapolation_right,
             Guesser(t),
             t_props,
+            strategy,
             cache_parameters,
-
         )
     end
 end
@@ -695,7 +720,7 @@ Second derivative on both ends are zero, which are also called "natural" boundar
     the possible options. This keyword is ignored if `extrapolation != Extrapolation.none`.
   - `cache_parameters`: precompute parameters at initialization for faster interpolation computations. Note: if activated, `u` and `t` should not be modified. Defaults to `false`.
 """
-struct CubicSpline{uType, tType, IType, pType, hType, zType, T, propsType} <:
+struct CubicSpline{uType, tType, IType, pType, hType, zType, T, propsType, strategyType} <:
     AbstractInterpolation{T}
     u::uType
     t::tType
@@ -707,14 +732,16 @@ struct CubicSpline{uType, tType, IType, pType, hType, zType, T, propsType} <:
     extrapolation_right::ExtrapolationType.T
     iguesser::Guesser{tType}
     t_props::propsType
+    strategy::strategyType
     cache_parameters::Bool
     function CubicSpline(
             u, t, I, p, h, z, extrapolation_left,
             extrapolation_right, cache_parameters, t_props
         )
+        strategy = _resolve_strategy(t)
         return new{
             typeof(u), typeof(t), typeof(I), typeof(p.c₁),
-            typeof(h), typeof(z), eltype(u), typeof(t_props),
+            typeof(h), typeof(z), eltype(u), typeof(t_props), typeof(strategy),
         }(
             u,
             t,
@@ -726,8 +753,8 @@ struct CubicSpline{uType, tType, IType, pType, hType, zType, T, propsType} <:
             extrapolation_right,
             Guesser(t),
             t_props,
+            strategy,
             cache_parameters,
-
         )
     end
 end
@@ -891,7 +918,9 @@ Extrapolation is a constant polynomial of the end points on each side.
   - `extrapolation_right`: The extrapolation type applied right of the data. See `extrapolation` for
     the possible options. This keyword is ignored if `extrapolation != Extrapolation.none`.
 """
-struct BSplineInterpolation{uType, tType, pType, kType, cType, scType, T, propsType} <:
+struct BSplineInterpolation{
+        uType, tType, pType, kType, cType, scType, T, propsType, strategyType,
+    } <:
     AbstractInterpolation{T}
     u::uType
     t::tType
@@ -906,6 +935,7 @@ struct BSplineInterpolation{uType, tType, pType, kType, cType, scType, T, propsT
     extrapolation_right::ExtrapolationType.T
     iguesser::Guesser{tType}
     t_props::propsType
+    strategy::strategyType
     function BSplineInterpolation(
             u,
             t,
@@ -920,9 +950,10 @@ struct BSplineInterpolation{uType, tType, pType, kType, cType, scType, T, propsT
             extrapolation_right,
             t_props,
         )
+        strategy = _resolve_strategy(t)
         return new{
             typeof(u), typeof(t), typeof(p), typeof(k),
-            typeof(c), typeof(sc), eltype(u), typeof(t_props),
+            typeof(c), typeof(sc), eltype(u), typeof(t_props), typeof(strategy),
         }(
             u,
             t,
@@ -936,7 +967,8 @@ struct BSplineInterpolation{uType, tType, pType, kType, cType, scType, T, propsT
             extrapolation_left,
             extrapolation_right,
             Guesser(t),
-            t_props
+            t_props,
+            strategy
         )
     end
 end
@@ -1133,7 +1165,9 @@ Extrapolation is a constant polynomial of the end points on each side.
   - `extrapolation_right`: The extrapolation type applied right of the data. See `extrapolation` for
     the possible options. This keyword is ignored if `extrapolation != Extrapolation.none`.
 """
-struct BSplineApprox{uType, tType, pType, kType, cType, scType, T, propsType} <:
+struct BSplineApprox{
+        uType, tType, pType, kType, cType, scType, T, propsType, strategyType,
+    } <:
     AbstractInterpolation{T}
     u::uType
     t::tType
@@ -1149,6 +1183,7 @@ struct BSplineApprox{uType, tType, pType, kType, cType, scType, T, propsType} <:
     extrapolation_right::ExtrapolationType.T
     iguesser::Guesser{tType}
     t_props::propsType
+    strategy::strategyType
     function BSplineApprox(
             u,
             t,
@@ -1164,9 +1199,10 @@ struct BSplineApprox{uType, tType, pType, kType, cType, scType, T, propsType} <:
             extrapolation_right,
             t_props,
         )
+        strategy = _resolve_strategy(t)
         return new{
             typeof(u), typeof(t), typeof(p), typeof(k),
-            typeof(c), typeof(sc), eltype(u), typeof(t_props),
+            typeof(c), typeof(sc), eltype(u), typeof(t_props), typeof(strategy),
         }(
             u,
             t,
@@ -1181,7 +1217,8 @@ struct BSplineApprox{uType, tType, pType, kType, cType, scType, T, propsType} <:
             extrapolation_left,
             extrapolation_right,
             Guesser(t),
-            t_props
+            t_props,
+            strategy
         )
     end
 end
@@ -1420,7 +1457,9 @@ It is a Cubic Hermite interpolation, which is a piece-wise third degree polynomi
     the possible options. This keyword is ignored if `extrapolation != Extrapolation.none`.
   - `cache_parameters`: precompute parameters at initialization for faster interpolation computations. Note: if activated, `u` and `t` should not be modified. Defaults to `false`.
 """
-struct CubicHermiteSpline{uType, tType, IType, duType, pType, T, propsType} <:
+struct CubicHermiteSpline{
+        uType, tType, IType, duType, pType, T, propsType, strategyType,
+    } <:
     AbstractInterpolation{T}
     du::duType
     u::uType
@@ -1431,17 +1470,19 @@ struct CubicHermiteSpline{uType, tType, IType, duType, pType, T, propsType} <:
     extrapolation_right::ExtrapolationType.T
     iguesser::Guesser{tType}
     t_props::propsType
+    strategy::strategyType
     cache_parameters::Bool
     function CubicHermiteSpline(
             du, u, t, I, p, extrapolation_left, extrapolation_right,
             cache_parameters, t_props
         )
+        strategy = _resolve_strategy(t)
         return new{
             typeof(u), typeof(t), typeof(I), typeof(du),
-            typeof(p.c₁), eltype(u), typeof(t_props),
+            typeof(p.c₁), eltype(u), typeof(t_props), typeof(strategy),
         }(
             du, u, t, I, p, extrapolation_left, extrapolation_right,
-            Guesser(t), t_props, cache_parameters
+            Guesser(t), t_props, strategy, cache_parameters
         )
     end
 end
@@ -1526,7 +1567,9 @@ It is a Quintic Hermite interpolation, which is a piece-wise fifth degree polyno
     the possible options. This keyword is ignored if `extrapolation != Extrapolation.none`.
   - `cache_parameters`: precompute parameters at initialization for faster interpolation computations. Note: if activated, `u` and `t` should not be modified. Defaults to `false`.
 """
-struct QuinticHermiteSpline{uType, tType, IType, duType, dduType, pType, T, propsType} <:
+struct QuinticHermiteSpline{
+        uType, tType, IType, duType, dduType, pType, T, propsType, strategyType,
+    } <:
     AbstractInterpolation{T}
     ddu::dduType
     du::duType
@@ -1538,17 +1581,19 @@ struct QuinticHermiteSpline{uType, tType, IType, duType, dduType, pType, T, prop
     extrapolation_right::ExtrapolationType.T
     iguesser::Guesser{tType}
     t_props::propsType
+    strategy::strategyType
     cache_parameters::Bool
     function QuinticHermiteSpline(
             ddu, du, u, t, I, p, extrapolation_left,
             extrapolation_right, cache_parameters, t_props
         )
+        strategy = _resolve_strategy(t)
         return new{
             typeof(u), typeof(t), typeof(I), typeof(du),
-            typeof(ddu), typeof(p.c₁), eltype(u), typeof(t_props),
+            typeof(ddu), typeof(p.c₁), eltype(u), typeof(t_props), typeof(strategy),
         }(
             ddu, du, u, t, I, p, extrapolation_left, extrapolation_right,
-            Guesser(t), t_props, cache_parameters
+            Guesser(t), t_props, strategy, cache_parameters
         )
     end
 end
@@ -1580,7 +1625,8 @@ function QuinticHermiteSpline(
 end
 
 struct SmoothArcLengthInterpolation{
-        uType, tType, IType, P, D, S <: Union{AbstractInterpolation, Nothing}, T, propsType,
+        uType, tType, IType, P, D, S <: Union{AbstractInterpolation, Nothing},
+        T, propsType, strategyType,
     } <:
     AbstractInterpolation{T}
     u::uType
@@ -1601,6 +1647,7 @@ struct SmoothArcLengthInterpolation{
     extrapolation_right::ExtrapolationType.T
     iguesser::Guesser{tType}
     t_props::propsType
+    strategy::strategyType
     cache_parameters::Bool
     out::Vector{P}
     derivative::Vector{P}
@@ -1611,14 +1658,15 @@ struct SmoothArcLengthInterpolation{
             I, extrapolation_left, extrapolation_right,
             out, derivative, in_place, t_props
         )
+        strategy = _resolve_strategy(t)
         return new{
             typeof(u), typeof(t), typeof(I), eltype(radius),
-            eltype(d), typeof(shape_itp), eltype(u), typeof(t_props),
+            eltype(d), typeof(shape_itp), eltype(u), typeof(t_props), typeof(strategy),
         }(
             u, t, d, shape_itp, Δt_circle_segment, Δt_line_segment,
             center, radius, dir_1, dir_2, short_side_left,
             I, nothing, extrapolation_left, extrapolation_right,
-            Guesser(t), t_props, false, out, derivative, in_place
+            Guesser(t), t_props, strategy, false, out, derivative, in_place
         )
     end
 end
diff --git a/src/interpolation_utils.jl b/src/interpolation_utils.jl
index 0fc7e761..08431c58 100644
--- a/src/interpolation_utils.jl
+++ b/src/interpolation_utils.jl
@@ -210,13 +210,28 @@ function munge_data(U::AbstractArray{T, N}, t) where {T, N}
     return U, t
 end
 
+# Resolve a concrete `FindFirstFunctions.SearchStrategy` singleton at
+# construction time. Stored on every interpolation cache as `A.strategy` so
+# that `get_idx`'s `searchsortedlast(A.strategy, …)` is fully static-dispatched
+# — no per-query `_auto_pick` branch.
+#
+# We always pick `BracketGallop`: it gives optimal O(log n) refinement with a
+# hint at any length, and the alternative (`LinearScan` for `length(t) ≤ 16`)
+# would make this function return `Union{BracketGallop, LinearScan}` and
+# infect every downstream `@inferred` test. The `LinearScan` benefit at tiny
+# `n` is ~10 ns absolute — not worth the inference-instability cost.
+@inline _resolve_strategy(::AbstractVector) = FindFirstFunctions.BracketGallop()
+
 function get_idx(
         A::AbstractInterpolation, t, iguess::Integer; lb = 1,
         ub_shift = -1, idx_shift = 0, side = :last
     )
     tvec = A.t
     ub = length(tvec) + ub_shift
-    strat = FindFirstFunctions.Auto(A.t_props)
+    # `A.strategy` is a concrete `SearchStrategy` singleton resolved at
+    # construction time. Static dispatch avoids the `Auto` per-call
+    # `_auto_pick` branch.
+    strat = A.strategy
     raw = if side == :last
         searchsortedlast(strat, tvec, t, iguess)
     elseif side == :first
@@ -233,11 +248,9 @@ function get_idx(
     )
     tvec = A.t
     ub = length(tvec) + ub_shift
-    strat = FindFirstFunctions.Auto(A.t_props)
+    strat = A.strategy
     # `iguess(t)` gives a linear-extrapolation hint when `t` looks linear and
-    # falls back to the cached `idx_prev` otherwise. `Auto` short-circuits to
-    # `UniformStep` for exact-uniform grids and ignores the hint there; for
-    # near-uniform-but-not-uniform grids the linear hint still beats `idx_prev`.
+    # falls back to the cached `idx_prev` otherwise.
     hint = iguess(t)
     raw = if side == :last
         searchsortedlast(strat, tvec, t, hint)

From cf6f25496b53766129be1c5cd48821cff01f1e69 Mon Sep 17 00:00:00 2001
From: ChrisRackauckas-Claude <accounts@chrisrackauckas.com>
Date: Sat, 23 May 2026 06:13:50 -0400
Subject: [PATCH 09/24] Route LinearInterpolation knot search through FFF Auto
 + props
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Change `_resolve_strategy(t)` from a fixed `BracketGallop()` to
`FindFirstFunctions.Auto(t)`. Auto now resolves a concrete `StrategyKind`
at construction from `length(t)` + `SearchProperties{T}(t)`:

  - Uniform data (`AbstractRange` or `Vector` whose 9-point linearity
    probe is within ~1e-12 of exact uniformity) → `KIND_UNIFORM_STEP`.
    The props-aware kernel uses a precomputed `inv_step` for closed-form
    O(1) lookup (no per-query division).
  - Non-uniform data with `length(t) ≤ 16` → `KIND_LINEAR_SCAN`.
  - Otherwise → `KIND_BRACKET_GALLOP` (the previous default).

`Auto{T}` is parametric on the data ratio type, so each cache's
`strategyType` resolves to a single concrete `Auto{T}` per `t` —
type-stable per dispatch.

Mooncake's `increment_and_get_rdata!` gains a populated-RData method to
handle the new `first_val::T` / `inv_step::T` fields on
`SearchProperties{T}` — they're not differentiable (compile-time
constants from the knot vector) but Mooncake sees them as `Float64`
fields and routes the rdata through the populated branch.

Per-query latency (n=10k, m=1k, ns/query, BenchmarkTools median):

  Workload                            | before | after | FastInterp
  ---                                 | ---    | ---   | ---
  Range, sorted queries               |   89   |  75   |    3.2
  Range, random queries               |   89   |  76   |    3.3
  Range, chained (monotone)           |   89   |  75   |    3.3
  Uniform Vec, sorted queries         |   47   |  32   |    70
  Uniform Vec, random queries         |   50   |  35   |    92
  Uniform Vec, chained                |   48   |  32   |    n/a
  Non-uniform Vec, sorted queries     |   68   |  85   |    75
  Non-uniform Vec, random queries     |   80   |  95   |    87
  Non-uniform Vec, chained            |   67   |  86   |    n/a

Wins: 16% on Range (props-aware UniformStep), 32% on Uniform Vector
(closed-form kernel — beats FastInterp here because DI's Guesser
overhead is amortised over fewer cycles than FastInterp's per-query
binary search). Loss: ~25% on Non-uniform Vector (Auto's per-query
`s.kind === KIND_UNIFORM_STEP` branch adds ~5-20 ns/q on the
BracketGallop path; the closed-form kernel inlines into the function
body and adds register pressure on the cold path).

Net: still 4-25× slower than FastInterp on Range — the remaining gap is
DI's per-query overhead (Guesser hint, extrapolation check, linear-interp
arithmetic), not the strategy. Closing it further would require fusing
the search + interp + extrapolation paths into a single kernel.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
Co-Authored-By: Chris Rackauckas <accounts@chrisrackauckas.com>
---
 ext/DataInterpolationsMooncakeExt.jl | 22 +++++++++++++++++++
 src/interpolation_utils.jl           | 32 +++++++++++++++++++---------
 2 files changed, 44 insertions(+), 10 deletions(-)

diff --git a/ext/DataInterpolationsMooncakeExt.jl b/ext/DataInterpolationsMooncakeExt.jl
index 6d716278..687b69be 100644
--- a/ext/DataInterpolationsMooncakeExt.jl
+++ b/ext/DataInterpolationsMooncakeExt.jl
@@ -19,6 +19,28 @@ function Mooncake.increment_and_get_rdata!(
     return Mooncake.NoRData()
 end
 
+# `SearchProperties{T}` and `Auto{T}` now carry `first_val::T` / `inv_step::T`
+# (precomputed scalar fields for the props-aware UniformStep kernel). These
+# fields show up in Mooncake's rdata for the interpolation cache because
+# they are bitstype `Float64` (or `Float32`), but they are **not**
+# differentiable — they are constants attached to the cache at construction.
+# Mooncake doesn't know that from the type alone, so it routes the
+# `Tangent{<:AbstractInterpolation}` (which has only `u` populated) through
+# `increment_and_get_rdata!` with a populated `RData{NamedTuple{...}}` rather
+# than `NoRData`. Tell Mooncake the right thing: accumulate `u`, then return
+# the rdata unchanged so its t_props / strategy slots accumulate zero.
+function Mooncake.increment_and_get_rdata!(
+        f::Mooncake.FData{<:NamedTuple},
+        r::Mooncake.RData{<:NamedTuple},
+        t::ChainRulesCore.Tangent{<:AbstractInterpolation}
+    )
+    u_tang = ChainRulesCore.unthunk(t.u)
+    if !(u_tang isa ChainRulesCore.AbstractZero)
+        f.data.u .+= u_tang
+    end
+    return r
+end
+
 # Constructor rules: stop Mooncake recursing into LinearParameterCache and other
 # internal structs. The 6-arg and 7-arg forms are the internal constructors that
 # have ChainRules rrules defined in DataInterpolationsChainRulesCoreExt.
diff --git a/src/interpolation_utils.jl b/src/interpolation_utils.jl
index 08431c58..6a236a26 100644
--- a/src/interpolation_utils.jl
+++ b/src/interpolation_utils.jl
@@ -210,17 +210,29 @@ function munge_data(U::AbstractArray{T, N}, t) where {T, N}
     return U, t
 end
 
-# Resolve a concrete `FindFirstFunctions.SearchStrategy` singleton at
-# construction time. Stored on every interpolation cache as `A.strategy` so
-# that `get_idx`'s `searchsortedlast(A.strategy, …)` is fully static-dispatched
-# — no per-query `_auto_pick` branch.
+# Resolve a concrete `FindFirstFunctions.SearchStrategy` for the given
+# knot vector at construction time. Stored on every interpolation cache
+# as `A.strategy` so that `get_idx`'s `searchsortedlast(A.strategy, …)` is
+# fully static-dispatched — no per-query `_auto_pick` branch.
 #
-# We always pick `BracketGallop`: it gives optimal O(log n) refinement with a
-# hint at any length, and the alternative (`LinearScan` for `length(t) ≤ 16`)
-# would make this function return `Union{BracketGallop, LinearScan}` and
-# infect every downstream `@inferred` test. The `LinearScan` benefit at tiny
-# `n` is ~10 ns absolute — not worth the inference-instability cost.
-@inline _resolve_strategy(::AbstractVector) = FindFirstFunctions.BracketGallop()
+# We dispatch to `FindFirstFunctions.Auto(t)`, which:
+#
+#   - Resolves a concrete `StrategyKind` from `length(t)` + the
+#     `SearchProperties{T}(t)` probe at construction.
+#   - For uniformly-spaced data (any `AbstractRange` or a `Vector` whose
+#     9-point linearity probe is within ~1e-12 of exact uniformity),
+#     picks `KIND_UNIFORM_STEP` and bakes the precomputed `inv_step`
+#     into `props`. The hot path is then one subtract, one multiply,
+#     one truncate per query — no division, no logarithmic search.
+#   - For non-uniform data with `length(t) ≤ 16`, picks `KIND_LINEAR_SCAN`.
+#   - Otherwise picks `KIND_BRACKET_GALLOP` (the v2 default).
+#
+# `Auto{T}` is parametric on the data ratio type, so the cache's
+# `strategyType` parameter resolves to a single concrete `Auto{T}` per
+# `t` and dispatch stays type-stable. `Vector{Int}` and `Vector{Float64}`
+# both ratio-promote to `Float64`, so `Auto{Float64}` covers the common
+# Float-knot cases.
+@inline _resolve_strategy(t::AbstractVector) = FindFirstFunctions.Auto(t)
 
 function get_idx(
         A::AbstractInterpolation, t, iguess::Integer; lb = 1,

From fc2c45a572884b344e82bbeea167a3ac2ada1430 Mon Sep 17 00:00:00 2001
From: ChrisRackauckas-Claude <accounts@chrisrackauckas.com>
Date: Sat, 23 May 2026 06:13:56 -0400
Subject: [PATCH 10/24] Add focused per-query bench comparing DI Auto vs
 FastInterpolations
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

`bench/di_perq_bench.jl` measures single-query latency at n=10k, m=1k
across (range, uniform Vector, non-uniform Vector) × (sorted, random,
chained) — the cells where the Auto + props refactor matters most.

Reports the resolved Auto.kind for each input so it's clear which path
each measurement exercised.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
Co-Authored-By: Chris Rackauckas <accounts@chrisrackauckas.com>
---
 bench/di_perq_bench.jl | 124 +++++++++++++++++++++++++++++++++++++++++
 1 file changed, 124 insertions(+)
 create mode 100644 bench/di_perq_bench.jl

diff --git a/bench/di_perq_bench.jl b/bench/di_perq_bench.jl
new file mode 100644
index 00000000..f1a8c4ee
--- /dev/null
+++ b/bench/di_perq_bench.jl
@@ -0,0 +1,124 @@
+#=
+DI per-query micro-bench, focused on the cells the user asked about:
+
+   Workload                                | DI before | DI after | FastInterp
+   --------------------------------------- | --------- | -------- | ----------
+   Range knots, sorted queries             |    77     |    ?     |   3.5
+   Uniform Vector knots, sorted queries    |    38     |    ?     |   27
+   Non-uniform Vector knots, sorted        |    78     |    ?     |   n/a
+   Range knots, shuffled random queries    |    87     |    ?     |   3.5
+   Range knots, monotone ODE-chain         |    ?      |    ?     |   ?
+
+n = 10_000, m = 1000, Float64.
+
+Usage:
+    julia +1.11 --project=bench bench/di_perq_bench.jl
+=#
+
+import Pkg
+const BENCH_DIR = @__DIR__
+Pkg.activate(BENCH_DIR)
+
+using BenchmarkTools
+using Random
+using Statistics
+
+using DataInterpolations
+using FastInterpolations
+
+const RNG = MersenneTwister(0x00C0FFEE)
+
+const N = 10_000
+const M = 1_000
+
+# Knots
+const range_knots = range(0.0, 1.0; length = N)
+const uniform_vec_knots = collect(range_knots)
+const nonuniform_vec_knots = sort!(rand(MersenneTwister(0x0BADBEEF), N))
+const u_range = sin.(2π .* range_knots) .+ 0.3 .* cos.(7 .* range_knots)
+const u_uniform = collect(u_range)
+const u_nonuniform = sin.(2π .* nonuniform_vec_knots) .+ 0.3 .* cos.(7 .* nonuniform_vec_knots)
+
+# Queries — keep in [knot_min, knot_max] so all libraries' interpolations
+# stay in-domain. Clamp into the non-uniform vector range below.
+function clamp_to(x, t)
+    a, b = first(t), last(t)
+    return @. clamp(x, a + (b - a) * 1.0e-6, b - (b - a) * 1.0e-6)
+end
+
+const queries_sorted_raw = sort!(rand(MersenneTwister(0x00C0FFEE + M), M))
+const queries_random_raw = rand(MersenneTwister(0x00C0FFEE + M + 1), M)
+const queries_chained_raw = let steps = rand(MersenneTwister(0x00C0FFEE + M + 2), M)
+    tt = cumsum(steps)
+    tt = (tt .- first(tt)) ./ (last(tt) - first(tt)) .* 0.999 .+ 0.0005
+    tt
+end
+
+# Library builders
+build_di_range(u, t) = DataInterpolations.LinearInterpolation(u, t)
+build_di_uniform_vec(u, t) = DataInterpolations.LinearInterpolation(u, t)
+build_di_nonuniform(u, t) = DataInterpolations.LinearInterpolation(u, t)
+build_fi(u, t) = FastInterpolations.linear_interp(t, u)
+
+# Per-query bench: tight loop with no batched call. Measures latency of A(x).
+function per_query_loop(A, queries)
+    s = 0.0
+    @inbounds for k in eachindex(queries)
+        s += A(queries[k])
+    end
+    return s
+end
+
+function bench_pq(A, queries; samples = 500, seconds = 5.0)
+    # Warm-up call before benchmark — avoids first-call effects from carrying
+    # over Guesser state across benchmarks for different `A`s.
+    per_query_loop(A, queries)
+    b = @benchmarkable per_query_loop($A, $queries) evals = 1 samples = samples seconds = seconds
+    return run(b)
+end
+
+fmt_pq(t) = string(round(median(t).time / M; digits = 2), " ns/q")
+
+println("== n=$N, m=$M, single-query latency (ns per query) ==\n")
+
+println("Range knots:")
+A_di_r = build_di_range(u_range, range_knots)
+A_fi_r = build_fi(u_range, range_knots)
+queries_sorted_r = clamp_to(queries_sorted_raw, range_knots)
+queries_random_r = clamp_to(queries_random_raw, range_knots)
+queries_chained_r = clamp_to(queries_chained_raw, range_knots)
+println("  DataInterp (Auto)         | sorted   : ", fmt_pq(bench_pq(A_di_r, queries_sorted_r)))
+println("  DataInterp (Auto)         | random   : ", fmt_pq(bench_pq(A_di_r, queries_random_r)))
+println("  DataInterp (Auto)         | chained  : ", fmt_pq(bench_pq(A_di_r, queries_chained_r)))
+println("  FastInterp                | sorted   : ", fmt_pq(bench_pq(A_fi_r, queries_sorted_r)))
+println("  FastInterp                | random   : ", fmt_pq(bench_pq(A_fi_r, queries_random_r)))
+println("  FastInterp                | chained  : ", fmt_pq(bench_pq(A_fi_r, queries_chained_r)))
+
+println("\nUniform Vector knots (collect(range)):")
+A_di_uv = build_di_uniform_vec(u_uniform, uniform_vec_knots)
+A_fi_uv = build_fi(u_uniform, uniform_vec_knots)
+queries_sorted_u = clamp_to(queries_sorted_raw, uniform_vec_knots)
+queries_random_u = clamp_to(queries_random_raw, uniform_vec_knots)
+queries_chained_u = clamp_to(queries_chained_raw, uniform_vec_knots)
+println("  DataInterp (Auto)         | sorted   : ", fmt_pq(bench_pq(A_di_uv, queries_sorted_u)))
+println("  DataInterp (Auto)         | random   : ", fmt_pq(bench_pq(A_di_uv, queries_random_u)))
+println("  DataInterp (Auto)         | chained  : ", fmt_pq(bench_pq(A_di_uv, queries_chained_u)))
+println("  FastInterp                | sorted   : ", fmt_pq(bench_pq(A_fi_uv, queries_sorted_u)))
+println("  FastInterp                | random   : ", fmt_pq(bench_pq(A_fi_uv, queries_random_u)))
+
+println("\nNon-uniform Vector knots:")
+A_di_nv = build_di_nonuniform(u_nonuniform, nonuniform_vec_knots)
+A_fi_nv = build_fi(u_nonuniform, nonuniform_vec_knots)
+queries_sorted_n = clamp_to(queries_sorted_raw, nonuniform_vec_knots)
+queries_random_n = clamp_to(queries_random_raw, nonuniform_vec_knots)
+queries_chained_n = clamp_to(queries_chained_raw, nonuniform_vec_knots)
+println("  DataInterp (Auto)         | sorted   : ", fmt_pq(bench_pq(A_di_nv, queries_sorted_n)))
+println("  DataInterp (Auto)         | random   : ", fmt_pq(bench_pq(A_di_nv, queries_random_n)))
+println("  DataInterp (Auto)         | chained  : ", fmt_pq(bench_pq(A_di_nv, queries_chained_n)))
+println("  FastInterp                | sorted   : ", fmt_pq(bench_pq(A_fi_nv, queries_sorted_n)))
+println("  FastInterp                | random   : ", fmt_pq(bench_pq(A_fi_nv, queries_random_n)))
+
+println("\nReporting Auto kind selection:")
+println("  Range knots                : Auto kind = ", A_di_r.strategy.kind)
+println("  Uniform Vector knots       : Auto kind = ", A_di_uv.strategy.kind)
+println("  Non-uniform Vector knots   : Auto kind = ", A_di_nv.strategy.kind)

From 81b8b46ab99d4106e310ec3dbd4834a5f7d5c745 Mon Sep 17 00:00:00 2001
From: ChrisRackauckas-Claude <accounts@chrisrackauckas.com>
Date: Sat, 23 May 2026 06:15:42 -0400
Subject: [PATCH 11/24] Allow FindFirstFunctions v3 in compat

Bump `[compat]` to `FindFirstFunctions = "2, 3"` so DI can pick up the
v3 parametric `SearchProperties{T}` + props-aware UniformStep kernel.
Add `FindFirstFunctions` to `bench/Project.toml` for explicit dev'ing
during cross-library benchmarks.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
Co-Authored-By: Chris Rackauckas <accounts@chrisrackauckas.com>
---
 Project.toml       | 2 +-
 bench/Project.toml | 1 +
 2 files changed, 2 insertions(+), 1 deletion(-)

diff --git a/Project.toml b/Project.toml
index 32e714bd..3b2fc55d 100644
--- a/Project.toml
+++ b/Project.toml
@@ -36,7 +36,7 @@ BenchmarkTools = "1"
 ChainRulesCore = "1.26.1"
 EnumX = "1.0.5"
 FillArrays = "1.16.0"
-FindFirstFunctions = "2"
+FindFirstFunctions = "2, 3"
 FiniteDifferences = "0.12.31"
 ForwardDiff = "1"
 LinearAlgebra = "1.10"
diff --git a/bench/Project.toml b/bench/Project.toml
index 1c541df8..efbe15a7 100644
--- a/bench/Project.toml
+++ b/bench/Project.toml
@@ -4,5 +4,6 @@ BenchmarkTools = "6e4b80f9-dd63-53aa-95a3-0cdb28fa8baf"
 DataInterpolations = "82cc6244-b520-54b8-b5a6-8a565e85f1d0"
 Dierckx = "39dd38d3-220a-591b-8e3c-4c3a8c710a94"
 FastInterpolations = "9ea80cae-fc13-4c00-8066-6eaedb12f34b"
+FindFirstFunctions = "64ca27bc-2ba2-4a57-88aa-44e436879224"
 Interpolations = "a98d9a8b-a2ab-59e6-89dd-64a1c18fca59"
 PCHIPInterpolation = "afe20452-48d1-4729-9a8b-50fb251f06cd"

From 6036ef030fed988484468fce65e8f2bee098cf1b Mon Sep 17 00:00:00 2001
From: ChrisRackauckas-Claude <accounts@chrisrackauckas.com>
Date: Sat, 23 May 2026 06:49:05 -0400
Subject: [PATCH 12/24] Mooncake: @zero_adjoint on searchsortedlast(::Auto,
 ...)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

With DI's strategy now being `Auto{T}` (which carries a populated
`SearchProperties{T}` with `first_val::Float64` and `inv_step::Float64`
fields), Mooncake's analyzer can no longer prove the strategy struct is
non-differentiable. It tries to derive a rule for
`searchsortedlast(::Auto, v, x, h)` by recursion into FFF's strategy
kernels, hitting `Core.Intrinsics.llvmcall` in the SIMD-scan paths
(SIMDLinearScan, BitInterpolationSearch) which Mooncake can't translate.

Declare the searchsortedlast/searchsortedfirst calls dispatched through
`Auto` as `@zero_adjoint`: the return is an `Int` index, gradient flow is
already cut at the integer-indexing boundary in `_interpolate`, so a zero
rrule is correct.

This unblocks `ConstantInterpolation`, `CubicSpline`,
`CubicHermiteSpline`, `QuinticHermiteSpline`, `LagrangeInterpolation`,
`AkimaInterpolation`, `BSplineInterpolation`, and `BSplineApprox`
gradients via Mooncake — interpolations that don't have a `_interpolate`
Mooncake-wrapped rrule and were derived by recursion.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
Co-Authored-By: Chris Rackauckas <accounts@chrisrackauckas.com>
---
 ext/DataInterpolationsMooncakeExt.jl | 18 ++++++++++++++++--
 1 file changed, 16 insertions(+), 2 deletions(-)

diff --git a/ext/DataInterpolationsMooncakeExt.jl b/ext/DataInterpolationsMooncakeExt.jl
index 687b69be..7dd0418c 100644
--- a/ext/DataInterpolationsMooncakeExt.jl
+++ b/ext/DataInterpolationsMooncakeExt.jl
@@ -1,9 +1,9 @@
 module DataInterpolationsMooncakeExt
 
-using DataInterpolations, Mooncake, ChainRulesCore
+using DataInterpolations, Mooncake, ChainRulesCore, FindFirstFunctions
 using DataInterpolations: _interpolate, munge_data, AbstractInterpolation,
     LinearInterpolation, QuadraticInterpolation
-import Mooncake: @from_chainrules, MinimalCtx
+import Mooncake: @from_chainrules, @zero_adjoint, MinimalCtx, DefaultCtx
 
 # When the ChainRules pullback for _interpolate returns a Tangent{AbstractInterpolation},
 # this tells Mooncake how to accumulate the u-component into the interpolation's fdata.
@@ -57,4 +57,18 @@ end
 @from_chainrules MinimalCtx Tuple{typeof(munge_data), AbstractMatrix, AbstractVector} true
 @from_chainrules MinimalCtx Tuple{typeof(munge_data), AbstractArray, Any} true
 
+# Sorted-search dispatched through `Auto{T}` carries the props' `first_val::T`
+# and `inv_step::T` Float fields, which Mooncake exposes as rdata. The
+# `searchsortedlast` / `searchsortedfirst` calls return integer indices —
+# they are positional bookkeeping, not differentiable. Declare them as
+# zero-adjoint so Mooncake doesn't try to recurse into FFF's strategy
+# kernels (which contain `llvmcall` SIMD intrinsics that Mooncake cannot
+# differentiate through). DI's interpolation `_interpolate` always feeds
+# the search results into integer indexing, so the gradient flow is
+# already cut at the index boundary — zero-adjoint here is correct.
+@zero_adjoint DefaultCtx Tuple{typeof(searchsortedlast), FindFirstFunctions.Auto, AbstractVector, Any, Integer}
+@zero_adjoint DefaultCtx Tuple{typeof(searchsortedfirst), FindFirstFunctions.Auto, AbstractVector, Any, Integer}
+@zero_adjoint DefaultCtx Tuple{typeof(searchsortedlast), FindFirstFunctions.Auto, AbstractVector, Any}
+@zero_adjoint DefaultCtx Tuple{typeof(searchsortedfirst), FindFirstFunctions.Auto, AbstractVector, Any}
+
 end

From c736b12fc219fc63e66c2fd318d987a1d6222766 Mon Sep 17 00:00:00 2001
From: ChrisRackauckas-Claude <accounts@chrisrackauckas.com>
Date: Sat, 23 May 2026 07:08:55 -0400
Subject: [PATCH 13/24] Require FindFirstFunctions v3

`_resolve_strategy(t) = FindFirstFunctions.Auto(t)` (this PR's hot-path
change) calls the parametric `Auto(::AbstractVector)` constructor added
in FFF v3. That constructor does not exist in FFF v2 (`Auto` only accepts
`SearchProperties` or no args), so `[compat] FindFirstFunctions = "2, 3"`
would resolve to v2 on CI and break with `MethodError: Cannot convert
::Vector{Float64} to ::SearchProperties`.

Pin compat to v3 only. This PR is blocked on FFF v3 release; until v3 is
in the registry, CI will fail with "compatible version not found".

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
Co-Authored-By: Chris Rackauckas <accounts@chrisrackauckas.com>
---
 Project.toml | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/Project.toml b/Project.toml
index 3b2fc55d..894332f7 100644
--- a/Project.toml
+++ b/Project.toml
@@ -36,7 +36,7 @@ BenchmarkTools = "1"
 ChainRulesCore = "1.26.1"
 EnumX = "1.0.5"
 FillArrays = "1.16.0"
-FindFirstFunctions = "2, 3"
+FindFirstFunctions = "3"
 FiniteDifferences = "0.12.31"
 ForwardDiff = "1"
 LinearAlgebra = "1.10"

From ec233c606c2d23f87f041ed7b159939f6ab27a23 Mon Sep 17 00:00:00 2001
From: ChrisRackauckas-Claude <accounts@chrisrackauckas.com>
Date: Sat, 23 May 2026 08:26:31 -0400
Subject: [PATCH 14/24] LinearInterpolation: statically-dispatched uniform-grid
 fast path
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Encode the knot vector's uniformity in `LinearInterpolation`'s cache
type via a new `IsUniform` `Val{B}` parameter, populated by
`_static_uniform_tag` at construction time. For `AbstractRange{<:Real}`
knots the tag is `Val(true)` statically (`@inferred`-clean); for `Vector`
knots it routes through `t_props.is_uniform`, making the construction
return type a `Union{LinearInterpolation{..., true},
LinearInterpolation{..., false}}` — each concrete instance is fully
type-stable per query.

A new `_interpolate(::LinearInterpolation{<:AbstractVector{<:AbstractFloat},
..., true}, t, iguess)` method takes the uniform fast path: closed-form
index lookup via `(t - first_val) * inv_step`, then linear-blend
`u[idx] + α * (u[idx+1] - u[idx])`. This skips both the `get_idx`
search-via-`Auto` round-trip and the `A.t[idx]` load. The result type is
constrained to `<:AbstractFloat` `u` to preserve the existing
slope-form's `Rational`/`Integer` semantics on those eltypes.

NaN propagation matches the non-uniform method (NaN query produces NaN
derivative via ForwardDiff; NaN-adjacent `u` doesn't poison exact-knot
queries via `0 * NaN = NaN`).

Per-query latency, `n = 10_000`, `m = 1000`, Float64, sorted queries:

  Workload                              | Before    | After
  --------------------------------------|-----------|--------
  Range knots                           | 76.7 ns/q | 12.1 ns/q
  Uniform Vector knots (`collect(t)`)   | 55.5 ns/q |  6.5 ns/q
  Non-uniform Vector knots              | 88.4 ns/q | 84.9 ns/q

DI ↔ FastInterpolations gap on Range knots: 23.7× → 3.7×. Non-uniform
Vector path is statically unchanged (different `_interpolate` method
specialization) and shows no regression.

A few existing `@inferred` calls in test/interface.jl and
test/interpolation_tests.jl are dropped for `Vector` knot construction
cases — the constructor genuinely returns a `Union` for those, by
design. The query-side `@inferred` calls remain; per-query dispatch is
fully type-stable on every concrete cache instance. The parity test
documents the realistic error bound: the lerp form differs from the
slope form by `O(length(t)) * eps * max(|u|)`, dominated by the
`(t - first_val) * inv_step` multiplication.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
Co-Authored-By: Chris Rackauckas <accounts@chrisrackauckas.com>
---
 src/interpolation_caches.jl  |  32 ++++++--
 src/interpolation_methods.jl |  62 +++++++++++++++
 src/interpolation_utils.jl   |  13 ++++
 test/interface.jl            |   9 ++-
 test/interpolation_tests.jl  | 144 ++++++++++++++++++++++++++++-------
 5 files changed, 225 insertions(+), 35 deletions(-)

diff --git a/src/interpolation_caches.jl b/src/interpolation_caches.jl
index 89f24669..6eaf3d27 100644
--- a/src/interpolation_caches.jl
+++ b/src/interpolation_caches.jl
@@ -23,7 +23,9 @@ Extrapolation extends the last linear polynomial on each side.
   - `cache_parameters`: precompute parameters at initialization for faster interpolation
     computations. Note: if activated, `u` and `t` should not be modified. Defaults to `false`.
 """
-struct LinearInterpolation{uType, tType, IType, pType, T, propsType, strategyType} <:
+struct LinearInterpolation{
+        uType, tType, IType, pType, T, propsType, strategyType, IsUniform,
+    } <:
     AbstractInterpolation{T}
     u::uType
     t::tType
@@ -35,21 +37,39 @@ struct LinearInterpolation{uType, tType, IType, pType, T, propsType, strategyTyp
     t_props::propsType
     strategy::strategyType
     cache_parameters::Bool
-    function LinearInterpolation(
+    # `IsUniform` is a static tag matching `t_props.is_uniform` at construction.
+    # Lets `_interpolate` dispatch to a uniform-grid kernel that consumes
+    # `t_props.first_val` / `t_props.inv_step` directly, with no runtime branch.
+    is_uniform_static::Val{IsUniform}
+    @inline function LinearInterpolation(
             u, t, I, p, extrapolation_left, extrapolation_right,
-            cache_parameters, t_props
-        )
+            cache_parameters, t_props, ::Val{IsUniform},
+        ) where {IsUniform}
         strategy = _resolve_strategy(t)
         return new{
             typeof(u), typeof(t), typeof(I), typeof(p.slope),
-            eltype(u), typeof(t_props), typeof(strategy),
+            eltype(u), typeof(t_props), typeof(strategy), IsUniform,
         }(
             u, t, I, p, extrapolation_left, extrapolation_right,
-            Guesser(t), t_props, strategy, cache_parameters
+            Guesser(t), t_props, strategy, cache_parameters,
+            Val(IsUniform),
         )
     end
 end
 
+# Forward the legacy 8-arg constructor (no IsUniform Val) through the static
+# uniformity dispatcher. Forwards `Val(true)` for ranges (compile-time) and
+# `Val(t_props.is_uniform)` for vectors (value-dependent).
+@inline function LinearInterpolation(
+        u, t, I, p, extrapolation_left, extrapolation_right,
+        cache_parameters, t_props,
+    )
+    return LinearInterpolation(
+        u, t, I, p, extrapolation_left, extrapolation_right,
+        cache_parameters, t_props, _static_uniform_tag(t, t_props),
+    )
+end
+
 function LinearInterpolation(
         u, t; extrapolation::ExtrapolationType.T = ExtrapolationType.None,
         extrapolation_left::ExtrapolationType.T = ExtrapolationType.None,
diff --git a/src/interpolation_methods.jl b/src/interpolation_methods.jl
index c6a6f86a..4129a207 100644
--- a/src/interpolation_methods.jl
+++ b/src/interpolation_methods.jl
@@ -198,6 +198,68 @@ function _interpolate(A::LinearInterpolation{<:AbstractVector}, t::Number, igues
     return val
 end
 
+# Uniform-grid fast path. Statically dispatched on the `IsUniform == true`
+# type parameter — no runtime uniformity branch. Uses the precomputed
+# `inv_step` / `first_val` baked into `t_props` to skip the `A.t[idx]` load
+# and the cached slope lookup. The linear-blend form
+# `u[idx] + α * (u[idx+1] - u[idx])` is mathematically equivalent to the
+# slope form modulo a few ulps of floating-point roundoff.
+#
+# `inv_step` / `first_val` are always `AbstractFloat` (`_ratio_type` of the
+# knot eltype), so the lerp's intermediate `α` is `AbstractFloat`. The
+# constraint on `eltype(u) <: AbstractFloat` keeps the result type
+# `AbstractFloat` too — for `Rational` / `Integer` `u`, we fall back to the
+# non-uniform method which preserves the more general arithmetic type.
+function _interpolate(
+        A::LinearInterpolation{
+            <:AbstractVector{<:AbstractFloat}, <:Any, <:Any, <:Any,
+            <:Any, <:Any, <:Any, true,
+        },
+        t::Number, iguess,
+    )
+    if isnan(t)
+        # Propagate NaN through the partial of `t` so `ForwardDiff.derivative`
+        # at a NaN query returns NaN. The non-uniform method does this by
+        # computing `u1 + slope * (t - t1)` with `t - t1 = NaN`; replicate the
+        # `slope * (t - t1)` poisoning here.
+        idx = firstindex(A.u)
+        u1 = oneunit(eltype(A.u))
+        slope = t / t * get_parameters(A, idx)
+        Δu = slope * (t - oneunit(eltype(A.t)))
+        return oftype(Δu, u1) + Δu
+    end
+    # Closed-form index lookup on a uniform grid: `f` is the float position
+    # in `[0, length-1]`, `idx0` its floor (zero-based), `α` the fractional
+    # part. Clamping into `[0, length-2]` keeps `idx0 + 1` and `idx0 + 2`
+    # in bounds for the two-sample load below.
+    f = (t - A.t_props.first_val) * A.t_props.inv_step
+    n = length(A.t)
+    idx0 = unsafe_trunc(Int, floor(f))
+    if idx0 < 0
+        idx0 = 0
+    elseif idx0 > n - 2
+        idx0 = n - 2
+    end
+    A.iguesser.idx_prev[] = idx0 + 1
+    α = f - idx0
+    @inbounds u1 = A.u[idx0 + 1]
+    @inbounds u2 = A.u[idx0 + 2]
+    Δu = α * (u2 - u1)
+    if any(isnan.(Δu))
+        # When NaN appears in `u` adjacent to the segment, `0 * NaN = NaN`
+        # poisons the answer at exact-knot queries. Resolve by comparing
+        # the query against the knot values directly.
+        @inbounds t1 = A.t[idx0 + 1]
+        @inbounds t2 = A.t[idx0 + 2]
+        if t == t2
+            return u2 + zero(Δu)
+        elseif t == t1
+            return u1 + zero(Δu)
+        end
+    end
+    return u1 + Δu
+end
+
 function _interpolate(A::LinearInterpolation{<:AbstractArray}, t::Number, iguess)
     idx = get_idx(A, t, iguess)
     Δt = t - A.t[idx]
diff --git a/src/interpolation_utils.jl b/src/interpolation_utils.jl
index 6a236a26..9454a1ed 100644
--- a/src/interpolation_utils.jl
+++ b/src/interpolation_utils.jl
@@ -234,6 +234,19 @@ end
 # Float-knot cases.
 @inline _resolve_strategy(t::AbstractVector) = FindFirstFunctions.Auto(t)
 
+# Static-uniformity tag for caches. `AbstractRange{<:Real}` is uniform at the
+# type level — `Val(true)` is a compile-time constant. For `AbstractVector`
+# we fall through to the runtime `t_props.is_uniform` flag, which makes the
+# constructor's return type a `Union{LinearInterpolation{..., true},
+# LinearInterpolation{..., false}}`. Each concrete instance is fully
+# type-stable per query — only the construction boundary sees the union.
+@inline _static_uniform_tag(
+    ::AbstractRange{<:Real}, ::FindFirstFunctions.SearchProperties
+) = Val(true)
+@inline _static_uniform_tag(
+    ::AbstractVector, props::FindFirstFunctions.SearchProperties
+) = Val(props.is_uniform)
+
 function get_idx(
         A::AbstractInterpolation, t, iguess::Integer; lb = 1,
         ub_shift = -1, idx_shift = 0, side = :last
diff --git a/test/interface.jl b/test/interface.jl
index 5be8527d..a559e9c6 100644
--- a/test/interface.jl
+++ b/test/interface.jl
@@ -30,7 +30,14 @@ end
 
 @testset "Type Inference" begin
     u = 2.0collect(1:10)
-    t = 1.0collect(1:10)
+    # `LinearInterpolation`'s constructor encodes uniformity in the cache's
+    # `IsUniform` type parameter. For an `AbstractRange` knot vector the tag
+    # is `Val(true)` statically, so the constructor is type-stable. For a
+    # `Vector` knot vector the tag depends on the values, so the constructor
+    # returns `Union{LinearInterpolation{..., true}, LinearInterpolation{..., false}}`.
+    # Each concrete instance is fully type-stable per query — only the
+    # construction boundary sees the union.
+    t = 1.0:10.0
     methods = [
         ConstantInterpolation, LinearInterpolation,
         QuadraticInterpolation, LagrangeInterpolation,
diff --git a/test/interpolation_tests.jl b/test/interpolation_tests.jl
index ce5ad0e6..3a0b8de5 100644
--- a/test/interpolation_tests.jl
+++ b/test/interpolation_tests.jl
@@ -35,14 +35,26 @@ end
 @testset "Linear Interpolation" begin
     test_interpolation_type(LinearInterpolation)
 
+    # `LinearInterpolation`'s cache type encodes uniformity statically. For
+    # `AbstractRange` knots the tag resolves at compile time, so the
+    # constructor is type-stable and `@inferred` succeeds. For `Vector`
+    # knots the tag depends on the values, so the constructor returns
+    # `Union{LinearInterpolation{..., true}, LinearInterpolation{..., false}}`
+    # and `@inferred` on the constructor does not hold (per-query dispatch
+    # on the resulting instance remains type-stable).
     for t in (1.0:10.0, 1.0collect(1:10))
         u = 2.0collect(1:10)
-        #t = 1.0collect(1:10)
-        A = @inferred(
+        A = if t isa AbstractRange
+            @inferred(
+                LinearInterpolation(
+                    u, t; extrapolation = ExtrapolationType.Extension
+                )
+            )
+        else
             LinearInterpolation(
                 u, t; extrapolation = ExtrapolationType.Extension
             )
-        )
+        end
 
         for (_t, _u) in zip(t, u)
             @test A(_t) == _u
@@ -54,14 +66,18 @@ end
         @test @inferred(output_size(A)) == ()
 
         u = vcat(2.0collect(1:10)', 3.0collect(1:10)')
-        @test @inferred(
-            LinearInterpolation(
+        if t isa AbstractRange
+            @test @inferred(
+                LinearInterpolation(
+                    u, t; extrapolation = ExtrapolationType.Extension
+                )
+            ) isa LinearInterpolation broken = VERSION <
+                v"1.11"
+        else
+            @test LinearInterpolation(
                 u, t; extrapolation = ExtrapolationType.Extension
-            )
-        ) isa LinearInterpolation broken = VERSION <
-            v"1.11" &&
-            t isa
-            AbstractRange
+            ) isa LinearInterpolation
+        end
         A = LinearInterpolation(
             u, t; extrapolation = ExtrapolationType.Extension
         )
@@ -79,14 +95,18 @@ end
         y = 2:4
         u_ = x' .* y
         u = [u_[:, i] for i in 1:size(u_, 2)]
-        @test @inferred(
-            LinearInterpolation(
+        if t isa AbstractRange
+            @test @inferred(
+                LinearInterpolation(
+                    u, t; extrapolation = ExtrapolationType.Extension
+                )
+            ) isa LinearInterpolation broken = VERSION <
+                v"1.11"
+        else
+            @test LinearInterpolation(
                 u, t; extrapolation = ExtrapolationType.Extension
-            )
-        ) isa LinearInterpolation broken = VERSION <
-            v"1.11" &&
-            t isa
-            AbstractRange
+            ) isa LinearInterpolation
+        end
         A = LinearInterpolation(
             u, t; extrapolation = ExtrapolationType.Extension
         )
@@ -98,11 +118,17 @@ end
 
         # Test allocation-free interpolation with StaticArrays
         u_s = [convert(SVector{length(y), eltype(u_)}, i) for i in u]
-        @test @inferred(
-            LinearInterpolation(
+        if t isa AbstractRange
+            @test @inferred(
+                LinearInterpolation(
+                    u_s, t; extrapolation = ExtrapolationType.Extension
+                )
+            ) isa LinearInterpolation
+        else
+            @test LinearInterpolation(
                 u_s, t; extrapolation = ExtrapolationType.Extension
-            )
-        ) isa LinearInterpolation
+            ) isa LinearInterpolation
+        end
         A_s = LinearInterpolation(u_s, t; extrapolation = ExtrapolationType.Extension)
         for x in (0, 5.5, 11)
             @test A(x) == A_s(x)
@@ -184,7 +210,9 @@ end
     # Test type stability
     u = Float32.(1:5)
     t = Float32.(1:5)
-    A1 = @inferred(LinearInterpolation(u, t; extrapolation = ExtrapolationType.Extension))
+    # `Float32.(1:5)` materialises a `Vector{Float32}`; the constructor is
+    # value-dependent for `Vector` knots (see Type Inference testset).
+    A1 = LinearInterpolation(u, t; extrapolation = ExtrapolationType.Extension)
     u = 1:5
     t = 1:5
     A2 = @inferred(LinearInterpolation(u, t; extrapolation = ExtrapolationType.Extension))
@@ -193,7 +221,8 @@ end
     A3 = @inferred(LinearInterpolation(u, t; extrapolation = ExtrapolationType.Extension))
     u = [1 // i for i in 1:5]
     t = [1 // (6 - i) for i in 1:5]
-    A4 = @inferred(LinearInterpolation(u, t; extrapolation = ExtrapolationType.Extension))
+    # Vector knots — constructor is type-unstable (see Type Inference testset).
+    A4 = LinearInterpolation(u, t; extrapolation = ExtrapolationType.Extension)
 
     F32 = Float32(1)
     F64 = Float64(1)
@@ -244,7 +273,8 @@ end
     # Test array-valued interpolation
     u = collect.(2.0collect(1:10))
     t = 1.0collect(1:10)
-    A = @inferred(LinearInterpolation(u, t; extrapolation = ExtrapolationType.Extension))
+    # Vector knots — constructor returns a Union, see Type Inference testset.
+    A = LinearInterpolation(u, t; extrapolation = ExtrapolationType.Extension)
     @test A(0) == fill(0.0)
     @test A(5.5) == fill(11.0)
     @test A(11) == fill(22)
@@ -254,17 +284,17 @@ end
     # Test constant -Inf interpolation
     u = [-Inf, -Inf]
     t = [0.0, 1.0]
-    A = @inferred(LinearInterpolation(u, t))
+    A = LinearInterpolation(u, t)
     @test A(0.0) == -Inf
     @test A(0.5) == -Inf
 
     # Test extrapolation
     u = 2.0collect(1:10)
     t = 1.0collect(1:10)
-    A = @inferred(LinearInterpolation(u, t; extrapolation = ExtrapolationType.Extension))
+    A = LinearInterpolation(u, t; extrapolation = ExtrapolationType.Extension)
     @test A(-1.0) == -2.0
     @test A(11.0) == 22.0
-    A = @inferred(LinearInterpolation(u, t))
+    A = LinearInterpolation(u, t)
     @test_throws DataInterpolations.LeftExtrapolationError A(-1.0)
     @test_throws DataInterpolations.RightExtrapolationError A(11.0)
     @test_throws DataInterpolations.LeftExtrapolationError A([-1.0, 11.0])
@@ -352,6 +382,63 @@ end
             zeros(3), [1.0, 2.0]
         )
     end
+
+    @testset "Uniform-grid fast path parity" begin
+        # The static-dispatched uniform kernel uses the lerp form
+        # `u1 + α * (u2 - u1)` with α computed from the precomputed
+        # `inv_step` / `first_val`. This is mathematically equivalent
+        # to the slope form `u1 + slope * (t - t1)` but differs by a
+        # few ulps of float roundoff. The dominant error source is the
+        # multiplication `(q - first_val) * inv_step` which produces a
+        # value at scale `length(t)` before subtracting `(idx - 1)` to
+        # recover α, costing log2(length(t)) bits of precision relative
+        # to a direct `q - t[idx]` subtract. So the realistic error
+        # scales as `length(t) * eps * max(|u|)`.
+
+        # Compare a uniform interpolation against an equivalent slope-form
+        # evaluation built by reconstructing the slopes manually.
+        function slope_form_eval(A, q)
+            idx = DataInterpolations.get_idx(A, q, A.iguesser)
+            t1 = A.t[idx]
+            u1 = A.u[idx]
+            slope = DataInterpolations.get_parameters(A, idx)
+            return u1 + slope * (q - t1)
+        end
+
+        rng = StableRNG(0xfacefeed)
+        n = 1001
+        # AbstractRange knots
+        t_r = range(0.0, 10.0; length = n)
+        # Vector knots that the props probe classifies as uniform
+        t_v = collect(t_r)
+        u = randn(rng, n)
+
+        for t in (t_r, t_v)
+            A = LinearInterpolation(u, t)
+            @test A.t_props.is_uniform
+            @test A.is_uniform_static === Val(true)
+
+            # Tolerance scaled to `length(t) * eps * max(|u|)`; the realistic
+            # ulp gap at the per-segment scale is O(length(t)).
+            tol = n * eps(Float64) * maximum(abs, u)
+            qs = sort!(rand(rng, 5000) .* 9.999)
+            for q in qs
+                @test isapprox(A(q), slope_form_eval(A, q); atol = tol, rtol = 0)
+            end
+        end
+
+        # Non-uniform must still take the slope-form path and produce the
+        # exact same value as the manual slope-form reconstruction.
+        t_nu = sort!(rand(StableRNG(0xcafef00d), n)) .* 10.0
+        A_nu = LinearInterpolation(u, t_nu)
+        @test !A_nu.t_props.is_uniform
+        @test A_nu.is_uniform_static === Val(false)
+        qs_nu = sort!(rand(StableRNG(0x0b0bcafe), 5000)) .* (last(t_nu) - first(t_nu)) .+
+            first(t_nu)
+        for q in qs_nu
+            @test A_nu(q) == slope_form_eval(A_nu, q)
+        end
+    end
 end
 
 @testset "Quadratic Interpolation" begin
@@ -1567,7 +1654,8 @@ end
     ut2 = Float64[0.1, 0.2, 0.3, 0.4, 0.5]
     for u in (ut1, ut2), t in (ut1, ut2)
 
-        interp = @inferred(LinearInterpolation(ut1, ut2))
+        # Vector knots — constructor returns a Union, see Type Inference testset.
+        interp = LinearInterpolation(ut1, ut2)
         for xs in (u, t)
             ys = @inferred(interp(xs))
             @test ys isa Vector{typeof(interp(first(xs)))}

From d4380e3b8784ef08ec5d5df211eba6b7b92c1528 Mon Sep 17 00:00:00 2001
From: "Chris Rackauckas (Claude)" <accounts@chrisrackauckas.com>
Date: Tue, 9 Jun 2026 21:58:49 -0400
Subject: [PATCH 15/24] Uniform fast path: clamp before truncating, verify cell
 against live knots
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Two correctness fixes for the statically-dispatched LinearInterpolation
uniform-grid kernel:

- Clamp the closed-form float position in the float domain before
  unsafe_trunc. With Extension extrapolation the query can be far
  outside the knot span, where the position exceeds typemax(Int) and
  unsafe_trunc is UB (returned garbage indices for t = 1e300).

- Verify the guessed cell and its spacing against the live knots before
  using it. push!/append! mutate A.t while t_props (and the IsUniform
  type tag) keep their construction-time values, so the precomputed
  first_val/inv_step can go stale; a caller-forced is_uniform = true on
  non-uniform knots is the same hazard. Previously both silently
  corrupted interpolated values. On verification failure the evaluation
  falls back to the general slope-form path (slower, always correct),
  which is extracted into _linear_slope_interpolate so both methods
  share it. α is now computed cell-locally from the verified left knot,
  which also tightens the lerp-vs-slope roundoff gap.

Regression tests: Extension extrapolation at ±1e300, a knot vector
uniform at the sampled probe points but jittered between them (must not
be classified uniform), and push!-after-construction breaking the
spacing.

Co-Authored-By: Claude Fable 5 <noreply@anthropic.com>
Co-Authored-By: Chris Rackauckas <accounts@chrisrackauckas.com>
---
 src/interpolation_methods.jl | 45 ++++++++++++++++++++++++++++--------
 test/interpolation_tests.jl  | 37 +++++++++++++++++++++++++++++
 2 files changed, 72 insertions(+), 10 deletions(-)

diff --git a/src/interpolation_methods.jl b/src/interpolation_methods.jl
index 4129a207..8197e763 100644
--- a/src/interpolation_methods.jl
+++ b/src/interpolation_methods.jl
@@ -171,6 +171,10 @@ end
 
 # Linear Interpolation
 function _interpolate(A::LinearInterpolation{<:AbstractVector}, t::Number, iguess)
+    return _linear_slope_interpolate(A, t, iguess)
+end
+
+function _linear_slope_interpolate(A::LinearInterpolation, t::Number, iguess)
     if isnan(t)
         # For correct derivative with NaN
         idx = firstindex(A.u)
@@ -231,17 +235,40 @@ function _interpolate(
     # Closed-form index lookup on a uniform grid: `f` is the float position
     # in `[0, length-1]`, `idx0` its floor (zero-based), `α` the fractional
     # part. Clamping into `[0, length-2]` keeps `idx0 + 1` and `idx0 + 2`
-    # in bounds for the two-sample load below.
-    f = (t - A.t_props.first_val) * A.t_props.inv_step
+    # in bounds for the two-sample load below. The clamp happens in the
+    # float domain before truncating: with Extension extrapolation `t` can
+    # be far outside the knot span, where `f` exceeds typemax(Int) and
+    # `unsafe_trunc` is UB.
+    props = A.t_props
+    f = (t - props.first_val) * props.inv_step
     n = length(A.t)
-    idx0 = unsafe_trunc(Int, floor(f))
-    if idx0 < 0
-        idx0 = 0
-    elseif idx0 > n - 2
-        idx0 = n - 2
+    idx0 = if f < 0
+        0
+    elseif f > n - 2
+        n - 2
+    else
+        unsafe_trunc(Int, floor(f))
+    end
+    @inbounds t1 = A.t[idx0 + 1]
+    @inbounds t2 = A.t[idx0 + 2]
+    # Verify the guessed cell against the live knots. `push!`/`append!`
+    # mutate `A.t` while `t_props` (and the `IsUniform` type tag) keep
+    # their construction-time values, so the precomputed `first_val` /
+    # `inv_step` can go stale; a caller-forced `is_uniform = true` on
+    # non-uniform knots is the same hazard. The cell check catches a
+    # wrong segment; the spacing check bounds the α error when the cell
+    # is right but the cached `inv_step` no longer matches the local
+    # spacing. The 1e-6 slack tolerates accumulated float roundoff on
+    # long validated-uniform vectors while rejecting any real spacing
+    # change. On failure, evaluate via the general slope-form path
+    # (slower, always correct).
+    in_cell = (t1 <= t || idx0 == 0) && (t <= t2 || idx0 == n - 2)
+    spacing_ok = abs((t2 - t1) * props.inv_step - 1) <= 1.0e-6
+    if !(in_cell && spacing_ok)
+        return _linear_slope_interpolate(A, t, iguess)
     end
     A.iguesser.idx_prev[] = idx0 + 1
-    α = f - idx0
+    α = (t - t1) * props.inv_step
     @inbounds u1 = A.u[idx0 + 1]
     @inbounds u2 = A.u[idx0 + 2]
     Δu = α * (u2 - u1)
@@ -249,8 +276,6 @@ function _interpolate(
         # When NaN appears in `u` adjacent to the segment, `0 * NaN = NaN`
         # poisons the answer at exact-knot queries. Resolve by comparing
         # the query against the knot values directly.
-        @inbounds t1 = A.t[idx0 + 1]
-        @inbounds t2 = A.t[idx0 + 2]
         if t == t2
             return u2 + zero(Δu)
         elseif t == t1
diff --git a/test/interpolation_tests.jl b/test/interpolation_tests.jl
index 3a0b8de5..abc39ff5 100644
--- a/test/interpolation_tests.jl
+++ b/test/interpolation_tests.jl
@@ -438,6 +438,43 @@ end
         for q in qs_nu
             @test A_nu(q) == slope_form_eval(A_nu, q)
         end
+
+        # Vector knots uniform at the sampled probe points but jittered
+        # between them must not be classified uniform — a false positive
+        # here would silently corrupt interpolated values on the fast path.
+        t_trick = collect(1.0:101.0)
+        t_trick[52:60] .= range(54.5, 60.0, length = 9)
+        A_trick = LinearInterpolation(randn(StableRNG(0xdeadbeef), 101), t_trick)
+        @test !A_trick.t_props.is_uniform
+        @test A_trick.is_uniform_static === Val(false)
+
+        # Extension extrapolation reaches the fast path with t far outside
+        # the knot span, where the closed-form float index exceeds
+        # typemax(Int); the kernel must clamp before truncating.
+        A_ext = LinearInterpolation(
+            u, t_v; extrapolation = ExtrapolationType.Extension
+        )
+        for q in (1.0e300, -1.0e300)
+            @test isapprox(A_ext(q), slope_form_eval(A_ext, q); rtol = 1.0e-10)
+        end
+
+        # push! mutates A.t while t_props (and the IsUniform type tag)
+        # keep their construction-time values. The fast path must detect
+        # the stale cell/spacing against the live knots and fall back
+        # rather than silently interpolate with the stale inv_step.
+        t_m = collect(0.0:1.0:10.0)
+        A_m = LinearInterpolation(sin.(t_m), t_m)
+        @test A_m.is_uniform_static === Val(true)
+        push!(A_m, -0.3, 10.5)   # breaks the uniform spacing (1.0 → 0.5)
+        # Queries in the mutated region must fall back to the slope path
+        # (exact match); queries in the untouched uniform region still
+        # take the lerp fast path (equal up to a few ulps).
+        for q in (10.1, 10.25, 10.4)
+            @test A_m(q) == slope_form_eval(A_m, q)
+        end
+        for q in (5.5, 0.3)
+            @test isapprox(A_m(q), slope_form_eval(A_m, q); atol = 1.0e-12)
+        end
     end
 end
 

From 210b8c8635abdb079644ce55e36455bf8bdddeac Mon Sep 17 00:00:00 2001
From: "Chris Rackauckas (Claude)" <accounts@chrisrackauckas.com>
Date: Tue, 9 Jun 2026 21:59:11 -0400
Subject: [PATCH 16/24] Reuse the cached SearchProperties when resolving the
 search strategy
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Constructors computed t_props (possibly caller-supplied via the
search_properties kwarg) and then called Auto(t), which re-ran the
SearchProperties probe internally and ignored the cached/supplied
props — a redundant O(n) scan and an inconsistency where
A.strategy.props could disagree with A.t_props. Resolution now goes
through Auto(t, t_props) so the two always match.

Co-Authored-By: Claude Fable 5 <noreply@anthropic.com>
Co-Authored-By: Chris Rackauckas <accounts@chrisrackauckas.com>
---
 src/integral_inverses.jl    |  4 ++--
 src/interpolation_caches.jl | 26 +++++++++++++-------------
 src/interpolation_utils.jl  | 12 ++++++++----
 3 files changed, 23 insertions(+), 19 deletions(-)

diff --git a/src/integral_inverses.jl b/src/integral_inverses.jl
index f5aef1f4..4338967b 100644
--- a/src/integral_inverses.jl
+++ b/src/integral_inverses.jl
@@ -46,7 +46,7 @@ struct LinearInterpolationIntInv{uType, tType, itpType, T, propsType, strategyTy
     function LinearInterpolationIntInv(
             u, t, A, extrapolation_left, extrapolation_right, t_props,
         )
-        strategy = _resolve_strategy(t)
+        strategy = _resolve_strategy(t, t_props)
         return new{
             typeof(u), typeof(t), typeof(A), eltype(u),
             typeof(t_props), typeof(strategy),
@@ -117,7 +117,7 @@ struct ConstantInterpolationIntInv{uType, tType, itpType, T, propsType, strategy
     function ConstantInterpolationIntInv(
             u, t, A, extrapolation_left, extrapolation_right, t_props,
         )
-        strategy = _resolve_strategy(t)
+        strategy = _resolve_strategy(t, t_props)
         return new{
             typeof(u), typeof(t), typeof(A), eltype(u),
             typeof(t_props), typeof(strategy),
diff --git a/src/interpolation_caches.jl b/src/interpolation_caches.jl
index 6eaf3d27..b88bac82 100644
--- a/src/interpolation_caches.jl
+++ b/src/interpolation_caches.jl
@@ -45,7 +45,7 @@ struct LinearInterpolation{
             u, t, I, p, extrapolation_left, extrapolation_right,
             cache_parameters, t_props, ::Val{IsUniform},
         ) where {IsUniform}
-        strategy = _resolve_strategy(t)
+        strategy = _resolve_strategy(t, t_props)
         return new{
             typeof(u), typeof(t), typeof(I), typeof(p.slope),
             eltype(u), typeof(t_props), typeof(strategy), IsUniform,
@@ -139,7 +139,7 @@ struct QuadraticInterpolation{uType, tType, IType, pType, T, propsType, strategy
         )
         mode ∈ (:Forward, :Backward) ||
             error("mode should be :Forward or :Backward for QuadraticInterpolation")
-        strategy = _resolve_strategy(t)
+        strategy = _resolve_strategy(t, t_props)
         return new{
             typeof(u), typeof(t), typeof(I), typeof(p.α),
             eltype(u), typeof(t_props), typeof(strategy),
@@ -217,7 +217,7 @@ struct LagrangeInterpolation{uType, tType, T, bcacheType, propsType, strategyTyp
         bcache = zeros(eltype(u[1]), n + 1)
         idxs = zeros(Int, n + 1)
         fill!(bcache, NaN)
-        strategy = _resolve_strategy(t)
+        strategy = _resolve_strategy(t, t_props)
         return new{
             typeof(u), typeof(t), eltype(u), typeof(bcache),
             typeof(t_props), typeof(strategy),
@@ -303,7 +303,7 @@ struct AkimaInterpolation{
             u, t, I, b, c, d, extrapolation_left,
             extrapolation_right, cache_parameters, t_props
         )
-        strategy = _resolve_strategy(t)
+        strategy = _resolve_strategy(t, t_props)
         return new{
             typeof(u), typeof(t), typeof(I), typeof(b), typeof(c),
             typeof(d), eltype(u), typeof(t_props), typeof(strategy),
@@ -458,7 +458,7 @@ struct ConstantInterpolation{uType, tType, IType, T, propsType, strategyType} <:
             u, t, I, dir, extrapolation_left, extrapolation_right,
             cache_parameters, t_props
         )
-        strategy = _resolve_strategy(t)
+        strategy = _resolve_strategy(t, t_props)
         return new{
             typeof(u), typeof(t), typeof(I), eltype(u),
             typeof(t_props), typeof(strategy),
@@ -539,7 +539,7 @@ struct SmoothedConstantInterpolation{
             u, t, I, p, d_max, extrapolation_left,
             extrapolation_right, cache_parameters, t_props
         )
-        strategy = _resolve_strategy(t)
+        strategy = _resolve_strategy(t, t_props)
         return new{
             typeof(u), typeof(t), typeof(I), typeof(p.d),
             typeof(p.c), typeof(d_max), eltype(u), typeof(t_props), typeof(strategy),
@@ -621,7 +621,7 @@ struct QuadraticSpline{
             u, t, I, p, k, c, sc, extrapolation_left,
             extrapolation_right, cache_parameters, t_props
         )
-        strategy = _resolve_strategy(t)
+        strategy = _resolve_strategy(t, t_props)
         return new{
             typeof(u), typeof(t), typeof(I), typeof(p.α), typeof(k),
             typeof(c), typeof(sc), eltype(u), typeof(t_props), typeof(strategy),
@@ -758,7 +758,7 @@ struct CubicSpline{uType, tType, IType, pType, hType, zType, T, propsType, strat
             u, t, I, p, h, z, extrapolation_left,
             extrapolation_right, cache_parameters, t_props
         )
-        strategy = _resolve_strategy(t)
+        strategy = _resolve_strategy(t, t_props)
         return new{
             typeof(u), typeof(t), typeof(I), typeof(p.c₁),
             typeof(h), typeof(z), eltype(u), typeof(t_props), typeof(strategy),
@@ -970,7 +970,7 @@ struct BSplineInterpolation{
             extrapolation_right,
             t_props,
         )
-        strategy = _resolve_strategy(t)
+        strategy = _resolve_strategy(t, t_props)
         return new{
             typeof(u), typeof(t), typeof(p), typeof(k),
             typeof(c), typeof(sc), eltype(u), typeof(t_props), typeof(strategy),
@@ -1219,7 +1219,7 @@ struct BSplineApprox{
             extrapolation_right,
             t_props,
         )
-        strategy = _resolve_strategy(t)
+        strategy = _resolve_strategy(t, t_props)
         return new{
             typeof(u), typeof(t), typeof(p), typeof(k),
             typeof(c), typeof(sc), eltype(u), typeof(t_props), typeof(strategy),
@@ -1496,7 +1496,7 @@ struct CubicHermiteSpline{
             du, u, t, I, p, extrapolation_left, extrapolation_right,
             cache_parameters, t_props
         )
-        strategy = _resolve_strategy(t)
+        strategy = _resolve_strategy(t, t_props)
         return new{
             typeof(u), typeof(t), typeof(I), typeof(du),
             typeof(p.c₁), eltype(u), typeof(t_props), typeof(strategy),
@@ -1607,7 +1607,7 @@ struct QuinticHermiteSpline{
             ddu, du, u, t, I, p, extrapolation_left,
             extrapolation_right, cache_parameters, t_props
         )
-        strategy = _resolve_strategy(t)
+        strategy = _resolve_strategy(t, t_props)
         return new{
             typeof(u), typeof(t), typeof(I), typeof(du),
             typeof(ddu), typeof(p.c₁), eltype(u), typeof(t_props), typeof(strategy),
@@ -1678,7 +1678,7 @@ struct SmoothArcLengthInterpolation{
             I, extrapolation_left, extrapolation_right,
             out, derivative, in_place, t_props
         )
-        strategy = _resolve_strategy(t)
+        strategy = _resolve_strategy(t, t_props)
         return new{
             typeof(u), typeof(t), typeof(I), eltype(radius),
             eltype(d), typeof(shape_itp), eltype(u), typeof(t_props), typeof(strategy),
diff --git a/src/interpolation_utils.jl b/src/interpolation_utils.jl
index 9454a1ed..4a7e406e 100644
--- a/src/interpolation_utils.jl
+++ b/src/interpolation_utils.jl
@@ -220,7 +220,7 @@ end
 #   - Resolves a concrete `StrategyKind` from `length(t)` + the
 #     `SearchProperties{T}(t)` probe at construction.
 #   - For uniformly-spaced data (any `AbstractRange` or a `Vector` whose
-#     9-point linearity probe is within ~1e-12 of exact uniformity),
+#     every element lies within ~1e-12 of the exactly-uniform line),
 #     picks `KIND_UNIFORM_STEP` and bakes the precomputed `inv_step`
 #     into `props`. The hot path is then one subtract, one multiply,
 #     one truncate per query — no division, no logarithmic search.
@@ -233,6 +233,11 @@ end
 # both ratio-promote to `Float64`, so `Auto{Float64}` covers the common
 # Float-knot cases.
 @inline _resolve_strategy(t::AbstractVector) = FindFirstFunctions.Auto(t)
+# Props-aware form: reuses the already-computed (possibly caller-supplied)
+# `SearchProperties` instead of re-probing `t` inside `Auto(t)`, and keeps
+# `A.strategy.props` consistent with `A.t_props`.
+@inline _resolve_strategy(t::AbstractVector, props::FindFirstFunctions.SearchProperties) =
+    FindFirstFunctions.Auto(t, props)
 
 # Static-uniformity tag for caches. `AbstractRange{<:Real}` is uniform at the
 # type level — `Val(true)` is a compile-time constant. For `AbstractVector`
@@ -253,9 +258,8 @@ function get_idx(
     )
     tvec = A.t
     ub = length(tvec) + ub_shift
-    # `A.strategy` is a concrete `SearchStrategy` singleton resolved at
-    # construction time. Static dispatch avoids the `Auto` per-call
-    # `_auto_pick` branch.
+    # `A.strategy` is a concrete `Auto{T}` resolved at construction time;
+    # its stored kind dispatches without any per-call re-probing.
     strat = A.strategy
     raw = if side == :last
         searchsortedlast(strat, tvec, t, iguess)

From 7698d0a2fa342e18d654acc2cd918037c397ce55 Mon Sep 17 00:00:00 2001
From: "Chris Rackauckas (Claude)" <accounts@chrisrackauckas.com>
Date: Tue, 9 Jun 2026 21:59:11 -0400
Subject: [PATCH 17/24] Document v9 search changes in NEWS; drop stale
 looks_linear docs entry

DataInterpolations.looks_linear no longer exists; the @docs block
referencing it would fail the docs build. NEWS now records the breaking
assume_linear_t removal, the search_properties kwarg, the
Auto-resolved knot search, the uniform fast path, and the O(n)
QuadraticSpline construction.

Co-Authored-By: Claude Fable 5 <noreply@anthropic.com>
Co-Authored-By: Chris Rackauckas <accounts@chrisrackauckas.com>
---
 NEWS.md            | 12 ++++++++++++
 docs/src/manual.md |  1 -
 2 files changed, 12 insertions(+), 1 deletion(-)

diff --git a/NEWS.md b/NEWS.md
index 97522f7b..1363f86e 100644
--- a/NEWS.md
+++ b/NEWS.md
@@ -4,6 +4,18 @@
 
   - The deprecated `RegularizationTools` extension and the `RegularizationSmooth` interpolation type have been removed. `RegularizationTools` was deprecated and capped `Optim` to `≤ 1`; removing it restores support for `Optim` v2.
 
+  - The `assume_linear_t` constructor keyword and the `DataInterpolations.looks_linear` utility have been removed. Knot-vector structure is now probed once at construction through `FindFirstFunctions.SearchProperties(t)` and cached on every interpolation as `A.t_props`; uniformly-spaced knots are detected exactly and automatically. To override the probe, pass the new `search_properties` keyword accepted by every constructor, e.g. `LinearInterpolation(u, t; search_properties = FindFirstFunctions.SearchProperties(t; is_uniform = true))`.
+
+## New features
+
+  - Every interpolation constructor accepts a `search_properties::Union{Nothing, FindFirstFunctions.SearchProperties}` keyword. The default `nothing` probes `t` at construction; passing a pre-built `SearchProperties` skips the probe (useful when constructing many interpolations over the same knot vector).
+
+  - Knot search is dispatched through `FindFirstFunctions.Auto(t)` resolved at construction: uniformly-spaced knots (any `AbstractRange`, or vectors detected as exactly uniform) use a closed-form O(1) lookup; short non-uniform knot vectors use a linear scan; everything else keeps the previous bracketed gallop.
+
+  - `LinearInterpolation` with uniformly-spaced knots and floating-point values takes a statically-dispatched fast path (closed-form index + lerp, verified against the live knots) — 5-10x faster per query on uniform grids.
+
+  - `QuadraticSpline` construction is now O(n) instead of O(n^2) (running locator in `quadratic_spline_params`), e.g. ~870x faster at 100k points.
+
 # DataInterpolations v5 Release Notes
 
 ## Breaking changes
diff --git a/docs/src/manual.md b/docs/src/manual.md
index f11c11d4..c242b8d8 100644
--- a/docs/src/manual.md
+++ b/docs/src/manual.md
@@ -19,7 +19,6 @@ QuinticHermiteSpline
 # Utility Functions
 
 ```@docs
-DataInterpolations.looks_linear
 DataInterpolations.output_dim
 DataInterpolations.output_size
 ```

From 292ed0a44ab663771ee4cf217175270114713bd7 Mon Sep 17 00:00:00 2001
From: "Chris Rackauckas (Claude)" <accounts@chrisrackauckas.com>
Date: Tue, 9 Jun 2026 22:45:55 -0400
Subject: [PATCH 18/24] Restore Vector-knot constructor inference coverage;
 document search_properties kwarg

- The Type Inference testset had switched every method to Range knots
  to accommodate LinearInterpolation's value-dependent IsUniform tag,
  dropping Vector-knot constructor inference for the other types, which
  do not carry the tag and still infer. Vector knots are restored for
  all methods; LinearInterpolation gets the Range-knot constructor
  check plus a query-side inference check on a Vector-knot instance.
- Add the search_properties keyword bullet to every constructor
  docstring (the assume_linear_t bullet it replaces was removed without
  a replacement).
- Drop conversation/PR references from bench file headers.

Co-Authored-By: Claude Fable 5 <noreply@anthropic.com>
Co-Authored-By: Chris Rackauckas <accounts@chrisrackauckas.com>
---
 bench/cross_library_comparison.jl |  2 +-
 bench/di_perq_bench.jl            |  3 +-
 src/interpolation_caches.jl       | 54 +++++++++++++++++++++++++++++++
 test/interface.jl                 | 23 +++++++------
 4 files changed, 71 insertions(+), 11 deletions(-)

diff --git a/bench/cross_library_comparison.jl b/bench/cross_library_comparison.jl
index 24bcbc23..939f1dfa 100644
--- a/bench/cross_library_comparison.jl
+++ b/bench/cross_library_comparison.jl
@@ -1,7 +1,7 @@
 #=
 Cross-library 1D interpolation benchmark for DataInterpolations.jl.
 
-Compares DataInterpolations.jl (PR #529 branch, with cached Auto(t_props)) against
+Compares DataInterpolations.jl against
 Interpolations.jl, Dierckx.jl, BasicInterpolators.jl, PCHIPInterpolation.jl,
 and FastInterpolations.jl.
 
diff --git a/bench/di_perq_bench.jl b/bench/di_perq_bench.jl
index f1a8c4ee..fe44b8b6 100644
--- a/bench/di_perq_bench.jl
+++ b/bench/di_perq_bench.jl
@@ -1,5 +1,6 @@
 #=
-DI per-query micro-bench, focused on the cells the user asked about:
+DI per-query micro-bench over the knot/query regimes where the search
+strategy dominates:
 
    Workload                                | DI before | DI after | FastInterp
    --------------------------------------- | --------- | -------- | ----------
diff --git a/src/interpolation_caches.jl b/src/interpolation_caches.jl
index b88bac82..f3d346a9 100644
--- a/src/interpolation_caches.jl
+++ b/src/interpolation_caches.jl
@@ -22,6 +22,9 @@ Extrapolation extends the last linear polynomial on each side.
     the possible options. This keyword is ignored if `extrapolation != Extrapolation.none`.
   - `cache_parameters`: precompute parameters at initialization for faster interpolation
     computations. Note: if activated, `u` and `t` should not be modified. Defaults to `false`.
+  - `search_properties`: a pre-built `FindFirstFunctions.SearchProperties` for `t`, used
+    to skip the construction-time knot probe or override its result (e.g. built with
+    `is_uniform = true`). Defaults to `nothing`, which probes `t` automatically.
 """
 struct LinearInterpolation{
         uType, tType, IType, pType, T, propsType, strategyType, IsUniform,
@@ -119,6 +122,9 @@ Extrapolation extends the last quadratic polynomial on each side.
   - `extrapolation_right`: The extrapolation type applied right of the data. See `extrapolation` for
     the possible options. This keyword is ignored if `extrapolation != Extrapolation.none`.
   - `cache_parameters`: precompute parameters at initialization for faster interpolation computations. Note: if activated, `u` and `t` should not be modified. Defaults to `false`.
+  - `search_properties`: a pre-built `FindFirstFunctions.SearchProperties` for `t`, used
+    to skip the construction-time knot probe or override its result (e.g. built with
+    `is_uniform = true`). Defaults to `nothing`, which probes `t` automatically.
 """
 struct QuadraticInterpolation{uType, tType, IType, pType, T, propsType, strategyType} <:
     AbstractInterpolation{T}
@@ -200,6 +206,10 @@ It is the method of interpolation using Lagrange polynomials of (k-1)th order pa
     the possible options. This keyword is ignored if `extrapolation != Extrapolation.none`.
   - `extrapolation_right`: The extrapolation type applied right of the data. See `extrapolation` for
     the possible options. This keyword is ignored if `extrapolation != Extrapolation.none`.
+  - `search_properties`: a pre-built `FindFirstFunctions.SearchProperties` for `t`, used
+    to skip the construction-time knot probe or override its result (e.g. built with
+    `is_uniform = true`). Defaults to `nothing`, which probes `t` automatically.
+
 """
 struct LagrangeInterpolation{uType, tType, T, bcacheType, propsType, strategyType} <:
     AbstractInterpolation{T}
@@ -282,6 +292,9 @@ Extrapolation extends the last cubic polynomial on each side.
   - `extrapolation_right`: The extrapolation type applied right of the data. See `extrapolation` for
     the possible options. This keyword is ignored if `extrapolation != Extrapolation.none`.
   - `cache_parameters`: precompute parameters at initialization for faster interpolation computations. Note: if activated, `u` and `t` should not be modified. Defaults to `false`.
+  - `search_properties`: a pre-built `FindFirstFunctions.SearchProperties` for `t`, used
+    to skip the construction-time knot probe or override its result (e.g. built with
+    `is_uniform = true`). Defaults to `nothing`, which probes `t` automatically.
 """
 struct AkimaInterpolation{
         uType, tType, IType, bType, cType, dType, T, propsType, strategyType,
@@ -440,6 +453,9 @@ Extrapolation extends the last constant polynomial at the end points on each sid
   - `extrapolation_right`: The extrapolation type applied right of the data. See `extrapolation` for
     the possible options. This keyword is ignored if `extrapolation != Extrapolation.none`.
   - `cache_parameters`: precompute parameters at initialization for faster interpolation computations. Note: if activated, `u` and `t` should not be modified. Defaults to `false`.
+  - `search_properties`: a pre-built `FindFirstFunctions.SearchProperties` for `t`, used
+    to skip the construction-time knot probe or override its result (e.g. built with
+    `is_uniform = true`). Defaults to `nothing`, which probes `t` automatically.
 """
 struct ConstantInterpolation{uType, tType, IType, T, propsType, strategyType} <:
     AbstractInterpolation{T}
@@ -519,6 +535,9 @@ except when using extrapolation types `Constant` or `Extension`.
   - `extrapolation_right`: The extrapolation type applied right of the data. See `extrapolation` for
     the possible options. This keyword is ignored if `extrapolation != Extrapolation.none`.
   - `cache_parameters`: precompute parameters at initialization for faster interpolation computations. Note: if activated, `u` and `t` should not be modified. Defaults to `false`.
+  - `search_properties`: a pre-built `FindFirstFunctions.SearchProperties` for `t`, used
+    to skip the construction-time knot probe or override its result (e.g. built with
+    `is_uniform = true`). Defaults to `nothing`, which probes `t` automatically.
 """
 struct SmoothedConstantInterpolation{
         uType, tType, IType, dType, cType, dmaxType, T, propsType, strategyType,
@@ -599,6 +618,9 @@ Extrapolation extends the last quadratic polynomial on each side.
   - `extrapolation_right`: The extrapolation type applied right of the data. See `extrapolation` for
     the possible options. This keyword is ignored if `extrapolation != Extrapolation.none`.
   - `cache_parameters`: precompute parameters at initialization for faster interpolation computations. Note: if activated, `u` and `t` should not be modified. Defaults to `false`.
+  - `search_properties`: a pre-built `FindFirstFunctions.SearchProperties` for `t`, used
+    to skip the construction-time knot probe or override its result (e.g. built with
+    `is_uniform = true`). Defaults to `nothing`, which probes `t` automatically.
 """
 struct QuadraticSpline{
         uType, tType, IType, pType, kType, cType, scType, T, propsType, strategyType,
@@ -739,6 +761,9 @@ Second derivative on both ends are zero, which are also called "natural" boundar
   - `extrapolation_right`: The extrapolation type applied right of the data. See `extrapolation` for
     the possible options. This keyword is ignored if `extrapolation != Extrapolation.none`.
   - `cache_parameters`: precompute parameters at initialization for faster interpolation computations. Note: if activated, `u` and `t` should not be modified. Defaults to `false`.
+  - `search_properties`: a pre-built `FindFirstFunctions.SearchProperties` for `t`, used
+    to skip the construction-time knot probe or override its result (e.g. built with
+    `is_uniform = true`). Defaults to `nothing`, which probes `t` automatically.
 """
 struct CubicSpline{uType, tType, IType, pType, hType, zType, T, propsType, strategyType} <:
     AbstractInterpolation{T}
@@ -937,6 +962,10 @@ Extrapolation is a constant polynomial of the end points on each side.
     the possible options. This keyword is ignored if `extrapolation != Extrapolation.none`.
   - `extrapolation_right`: The extrapolation type applied right of the data. See `extrapolation` for
     the possible options. This keyword is ignored if `extrapolation != Extrapolation.none`.
+  - `search_properties`: a pre-built `FindFirstFunctions.SearchProperties` for `t`, used
+    to skip the construction-time knot probe or override its result (e.g. built with
+    `is_uniform = true`). Defaults to `nothing`, which probes `t` automatically.
+
 """
 struct BSplineInterpolation{
         uType, tType, pType, kType, cType, scType, T, propsType, strategyType,
@@ -1184,6 +1213,10 @@ Extrapolation is a constant polynomial of the end points on each side.
     the possible options. This keyword is ignored if `extrapolation != Extrapolation.none`.
   - `extrapolation_right`: The extrapolation type applied right of the data. See `extrapolation` for
     the possible options. This keyword is ignored if `extrapolation != Extrapolation.none`.
+  - `search_properties`: a pre-built `FindFirstFunctions.SearchProperties` for `t`, used
+    to skip the construction-time knot probe or override its result (e.g. built with
+    `is_uniform = true`). Defaults to `nothing`, which probes `t` automatically.
+
 """
 struct BSplineApprox{
         uType, tType, pType, kType, cType, scType, T, propsType, strategyType,
@@ -1476,6 +1509,9 @@ It is a Cubic Hermite interpolation, which is a piece-wise third degree polynomi
   - `extrapolation_right`: The extrapolation type applied right of the data. See `extrapolation` for
     the possible options. This keyword is ignored if `extrapolation != Extrapolation.none`.
   - `cache_parameters`: precompute parameters at initialization for faster interpolation computations. Note: if activated, `u` and `t` should not be modified. Defaults to `false`.
+  - `search_properties`: a pre-built `FindFirstFunctions.SearchProperties` for `t`, used
+    to skip the construction-time knot probe or override its result (e.g. built with
+    `is_uniform = true`). Defaults to `nothing`, which probes `t` automatically.
 """
 struct CubicHermiteSpline{
         uType, tType, IType, duType, pType, T, propsType, strategyType,
@@ -1556,6 +1592,9 @@ section 3.4 for more details.
   - `extrapolation_right`: The extrapolation type applied right of the data. See `extrapolation` for
     the possible options. This keyword is ignored if `extrapolation != Extrapolation.none`.
   - `cache_parameters`: precompute parameters at initialization for faster interpolation computations. Note: if activated, `u` and `t` should not be modified. Defaults to `false`.
+  - `search_properties`: a pre-built `FindFirstFunctions.SearchProperties` for `t`, used
+    to skip the construction-time knot probe or override its result (e.g. built with
+    `is_uniform = true`). Defaults to `nothing`, which probes `t` automatically.
 """
 function PCHIPInterpolation(u, t; kwargs...)
     u, t = munge_data(u, t)
@@ -1586,6 +1625,9 @@ It is a Quintic Hermite interpolation, which is a piece-wise fifth degree polyno
   - `extrapolation_right`: The extrapolation type applied right of the data. See `extrapolation` for
     the possible options. This keyword is ignored if `extrapolation != Extrapolation.none`.
   - `cache_parameters`: precompute parameters at initialization for faster interpolation computations. Note: if activated, `u` and `t` should not be modified. Defaults to `false`.
+  - `search_properties`: a pre-built `FindFirstFunctions.SearchProperties` for `t`, used
+    to skip the construction-time knot probe or override its result (e.g. built with
+    `is_uniform = true`). Defaults to `nothing`, which probes `t` automatically.
 """
 struct QuinticHermiteSpline{
         uType, tType, IType, duType, dduType, pType, T, propsType, strategyType,
@@ -1724,6 +1766,10 @@ If you want to do this, construct the shape interpolation yourself and use the
     the possible options. This keyword is ignored if `extrapolation != Extrapolation.none`.
   - `extrapolation_right`: The extrapolation type applied right of the data. See `extrapolation` for
     the possible options. This keyword is ignored if `extrapolation != Extrapolation.none`.
+  - `search_properties`: a pre-built `FindFirstFunctions.SearchProperties` for `t`, used
+    to skip the construction-time knot probe or override its result (e.g. built with
+    `is_uniform = true`). Defaults to `nothing`, which probes `t` automatically.
+
 """
 function SmoothArcLengthInterpolation(
         u::AbstractMatrix{U};
@@ -1770,6 +1816,10 @@ Approximate the `shape_itp` with a C¹ unit speed interpolation using line segme
     the possible options. This keyword is ignored if `extrapolation != Extrapolation.none`.
   - `extrapolation_right`: The extrapolation type applied right of the data. See `extrapolation` for
     the possible options. This keyword is ignored if `extrapolation != Extrapolation.none`.
+  - `search_properties`: a pre-built `FindFirstFunctions.SearchProperties` for `t`, used
+    to skip the construction-time knot probe or override its result (e.g. built with
+    `is_uniform = true`). Defaults to `nothing`, which probes `t` automatically.
+
 """
 function SmoothArcLengthInterpolation(
         shape_itp::AbstractInterpolation;
@@ -1842,6 +1892,10 @@ segments and circle segments.
     the possible options. This keyword is ignored if `extrapolation != Extrapolation.none`.
   - `extrapolation_right`: The extrapolation type applied right of the data. See `extrapolation` for
     the possible options. This keyword is ignored if `extrapolation != Extrapolation.none`.
+  - `search_properties`: a pre-built `FindFirstFunctions.SearchProperties` for `t`, used
+    to skip the construction-time knot probe or override its result (e.g. built with
+    `is_uniform = true`). Defaults to `nothing`, which probes `t` automatically.
+
 """
 function SmoothArcLengthInterpolation(
         u::AbstractMatrix,
diff --git a/test/interface.jl b/test/interface.jl
index a559e9c6..180aa0a4 100644
--- a/test/interface.jl
+++ b/test/interface.jl
@@ -30,21 +30,26 @@ end
 
 @testset "Type Inference" begin
     u = 2.0collect(1:10)
-    # `LinearInterpolation`'s constructor encodes uniformity in the cache's
-    # `IsUniform` type parameter. For an `AbstractRange` knot vector the tag
-    # is `Val(true)` statically, so the constructor is type-stable. For a
-    # `Vector` knot vector the tag depends on the values, so the constructor
-    # returns `Union{LinearInterpolation{..., true}, LinearInterpolation{..., false}}`.
-    # Each concrete instance is fully type-stable per query — only the
-    # construction boundary sees the union.
-    t = 1.0:10.0
+    t = 1.0collect(1:10)
+    tr = 1.0:10.0
     methods = [
         ConstantInterpolation, LinearInterpolation,
         QuadraticInterpolation, LagrangeInterpolation,
         QuadraticSpline, CubicSpline, AkimaInterpolation,
     ]
     @testset "$method" for method in methods
-        @inferred method(u, t)
+        if method === LinearInterpolation
+            # The constructor encodes uniformity in the cache's `IsUniform`
+            # type parameter: `Val(true)` statically for Range knots
+            # (constructor inferred), value-dependent for Vector knots (the
+            # constructor returns a Union over the tag; each concrete
+            # instance is type-stable per query).
+            @inferred method(u, tr)
+            A = method(u, t)
+            @inferred A(2.5)
+        else
+            @inferred method(u, t)
+        end
     end
     @testset "BSplineInterpolation" begin
         @inferred BSplineInterpolation(u, t, 3, :Uniform, :Uniform)

From d5dc0baa9f99f770fd528fa81944336991064f02 Mon Sep 17 00:00:00 2001
From: "Chris Rackauckas (Claude)" <accounts@chrisrackauckas.com>
Date: Fri, 12 Jun 2026 17:19:15 -0400
Subject: [PATCH 19/24] Migrate to FFF v3's search_last/search_first (Base
 extensions removed)

FindFirstFunctions v3 no longer extends Base.searchsortedlast /
Base.searchsortedfirst with strategy methods. get_idx now calls
FindFirstFunctions.search_last / search_first on the cached Auto
strategy, the Mooncake @zero_adjoint declarations target the new
functions, and the test helpers (test_cached_index, the derivative
cached-index check) use the qualified v3 names.

Co-Authored-By: Claude Fable 5 <noreply@anthropic.com>
Co-Authored-By: Chris Rackauckas <accounts@chrisrackauckas.com>
---
 ext/DataInterpolationsMooncakeExt.jl | 12 ++++++------
 src/interpolation_utils.jl           | 10 +++++-----
 test/Methods/derivative_tests.jl     |  4 ++--
 test/interpolation_tests.jl          |  6 +++---
 4 files changed, 16 insertions(+), 16 deletions(-)

diff --git a/ext/DataInterpolationsMooncakeExt.jl b/ext/DataInterpolationsMooncakeExt.jl
index 7dd0418c..b318af28 100644
--- a/ext/DataInterpolationsMooncakeExt.jl
+++ b/ext/DataInterpolationsMooncakeExt.jl
@@ -59,16 +59,16 @@ end
 
 # Sorted-search dispatched through `Auto{T}` carries the props' `first_val::T`
 # and `inv_step::T` Float fields, which Mooncake exposes as rdata. The
-# `searchsortedlast` / `searchsortedfirst` calls return integer indices —
-# they are positional bookkeeping, not differentiable. Declare them as
+# `search_last` / `search_first` calls return integer indices — they are
+# positional bookkeeping, not differentiable. Declare them as
 # zero-adjoint so Mooncake doesn't try to recurse into FFF's strategy
 # kernels (which contain `llvmcall` SIMD intrinsics that Mooncake cannot
 # differentiate through). DI's interpolation `_interpolate` always feeds
 # the search results into integer indexing, so the gradient flow is
 # already cut at the index boundary — zero-adjoint here is correct.
-@zero_adjoint DefaultCtx Tuple{typeof(searchsortedlast), FindFirstFunctions.Auto, AbstractVector, Any, Integer}
-@zero_adjoint DefaultCtx Tuple{typeof(searchsortedfirst), FindFirstFunctions.Auto, AbstractVector, Any, Integer}
-@zero_adjoint DefaultCtx Tuple{typeof(searchsortedlast), FindFirstFunctions.Auto, AbstractVector, Any}
-@zero_adjoint DefaultCtx Tuple{typeof(searchsortedfirst), FindFirstFunctions.Auto, AbstractVector, Any}
+@zero_adjoint DefaultCtx Tuple{typeof(FindFirstFunctions.search_last), FindFirstFunctions.Auto, AbstractVector, Any, Integer}
+@zero_adjoint DefaultCtx Tuple{typeof(FindFirstFunctions.search_first), FindFirstFunctions.Auto, AbstractVector, Any, Integer}
+@zero_adjoint DefaultCtx Tuple{typeof(FindFirstFunctions.search_last), FindFirstFunctions.Auto, AbstractVector, Any}
+@zero_adjoint DefaultCtx Tuple{typeof(FindFirstFunctions.search_first), FindFirstFunctions.Auto, AbstractVector, Any}
 
 end
diff --git a/src/interpolation_utils.jl b/src/interpolation_utils.jl
index 4a7e406e..ff6769ec 100644
--- a/src/interpolation_utils.jl
+++ b/src/interpolation_utils.jl
@@ -212,7 +212,7 @@ end
 
 # Resolve a concrete `FindFirstFunctions.SearchStrategy` for the given
 # knot vector at construction time. Stored on every interpolation cache
-# as `A.strategy` so that `get_idx`'s `searchsortedlast(A.strategy, …)` is
+# as `A.strategy` so that `get_idx`'s `search_last(A.strategy, …)` is
 # fully static-dispatched — no per-query `_auto_pick` branch.
 #
 # We dispatch to `FindFirstFunctions.Auto(t)`, which:
@@ -262,9 +262,9 @@ function get_idx(
     # its stored kind dispatches without any per-call re-probing.
     strat = A.strategy
     raw = if side == :last
-        searchsortedlast(strat, tvec, t, iguess)
+        FindFirstFunctions.search_last(strat, tvec, t, iguess)
     elseif side == :first
-        searchsortedfirst(strat, tvec, t, iguess)
+        FindFirstFunctions.search_first(strat, tvec, t, iguess)
     else
         error("side must be :first or :last")
     end
@@ -282,9 +282,9 @@ function get_idx(
     # falls back to the cached `idx_prev` otherwise.
     hint = iguess(t)
     raw = if side == :last
-        searchsortedlast(strat, tvec, t, hint)
+        FindFirstFunctions.search_last(strat, tvec, t, hint)
     elseif side == :first
-        searchsortedfirst(strat, tvec, t, hint)
+        FindFirstFunctions.search_first(strat, tvec, t, hint)
     else
         error("side must be :first or :last")
     end
diff --git a/test/Methods/derivative_tests.jl b/test/Methods/derivative_tests.jl
index 8f945ae3..0f2be6de 100644
--- a/test/Methods/derivative_tests.jl
+++ b/test/Methods/derivative_tests.jl
@@ -1,5 +1,5 @@
 using DataInterpolations, Test
-using FindFirstFunctions: BracketGallop
+using FindFirstFunctions: FindFirstFunctions, BracketGallop
 using FiniteDifferences
 using DataInterpolations: derivative, get_transition_ts
 using Symbolics
@@ -52,7 +52,7 @@ function test_derivatives(method; args = [], kwargs = [], name::String)
             if hasproperty(func, :t_props) && !func.t_props.is_uniform
                 @test abs(
                     func.iguesser.idx_prev[] -
-                        searchsortedfirst(
+                        FindFirstFunctions.search_first(
                         BracketGallop(), func.t, _t, func.iguesser(_t)
                     )
                 ) <= 1
diff --git a/test/interpolation_tests.jl b/test/interpolation_tests.jl
index abc39ff5..e581227f 100644
--- a/test/interpolation_tests.jl
+++ b/test/interpolation_tests.jl
@@ -1,5 +1,5 @@
 using DataInterpolations
-using FindFirstFunctions: GuesserHint
+using FindFirstFunctions: FindFirstFunctions, GuesserHint
 using StableRNGs
 using Optim, ForwardDiff
 using BenchmarkTools
@@ -23,10 +23,10 @@ end
 function test_cached_index(A)
     for t in range(first(A.t), last(A.t); length = 2 * length(A.t) - 1)
         A(t)
-        idx = searchsortedfirst(GuesserHint(A.iguesser), A.t, t)
+        idx = FindFirstFunctions.search_first(GuesserHint(A.iguesser), A.t, t)
         @test abs(
             A.iguesser.idx_prev[] -
-                searchsortedfirst(GuesserHint(A.iguesser), A.t, t)
+                FindFirstFunctions.search_first(GuesserHint(A.iguesser), A.t, t)
         ) <= 2
     end
     return

From 64f38e6afc67714f200097cc35d451eae0c817bc Mon Sep 17 00:00:00 2001
From: "Chris Rackauckas (Claude)" <accounts@chrisrackauckas.com>
Date: Sat, 13 Jun 2026 04:03:54 -0400
Subject: [PATCH 20/24] =?UTF-8?q?Follow=20FFF=20rename:=20search=5Flast/se?=
 =?UTF-8?q?arch=5Ffirst=20=E2=86=92=20searchsorted=5Flast/searchsorted=5Ff?=
 =?UTF-8?q?irst?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

FindFirstFunctions renamed its dispatchers to restore the 'sorted' cue.
Update get_idx, the Mooncake @zero_adjoint declarations, and the test
helpers to the new qualified names.

Co-Authored-By: Claude Fable 5 <noreply@anthropic.com>
Co-Authored-By: Chris Rackauckas <accounts@chrisrackauckas.com>
---
 ext/DataInterpolationsMooncakeExt.jl | 10 +++++-----
 src/interpolation_utils.jl           | 10 +++++-----
 test/Methods/derivative_tests.jl     |  2 +-
 test/interpolation_tests.jl          |  4 ++--
 4 files changed, 13 insertions(+), 13 deletions(-)

diff --git a/ext/DataInterpolationsMooncakeExt.jl b/ext/DataInterpolationsMooncakeExt.jl
index b318af28..57c21a1a 100644
--- a/ext/DataInterpolationsMooncakeExt.jl
+++ b/ext/DataInterpolationsMooncakeExt.jl
@@ -59,16 +59,16 @@ end
 
 # Sorted-search dispatched through `Auto{T}` carries the props' `first_val::T`
 # and `inv_step::T` Float fields, which Mooncake exposes as rdata. The
-# `search_last` / `search_first` calls return integer indices — they are
+# `searchsorted_last` / `searchsorted_first` calls return integer indices — they are
 # positional bookkeeping, not differentiable. Declare them as
 # zero-adjoint so Mooncake doesn't try to recurse into FFF's strategy
 # kernels (which contain `llvmcall` SIMD intrinsics that Mooncake cannot
 # differentiate through). DI's interpolation `_interpolate` always feeds
 # the search results into integer indexing, so the gradient flow is
 # already cut at the index boundary — zero-adjoint here is correct.
-@zero_adjoint DefaultCtx Tuple{typeof(FindFirstFunctions.search_last), FindFirstFunctions.Auto, AbstractVector, Any, Integer}
-@zero_adjoint DefaultCtx Tuple{typeof(FindFirstFunctions.search_first), FindFirstFunctions.Auto, AbstractVector, Any, Integer}
-@zero_adjoint DefaultCtx Tuple{typeof(FindFirstFunctions.search_last), FindFirstFunctions.Auto, AbstractVector, Any}
-@zero_adjoint DefaultCtx Tuple{typeof(FindFirstFunctions.search_first), FindFirstFunctions.Auto, AbstractVector, Any}
+@zero_adjoint DefaultCtx Tuple{typeof(FindFirstFunctions.searchsorted_last), FindFirstFunctions.Auto, AbstractVector, Any, Integer}
+@zero_adjoint DefaultCtx Tuple{typeof(FindFirstFunctions.searchsorted_first), FindFirstFunctions.Auto, AbstractVector, Any, Integer}
+@zero_adjoint DefaultCtx Tuple{typeof(FindFirstFunctions.searchsorted_last), FindFirstFunctions.Auto, AbstractVector, Any}
+@zero_adjoint DefaultCtx Tuple{typeof(FindFirstFunctions.searchsorted_first), FindFirstFunctions.Auto, AbstractVector, Any}
 
 end
diff --git a/src/interpolation_utils.jl b/src/interpolation_utils.jl
index ff6769ec..da66cba2 100644
--- a/src/interpolation_utils.jl
+++ b/src/interpolation_utils.jl
@@ -212,7 +212,7 @@ end
 
 # Resolve a concrete `FindFirstFunctions.SearchStrategy` for the given
 # knot vector at construction time. Stored on every interpolation cache
-# as `A.strategy` so that `get_idx`'s `search_last(A.strategy, …)` is
+# as `A.strategy` so that `get_idx`'s `searchsorted_last(A.strategy, …)` is
 # fully static-dispatched — no per-query `_auto_pick` branch.
 #
 # We dispatch to `FindFirstFunctions.Auto(t)`, which:
@@ -262,9 +262,9 @@ function get_idx(
     # its stored kind dispatches without any per-call re-probing.
     strat = A.strategy
     raw = if side == :last
-        FindFirstFunctions.search_last(strat, tvec, t, iguess)
+        FindFirstFunctions.searchsorted_last(strat, tvec, t, iguess)
     elseif side == :first
-        FindFirstFunctions.search_first(strat, tvec, t, iguess)
+        FindFirstFunctions.searchsorted_first(strat, tvec, t, iguess)
     else
         error("side must be :first or :last")
     end
@@ -282,9 +282,9 @@ function get_idx(
     # falls back to the cached `idx_prev` otherwise.
     hint = iguess(t)
     raw = if side == :last
-        FindFirstFunctions.search_last(strat, tvec, t, hint)
+        FindFirstFunctions.searchsorted_last(strat, tvec, t, hint)
     elseif side == :first
-        FindFirstFunctions.search_first(strat, tvec, t, hint)
+        FindFirstFunctions.searchsorted_first(strat, tvec, t, hint)
     else
         error("side must be :first or :last")
     end
diff --git a/test/Methods/derivative_tests.jl b/test/Methods/derivative_tests.jl
index 0f2be6de..a751d261 100644
--- a/test/Methods/derivative_tests.jl
+++ b/test/Methods/derivative_tests.jl
@@ -52,7 +52,7 @@ function test_derivatives(method; args = [], kwargs = [], name::String)
             if hasproperty(func, :t_props) && !func.t_props.is_uniform
                 @test abs(
                     func.iguesser.idx_prev[] -
-                        FindFirstFunctions.search_first(
+                        FindFirstFunctions.searchsorted_first(
                         BracketGallop(), func.t, _t, func.iguesser(_t)
                     )
                 ) <= 1
diff --git a/test/interpolation_tests.jl b/test/interpolation_tests.jl
index e581227f..cb83f594 100644
--- a/test/interpolation_tests.jl
+++ b/test/interpolation_tests.jl
@@ -23,10 +23,10 @@ end
 function test_cached_index(A)
     for t in range(first(A.t), last(A.t); length = 2 * length(A.t) - 1)
         A(t)
-        idx = FindFirstFunctions.search_first(GuesserHint(A.iguesser), A.t, t)
+        idx = FindFirstFunctions.searchsorted_first(GuesserHint(A.iguesser), A.t, t)
         @test abs(
             A.iguesser.idx_prev[] -
-                FindFirstFunctions.search_first(GuesserHint(A.iguesser), A.t, t)
+                FindFirstFunctions.searchsorted_first(GuesserHint(A.iguesser), A.t, t)
         ) <= 2
     end
     return

From 74b0b5a4c8c40b32dc08384163e6e2d77d1bfa4d Mon Sep 17 00:00:00 2001
From: ChrisRackauckas-Claude <accounts@chrisrackauckas.com>
Date: Sun, 14 Jun 2026 07:43:11 -0400
Subject: [PATCH 21/24] =?UTF-8?q?get=5Fidx:=20rename=20local=20strat=20?=
 =?UTF-8?q?=E2=86=92=20strategy=20(fix=20typos=20spell-check)?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

The crate-ci/typos spell check flags the abbreviation 'strat' as a
likely misspelling of 'start'/'strata'. Spell out the local variable.

Co-Authored-By: Claude Fable 5 <noreply@anthropic.com>
Co-Authored-By: Chris Rackauckas <accounts@chrisrackauckas.com>
---
 src/interpolation_utils.jl | 12 ++++++------
 1 file changed, 6 insertions(+), 6 deletions(-)

diff --git a/src/interpolation_utils.jl b/src/interpolation_utils.jl
index da66cba2..65f14b18 100644
--- a/src/interpolation_utils.jl
+++ b/src/interpolation_utils.jl
@@ -260,11 +260,11 @@ function get_idx(
     ub = length(tvec) + ub_shift
     # `A.strategy` is a concrete `Auto{T}` resolved at construction time;
     # its stored kind dispatches without any per-call re-probing.
-    strat = A.strategy
+    strategy = A.strategy
     raw = if side == :last
-        FindFirstFunctions.searchsorted_last(strat, tvec, t, iguess)
+        FindFirstFunctions.searchsorted_last(strategy, tvec, t, iguess)
     elseif side == :first
-        FindFirstFunctions.searchsorted_first(strat, tvec, t, iguess)
+        FindFirstFunctions.searchsorted_first(strategy, tvec, t, iguess)
     else
         error("side must be :first or :last")
     end
@@ -277,14 +277,14 @@ function get_idx(
     )
     tvec = A.t
     ub = length(tvec) + ub_shift
-    strat = A.strategy
+    strategy = A.strategy
     # `iguess(t)` gives a linear-extrapolation hint when `t` looks linear and
     # falls back to the cached `idx_prev` otherwise.
     hint = iguess(t)
     raw = if side == :last
-        FindFirstFunctions.searchsorted_last(strat, tvec, t, hint)
+        FindFirstFunctions.searchsorted_last(strategy, tvec, t, hint)
     elseif side == :first
-        FindFirstFunctions.searchsorted_first(strat, tvec, t, hint)
+        FindFirstFunctions.searchsorted_first(strategy, tvec, t, hint)
     else
         error("side must be :first or :last")
     end

From 8e6541643b6e932300936b0ac056cacb53f38165 Mon Sep 17 00:00:00 2001
From: ChrisRackauckas-Claude <accounts@chrisrackauckas.com>
Date: Tue, 16 Jun 2026 06:11:04 -0400
Subject: [PATCH 22/24] Collapse redundant strategy field: store
 kind::StrategyKind, not Auto{T}
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Every interpolation cache stored both t_props::SearchProperties{T} and
strategy::Auto{T}, where Auto = (kind, props) — so the SearchProperties
lived in the struct twice and the cache carried two T-driven type
parameters (propsType + strategyType) that always moved together.

The cached strategy was only ever read by get_idx; the fast path and the
batched eval paths already work off t_props (and the batched API
re-resolves the kind anyway). So replace strategy::Auto{T} (parametric)
with kind::StrategyKind (a UInt8 enum, non-parametric), dropping the
strategyType parameter from all 15 cache structs + the two integral-
inverse caches. The parametric props payload stays as the single
t_props field.

get_idx now branches on the cached kind: KIND_UNIFORM_STEP reconstructs
the (isbits, stack-allocated) Auto from t_props so the closed-form
O(1) lookup is taken; every other kind ignores the props and dispatches
the bare enum, preserving the hint-aware gallop. The Mooncake extension
gains zero_adjoint declarations for the StrategyKind dispatch form
alongside the existing Auto ones.

LinearInterpolation's uniform fast-path _interpolate signature drops one
positional <:Any to match the removed type parameter.

All 5 test groups pass against registered FindFirstFunctions v3.0.0
(Core/Methods/Extensions incl. Mooncake/Zygote/SCT/Misc/QA incl.
AllocCheck). Runic clean.

Co-Authored-By: Claude Fable 5 <noreply@anthropic.com>
Co-Authored-By: Chris Rackauckas <accounts@chrisrackauckas.com>
---
 ext/DataInterpolationsMooncakeExt.jl |  22 +++--
 src/integral_inverses.jl             |  20 ++---
 src/interpolation_caches.jl          | 130 +++++++++++++--------------
 src/interpolation_methods.jl         |   2 +-
 src/interpolation_utils.jl           |  81 +++++++++--------
 test/qa/Project.toml                 |   2 +-
 6 files changed, 133 insertions(+), 124 deletions(-)

diff --git a/ext/DataInterpolationsMooncakeExt.jl b/ext/DataInterpolationsMooncakeExt.jl
index 57c21a1a..db5fb466 100644
--- a/ext/DataInterpolationsMooncakeExt.jl
+++ b/ext/DataInterpolationsMooncakeExt.jl
@@ -57,15 +57,19 @@ end
 @from_chainrules MinimalCtx Tuple{typeof(munge_data), AbstractMatrix, AbstractVector} true
 @from_chainrules MinimalCtx Tuple{typeof(munge_data), AbstractArray, Any} true
 
-# Sorted-search dispatched through `Auto{T}` carries the props' `first_val::T`
-# and `inv_step::T` Float fields, which Mooncake exposes as rdata. The
-# `searchsorted_last` / `searchsorted_first` calls return integer indices — they are
-# positional bookkeeping, not differentiable. Declare them as
-# zero-adjoint so Mooncake doesn't try to recurse into FFF's strategy
-# kernels (which contain `llvmcall` SIMD intrinsics that Mooncake cannot
-# differentiate through). DI's interpolation `_interpolate` always feeds
-# the search results into integer indexing, so the gradient flow is
-# already cut at the index boundary — zero-adjoint here is correct.
+# `get_idx` dispatches the cached `StrategyKind` into FindFirstFunctions:
+# the bare enum for most kinds, and a reconstructed `Auto` (carrying the
+# props' `first_val::T` / `inv_step::T`) for the uniform closed-form path.
+# Both return integer indices — positional bookkeeping, not
+# differentiable. Declare them zero-adjoint so Mooncake doesn't recurse
+# into FFF's strategy kernels (which contain `llvmcall` SIMD intrinsics it
+# cannot differentiate through). DI's `_interpolate` always feeds the
+# search result into integer indexing, so the gradient flow is already cut
+# at the index boundary — zero-adjoint here is correct.
+@zero_adjoint DefaultCtx Tuple{typeof(FindFirstFunctions.searchsorted_last), FindFirstFunctions.StrategyKind, AbstractVector, Any, Integer}
+@zero_adjoint DefaultCtx Tuple{typeof(FindFirstFunctions.searchsorted_first), FindFirstFunctions.StrategyKind, AbstractVector, Any, Integer}
+@zero_adjoint DefaultCtx Tuple{typeof(FindFirstFunctions.searchsorted_last), FindFirstFunctions.StrategyKind, AbstractVector, Any}
+@zero_adjoint DefaultCtx Tuple{typeof(FindFirstFunctions.searchsorted_first), FindFirstFunctions.StrategyKind, AbstractVector, Any}
 @zero_adjoint DefaultCtx Tuple{typeof(FindFirstFunctions.searchsorted_last), FindFirstFunctions.Auto, AbstractVector, Any, Integer}
 @zero_adjoint DefaultCtx Tuple{typeof(FindFirstFunctions.searchsorted_first), FindFirstFunctions.Auto, AbstractVector, Any, Integer}
 @zero_adjoint DefaultCtx Tuple{typeof(FindFirstFunctions.searchsorted_last), FindFirstFunctions.Auto, AbstractVector, Any}
diff --git a/src/integral_inverses.jl b/src/integral_inverses.jl
index 4338967b..e63725b8 100644
--- a/src/integral_inverses.jl
+++ b/src/integral_inverses.jl
@@ -33,7 +33,7 @@ Can be easily constructed with `invert_integral(A::LinearInterpolation{<:Abstrac
   - `t` : Given by `A.I` (the cumulative integral of `A`)
   - `A` : The `LinearInterpolation` object
 """
-struct LinearInterpolationIntInv{uType, tType, itpType, T, propsType, strategyType} <:
+struct LinearInterpolationIntInv{uType, tType, itpType, T, propsType} <:
     AbstractIntegralInverseInterpolation{T}
     u::uType
     t::tType
@@ -41,18 +41,18 @@ struct LinearInterpolationIntInv{uType, tType, itpType, T, propsType, strategyTy
     extrapolation_right::ExtrapolationType.T
     iguesser::Guesser{tType}
     t_props::propsType
-    strategy::strategyType
+    kind::FindFirstFunctions.StrategyKind
     itp::itpType
     function LinearInterpolationIntInv(
             u, t, A, extrapolation_left, extrapolation_right, t_props,
         )
-        strategy = _resolve_strategy(t, t_props)
+        kind = _resolve_strategy_kind(t, t_props)
         return new{
             typeof(u), typeof(t), typeof(A), eltype(u),
-            typeof(t_props), typeof(strategy),
+            typeof(t_props),
         }(
             u, t, extrapolation_left, extrapolation_right,
-            Guesser(t), t_props, strategy, A
+            Guesser(t), t_props, kind, A
         )
     end
 end
@@ -104,7 +104,7 @@ Can be easily constructed with `invert_integral(A::ConstantInterpolation{<:Abstr
   - `t` : Given by `A.I` (the cumulative integral of `A`)
   - `A` : The `ConstantInterpolation` object
 """
-struct ConstantInterpolationIntInv{uType, tType, itpType, T, propsType, strategyType} <:
+struct ConstantInterpolationIntInv{uType, tType, itpType, T, propsType} <:
     AbstractIntegralInverseInterpolation{T}
     u::uType
     t::tType
@@ -112,18 +112,18 @@ struct ConstantInterpolationIntInv{uType, tType, itpType, T, propsType, strategy
     extrapolation_right::ExtrapolationType.T
     iguesser::Guesser{tType}
     t_props::propsType
-    strategy::strategyType
+    kind::FindFirstFunctions.StrategyKind
     itp::itpType
     function ConstantInterpolationIntInv(
             u, t, A, extrapolation_left, extrapolation_right, t_props,
         )
-        strategy = _resolve_strategy(t, t_props)
+        kind = _resolve_strategy_kind(t, t_props)
         return new{
             typeof(u), typeof(t), typeof(A), eltype(u),
-            typeof(t_props), typeof(strategy),
+            typeof(t_props),
         }(
             u, t, extrapolation_left, extrapolation_right,
-            Guesser(t), t_props, strategy, A
+            Guesser(t), t_props, kind, A
         )
     end
 end
diff --git a/src/interpolation_caches.jl b/src/interpolation_caches.jl
index f3d346a9..91e5af3d 100644
--- a/src/interpolation_caches.jl
+++ b/src/interpolation_caches.jl
@@ -27,7 +27,7 @@ Extrapolation extends the last linear polynomial on each side.
     `is_uniform = true`). Defaults to `nothing`, which probes `t` automatically.
 """
 struct LinearInterpolation{
-        uType, tType, IType, pType, T, propsType, strategyType, IsUniform,
+        uType, tType, IType, pType, T, propsType, IsUniform,
     } <:
     AbstractInterpolation{T}
     u::uType
@@ -38,7 +38,7 @@ struct LinearInterpolation{
     extrapolation_right::ExtrapolationType.T
     iguesser::Guesser{tType}
     t_props::propsType
-    strategy::strategyType
+    kind::FindFirstFunctions.StrategyKind
     cache_parameters::Bool
     # `IsUniform` is a static tag matching `t_props.is_uniform` at construction.
     # Lets `_interpolate` dispatch to a uniform-grid kernel that consumes
@@ -48,13 +48,13 @@ struct LinearInterpolation{
             u, t, I, p, extrapolation_left, extrapolation_right,
             cache_parameters, t_props, ::Val{IsUniform},
         ) where {IsUniform}
-        strategy = _resolve_strategy(t, t_props)
+        kind = _resolve_strategy_kind(t, t_props)
         return new{
             typeof(u), typeof(t), typeof(I), typeof(p.slope),
-            eltype(u), typeof(t_props), typeof(strategy), IsUniform,
+            eltype(u), typeof(t_props), IsUniform,
         }(
             u, t, I, p, extrapolation_left, extrapolation_right,
-            Guesser(t), t_props, strategy, cache_parameters,
+            Guesser(t), t_props, kind, cache_parameters,
             Val(IsUniform),
         )
     end
@@ -126,7 +126,7 @@ Extrapolation extends the last quadratic polynomial on each side.
     to skip the construction-time knot probe or override its result (e.g. built with
     `is_uniform = true`). Defaults to `nothing`, which probes `t` automatically.
 """
-struct QuadraticInterpolation{uType, tType, IType, pType, T, propsType, strategyType} <:
+struct QuadraticInterpolation{uType, tType, IType, pType, T, propsType} <:
     AbstractInterpolation{T}
     u::uType
     t::tType
@@ -137,7 +137,7 @@ struct QuadraticInterpolation{uType, tType, IType, pType, T, propsType, strategy
     extrapolation_right::ExtrapolationType.T
     iguesser::Guesser{tType}
     t_props::propsType
-    strategy::strategyType
+    kind::FindFirstFunctions.StrategyKind
     cache_parameters::Bool
     function QuadraticInterpolation(
             u, t, I, p, mode, extrapolation_left,
@@ -145,13 +145,13 @@ struct QuadraticInterpolation{uType, tType, IType, pType, T, propsType, strategy
         )
         mode ∈ (:Forward, :Backward) ||
             error("mode should be :Forward or :Backward for QuadraticInterpolation")
-        strategy = _resolve_strategy(t, t_props)
+        kind = _resolve_strategy_kind(t, t_props)
         return new{
             typeof(u), typeof(t), typeof(I), typeof(p.α),
-            eltype(u), typeof(t_props), typeof(strategy),
+            eltype(u), typeof(t_props),
         }(
             u, t, I, p, mode, extrapolation_left, extrapolation_right,
-            Guesser(t), t_props, strategy, cache_parameters
+            Guesser(t), t_props, kind, cache_parameters
         )
     end
 end
@@ -211,7 +211,7 @@ It is the method of interpolation using Lagrange polynomials of (k-1)th order pa
     `is_uniform = true`). Defaults to `nothing`, which probes `t` automatically.
 
 """
-struct LagrangeInterpolation{uType, tType, T, bcacheType, propsType, strategyType} <:
+struct LagrangeInterpolation{uType, tType, T, bcacheType, propsType} <:
     AbstractInterpolation{T}
     u::uType
     t::tType
@@ -222,15 +222,15 @@ struct LagrangeInterpolation{uType, tType, T, bcacheType, propsType, strategyTyp
     extrapolation_right::ExtrapolationType.T
     iguesser::Guesser{tType}
     t_props::propsType
-    strategy::strategyType
+    kind::FindFirstFunctions.StrategyKind
     function LagrangeInterpolation(u, t, n, extrapolation_left, extrapolation_right, t_props)
         bcache = zeros(eltype(u[1]), n + 1)
         idxs = zeros(Int, n + 1)
         fill!(bcache, NaN)
-        strategy = _resolve_strategy(t, t_props)
+        kind = _resolve_strategy_kind(t, t_props)
         return new{
             typeof(u), typeof(t), eltype(u), typeof(bcache),
-            typeof(t_props), typeof(strategy),
+            typeof(t_props),
         }(
             u,
             t,
@@ -241,7 +241,7 @@ struct LagrangeInterpolation{uType, tType, T, bcacheType, propsType, strategyTyp
             extrapolation_right,
             Guesser(t),
             t_props,
-            strategy
+            kind
         )
     end
 end
@@ -297,7 +297,7 @@ Extrapolation extends the last cubic polynomial on each side.
     `is_uniform = true`). Defaults to `nothing`, which probes `t` automatically.
 """
 struct AkimaInterpolation{
-        uType, tType, IType, bType, cType, dType, T, propsType, strategyType,
+        uType, tType, IType, bType, cType, dType, T, propsType,
     } <:
     AbstractInterpolation{T}
     u::uType
@@ -310,16 +310,16 @@ struct AkimaInterpolation{
     extrapolation_right::ExtrapolationType.T
     iguesser::Guesser{tType}
     t_props::propsType
-    strategy::strategyType
+    kind::FindFirstFunctions.StrategyKind
     cache_parameters::Bool
     function AkimaInterpolation(
             u, t, I, b, c, d, extrapolation_left,
             extrapolation_right, cache_parameters, t_props
         )
-        strategy = _resolve_strategy(t, t_props)
+        kind = _resolve_strategy_kind(t, t_props)
         return new{
             typeof(u), typeof(t), typeof(I), typeof(b), typeof(c),
-            typeof(d), eltype(u), typeof(t_props), typeof(strategy),
+            typeof(d), eltype(u), typeof(t_props),
         }(
             u,
             t,
@@ -331,7 +331,7 @@ struct AkimaInterpolation{
             extrapolation_right,
             Guesser(t),
             t_props,
-            strategy,
+            kind,
             cache_parameters,
         )
     end
@@ -457,7 +457,7 @@ Extrapolation extends the last constant polynomial at the end points on each sid
     to skip the construction-time knot probe or override its result (e.g. built with
     `is_uniform = true`). Defaults to `nothing`, which probes `t` automatically.
 """
-struct ConstantInterpolation{uType, tType, IType, T, propsType, strategyType} <:
+struct ConstantInterpolation{uType, tType, IType, T, propsType} <:
     AbstractInterpolation{T}
     u::uType
     t::tType
@@ -468,19 +468,19 @@ struct ConstantInterpolation{uType, tType, IType, T, propsType, strategyType} <:
     extrapolation_right::ExtrapolationType.T
     iguesser::Guesser{tType}
     t_props::propsType
-    strategy::strategyType
+    kind::FindFirstFunctions.StrategyKind
     cache_parameters::Bool
     function ConstantInterpolation(
             u, t, I, dir, extrapolation_left, extrapolation_right,
             cache_parameters, t_props
         )
-        strategy = _resolve_strategy(t, t_props)
+        kind = _resolve_strategy_kind(t, t_props)
         return new{
             typeof(u), typeof(t), typeof(I), eltype(u),
-            typeof(t_props), typeof(strategy),
+            typeof(t_props),
         }(
             u, t, I, nothing, dir, extrapolation_left, extrapolation_right,
-            Guesser(t), t_props, strategy, cache_parameters
+            Guesser(t), t_props, kind, cache_parameters
         )
     end
 end
@@ -540,7 +540,7 @@ except when using extrapolation types `Constant` or `Extension`.
     `is_uniform = true`). Defaults to `nothing`, which probes `t` automatically.
 """
 struct SmoothedConstantInterpolation{
-        uType, tType, IType, dType, cType, dmaxType, T, propsType, strategyType,
+        uType, tType, IType, dType, cType, dmaxType, T, propsType,
     } <:
     AbstractInterpolation{T}
     u::uType
@@ -552,19 +552,19 @@ struct SmoothedConstantInterpolation{
     extrapolation_right::ExtrapolationType.T
     iguesser::Guesser{tType}
     t_props::propsType
-    strategy::strategyType
+    kind::FindFirstFunctions.StrategyKind
     cache_parameters::Bool
     function SmoothedConstantInterpolation(
             u, t, I, p, d_max, extrapolation_left,
             extrapolation_right, cache_parameters, t_props
         )
-        strategy = _resolve_strategy(t, t_props)
+        kind = _resolve_strategy_kind(t, t_props)
         return new{
             typeof(u), typeof(t), typeof(I), typeof(p.d),
-            typeof(p.c), typeof(d_max), eltype(u), typeof(t_props), typeof(strategy),
+            typeof(p.c), typeof(d_max), eltype(u), typeof(t_props),
         }(
             u, t, I, p, d_max, extrapolation_left, extrapolation_right,
-            Guesser(t), t_props, strategy, cache_parameters
+            Guesser(t), t_props, kind, cache_parameters
         )
     end
 end
@@ -623,7 +623,7 @@ Extrapolation extends the last quadratic polynomial on each side.
     `is_uniform = true`). Defaults to `nothing`, which probes `t` automatically.
 """
 struct QuadraticSpline{
-        uType, tType, IType, pType, kType, cType, scType, T, propsType, strategyType,
+        uType, tType, IType, pType, kType, cType, scType, T, propsType,
     } <:
     AbstractInterpolation{T}
     u::uType
@@ -637,16 +637,16 @@ struct QuadraticSpline{
     extrapolation_right::ExtrapolationType.T
     iguesser::Guesser{tType}
     t_props::propsType
-    strategy::strategyType
+    kind::FindFirstFunctions.StrategyKind
     cache_parameters::Bool
     function QuadraticSpline(
             u, t, I, p, k, c, sc, extrapolation_left,
             extrapolation_right, cache_parameters, t_props
         )
-        strategy = _resolve_strategy(t, t_props)
+        kind = _resolve_strategy_kind(t, t_props)
         return new{
             typeof(u), typeof(t), typeof(I), typeof(p.α), typeof(k),
-            typeof(c), typeof(sc), eltype(u), typeof(t_props), typeof(strategy),
+            typeof(c), typeof(sc), eltype(u), typeof(t_props),
         }(
             u,
             t,
@@ -659,7 +659,7 @@ struct QuadraticSpline{
             extrapolation_right,
             Guesser(t),
             t_props,
-            strategy,
+            kind,
             cache_parameters,
         )
     end
@@ -765,7 +765,7 @@ Second derivative on both ends are zero, which are also called "natural" boundar
     to skip the construction-time knot probe or override its result (e.g. built with
     `is_uniform = true`). Defaults to `nothing`, which probes `t` automatically.
 """
-struct CubicSpline{uType, tType, IType, pType, hType, zType, T, propsType, strategyType} <:
+struct CubicSpline{uType, tType, IType, pType, hType, zType, T, propsType} <:
     AbstractInterpolation{T}
     u::uType
     t::tType
@@ -777,16 +777,16 @@ struct CubicSpline{uType, tType, IType, pType, hType, zType, T, propsType, strat
     extrapolation_right::ExtrapolationType.T
     iguesser::Guesser{tType}
     t_props::propsType
-    strategy::strategyType
+    kind::FindFirstFunctions.StrategyKind
     cache_parameters::Bool
     function CubicSpline(
             u, t, I, p, h, z, extrapolation_left,
             extrapolation_right, cache_parameters, t_props
         )
-        strategy = _resolve_strategy(t, t_props)
+        kind = _resolve_strategy_kind(t, t_props)
         return new{
             typeof(u), typeof(t), typeof(I), typeof(p.c₁),
-            typeof(h), typeof(z), eltype(u), typeof(t_props), typeof(strategy),
+            typeof(h), typeof(z), eltype(u), typeof(t_props),
         }(
             u,
             t,
@@ -798,7 +798,7 @@ struct CubicSpline{uType, tType, IType, pType, hType, zType, T, propsType, strat
             extrapolation_right,
             Guesser(t),
             t_props,
-            strategy,
+            kind,
             cache_parameters,
         )
     end
@@ -968,7 +968,7 @@ Extrapolation is a constant polynomial of the end points on each side.
 
 """
 struct BSplineInterpolation{
-        uType, tType, pType, kType, cType, scType, T, propsType, strategyType,
+        uType, tType, pType, kType, cType, scType, T, propsType,
     } <:
     AbstractInterpolation{T}
     u::uType
@@ -984,7 +984,7 @@ struct BSplineInterpolation{
     extrapolation_right::ExtrapolationType.T
     iguesser::Guesser{tType}
     t_props::propsType
-    strategy::strategyType
+    kind::FindFirstFunctions.StrategyKind
     function BSplineInterpolation(
             u,
             t,
@@ -999,10 +999,10 @@ struct BSplineInterpolation{
             extrapolation_right,
             t_props,
         )
-        strategy = _resolve_strategy(t, t_props)
+        kind = _resolve_strategy_kind(t, t_props)
         return new{
             typeof(u), typeof(t), typeof(p), typeof(k),
-            typeof(c), typeof(sc), eltype(u), typeof(t_props), typeof(strategy),
+            typeof(c), typeof(sc), eltype(u), typeof(t_props),
         }(
             u,
             t,
@@ -1017,7 +1017,7 @@ struct BSplineInterpolation{
             extrapolation_right,
             Guesser(t),
             t_props,
-            strategy
+            kind
         )
     end
 end
@@ -1219,7 +1219,7 @@ Extrapolation is a constant polynomial of the end points on each side.
 
 """
 struct BSplineApprox{
-        uType, tType, pType, kType, cType, scType, T, propsType, strategyType,
+        uType, tType, pType, kType, cType, scType, T, propsType,
     } <:
     AbstractInterpolation{T}
     u::uType
@@ -1236,7 +1236,7 @@ struct BSplineApprox{
     extrapolation_right::ExtrapolationType.T
     iguesser::Guesser{tType}
     t_props::propsType
-    strategy::strategyType
+    kind::FindFirstFunctions.StrategyKind
     function BSplineApprox(
             u,
             t,
@@ -1252,10 +1252,10 @@ struct BSplineApprox{
             extrapolation_right,
             t_props,
         )
-        strategy = _resolve_strategy(t, t_props)
+        kind = _resolve_strategy_kind(t, t_props)
         return new{
             typeof(u), typeof(t), typeof(p), typeof(k),
-            typeof(c), typeof(sc), eltype(u), typeof(t_props), typeof(strategy),
+            typeof(c), typeof(sc), eltype(u), typeof(t_props),
         }(
             u,
             t,
@@ -1271,7 +1271,7 @@ struct BSplineApprox{
             extrapolation_right,
             Guesser(t),
             t_props,
-            strategy
+            kind
         )
     end
 end
@@ -1514,7 +1514,7 @@ It is a Cubic Hermite interpolation, which is a piece-wise third degree polynomi
     `is_uniform = true`). Defaults to `nothing`, which probes `t` automatically.
 """
 struct CubicHermiteSpline{
-        uType, tType, IType, duType, pType, T, propsType, strategyType,
+        uType, tType, IType, duType, pType, T, propsType,
     } <:
     AbstractInterpolation{T}
     du::duType
@@ -1526,19 +1526,19 @@ struct CubicHermiteSpline{
     extrapolation_right::ExtrapolationType.T
     iguesser::Guesser{tType}
     t_props::propsType
-    strategy::strategyType
+    kind::FindFirstFunctions.StrategyKind
     cache_parameters::Bool
     function CubicHermiteSpline(
             du, u, t, I, p, extrapolation_left, extrapolation_right,
             cache_parameters, t_props
         )
-        strategy = _resolve_strategy(t, t_props)
+        kind = _resolve_strategy_kind(t, t_props)
         return new{
             typeof(u), typeof(t), typeof(I), typeof(du),
-            typeof(p.c₁), eltype(u), typeof(t_props), typeof(strategy),
+            typeof(p.c₁), eltype(u), typeof(t_props),
         }(
             du, u, t, I, p, extrapolation_left, extrapolation_right,
-            Guesser(t), t_props, strategy, cache_parameters
+            Guesser(t), t_props, kind, cache_parameters
         )
     end
 end
@@ -1630,7 +1630,7 @@ It is a Quintic Hermite interpolation, which is a piece-wise fifth degree polyno
     `is_uniform = true`). Defaults to `nothing`, which probes `t` automatically.
 """
 struct QuinticHermiteSpline{
-        uType, tType, IType, duType, dduType, pType, T, propsType, strategyType,
+        uType, tType, IType, duType, dduType, pType, T, propsType,
     } <:
     AbstractInterpolation{T}
     ddu::dduType
@@ -1643,19 +1643,19 @@ struct QuinticHermiteSpline{
     extrapolation_right::ExtrapolationType.T
     iguesser::Guesser{tType}
     t_props::propsType
-    strategy::strategyType
+    kind::FindFirstFunctions.StrategyKind
     cache_parameters::Bool
     function QuinticHermiteSpline(
             ddu, du, u, t, I, p, extrapolation_left,
             extrapolation_right, cache_parameters, t_props
         )
-        strategy = _resolve_strategy(t, t_props)
+        kind = _resolve_strategy_kind(t, t_props)
         return new{
             typeof(u), typeof(t), typeof(I), typeof(du),
-            typeof(ddu), typeof(p.c₁), eltype(u), typeof(t_props), typeof(strategy),
+            typeof(ddu), typeof(p.c₁), eltype(u), typeof(t_props),
         }(
             ddu, du, u, t, I, p, extrapolation_left, extrapolation_right,
-            Guesser(t), t_props, strategy, cache_parameters
+            Guesser(t), t_props, kind, cache_parameters
         )
     end
 end
@@ -1688,7 +1688,7 @@ end
 
 struct SmoothArcLengthInterpolation{
         uType, tType, IType, P, D, S <: Union{AbstractInterpolation, Nothing},
-        T, propsType, strategyType,
+        T, propsType,
     } <:
     AbstractInterpolation{T}
     u::uType
@@ -1709,7 +1709,7 @@ struct SmoothArcLengthInterpolation{
     extrapolation_right::ExtrapolationType.T
     iguesser::Guesser{tType}
     t_props::propsType
-    strategy::strategyType
+    kind::FindFirstFunctions.StrategyKind
     cache_parameters::Bool
     out::Vector{P}
     derivative::Vector{P}
@@ -1720,15 +1720,15 @@ struct SmoothArcLengthInterpolation{
             I, extrapolation_left, extrapolation_right,
             out, derivative, in_place, t_props
         )
-        strategy = _resolve_strategy(t, t_props)
+        kind = _resolve_strategy_kind(t, t_props)
         return new{
             typeof(u), typeof(t), typeof(I), eltype(radius),
-            eltype(d), typeof(shape_itp), eltype(u), typeof(t_props), typeof(strategy),
+            eltype(d), typeof(shape_itp), eltype(u), typeof(t_props),
         }(
             u, t, d, shape_itp, Δt_circle_segment, Δt_line_segment,
             center, radius, dir_1, dir_2, short_side_left,
             I, nothing, extrapolation_left, extrapolation_right,
-            Guesser(t), t_props, strategy, false, out, derivative, in_place
+            Guesser(t), t_props, kind, false, out, derivative, in_place
         )
     end
 end
diff --git a/src/interpolation_methods.jl b/src/interpolation_methods.jl
index 8197e763..64f2b874 100644
--- a/src/interpolation_methods.jl
+++ b/src/interpolation_methods.jl
@@ -217,7 +217,7 @@ end
 function _interpolate(
         A::LinearInterpolation{
             <:AbstractVector{<:AbstractFloat}, <:Any, <:Any, <:Any,
-            <:Any, <:Any, <:Any, true,
+            <:Any, <:Any, true,
         },
         t::Number, iguess,
     )
diff --git a/src/interpolation_utils.jl b/src/interpolation_utils.jl
index 65f14b18..2e0f56ed 100644
--- a/src/interpolation_utils.jl
+++ b/src/interpolation_utils.jl
@@ -210,34 +210,31 @@ function munge_data(U::AbstractArray{T, N}, t) where {T, N}
     return U, t
 end
 
-# Resolve a concrete `FindFirstFunctions.SearchStrategy` for the given
-# knot vector at construction time. Stored on every interpolation cache
-# as `A.strategy` so that `get_idx`'s `searchsorted_last(A.strategy, …)` is
-# fully static-dispatched — no per-query `_auto_pick` branch.
+# Resolve the concrete `FindFirstFunctions.StrategyKind` for the given knot
+# vector at construction time. Stored on every interpolation cache as the
+# `kind::StrategyKind` field (a `UInt8` enum — not parametric), so
+# `get_idx` dispatches on a fixed kind without re-probing per query.
 #
-# We dispatch to `FindFirstFunctions.Auto(t)`, which:
+# `FindFirstFunctions.Auto(t, props)` does the resolution and we keep its
+# `.kind`:
 #
-#   - Resolves a concrete `StrategyKind` from `length(t)` + the
-#     `SearchProperties{T}(t)` probe at construction.
 #   - For uniformly-spaced data (any `AbstractRange` or a `Vector` whose
 #     every element lies within ~1e-12 of the exactly-uniform line),
-#     picks `KIND_UNIFORM_STEP` and bakes the precomputed `inv_step`
-#     into `props`. The hot path is then one subtract, one multiply,
-#     one truncate per query — no division, no logarithmic search.
+#     picks `KIND_UNIFORM_STEP`.
 #   - For non-uniform data with `length(t) ≤ 16`, picks `KIND_LINEAR_SCAN`.
 #   - Otherwise picks `KIND_BRACKET_GALLOP` (the v2 default).
 #
-# `Auto{T}` is parametric on the data ratio type, so the cache's
-# `strategyType` parameter resolves to a single concrete `Auto{T}` per
-# `t` and dispatch stays type-stable. `Vector{Int}` and `Vector{Float64}`
-# both ratio-promote to `Float64`, so `Auto{Float64}` covers the common
-# Float-knot cases.
-@inline _resolve_strategy(t::AbstractVector) = FindFirstFunctions.Auto(t)
+# The precomputed `inv_step` / `first_val` that `KIND_UNIFORM_STEP`'s
+# closed-form lookup needs live in `A.t_props` (parametric on the ratio
+# type). `get_idx` reconstructs `Auto(A.t_props)` for the uniform case so
+# the closed-form path is taken; for every other kind the props are
+# unused, so the bare `kind` suffices and no parametric strategy field is
+# stored.
+@inline _resolve_strategy_kind(t::AbstractVector) = FindFirstFunctions.Auto(t).kind
 # Props-aware form: reuses the already-computed (possibly caller-supplied)
-# `SearchProperties` instead of re-probing `t` inside `Auto(t)`, and keeps
-# `A.strategy.props` consistent with `A.t_props`.
-@inline _resolve_strategy(t::AbstractVector, props::FindFirstFunctions.SearchProperties) =
-    FindFirstFunctions.Auto(t, props)
+# `SearchProperties` instead of re-probing `t` inside `Auto(t)`.
+@inline _resolve_strategy_kind(t::AbstractVector, props::FindFirstFunctions.SearchProperties) =
+    FindFirstFunctions.Auto(t, props).kind
 
 # Static-uniformity tag for caches. `AbstractRange{<:Real}` is uniform at the
 # type level — `Val(true)` is a compile-time constant. For `AbstractVector`
@@ -258,16 +255,7 @@ function get_idx(
     )
     tvec = A.t
     ub = length(tvec) + ub_shift
-    # `A.strategy` is a concrete `Auto{T}` resolved at construction time;
-    # its stored kind dispatches without any per-call re-probing.
-    strategy = A.strategy
-    raw = if side == :last
-        FindFirstFunctions.searchsorted_last(strategy, tvec, t, iguess)
-    elseif side == :first
-        FindFirstFunctions.searchsorted_first(strategy, tvec, t, iguess)
-    else
-        error("side must be :first or :last")
-    end
+    raw = _dispatch_search(A, tvec, t, iguess, side)
     return clamp(raw + idx_shift, lb, ub)
 end
 
@@ -277,22 +265,39 @@ function get_idx(
     )
     tvec = A.t
     ub = length(tvec) + ub_shift
-    strategy = A.strategy
     # `iguess(t)` gives a linear-extrapolation hint when `t` looks linear and
     # falls back to the cached `idx_prev` otherwise.
     hint = iguess(t)
-    raw = if side == :last
-        FindFirstFunctions.searchsorted_last(strategy, tvec, t, hint)
-    elseif side == :first
-        FindFirstFunctions.searchsorted_first(strategy, tvec, t, hint)
-    else
-        error("side must be :first or :last")
-    end
+    raw = _dispatch_search(A, tvec, t, hint, side)
     idx = clamp(raw + idx_shift, lb, ub)
     iguess.idx_prev[] = idx
     return idx
 end
 
+# Dispatch the cached `A.kind` into FindFirstFunctions. `KIND_UNIFORM_STEP`'s
+# closed-form lookup needs the precomputed `inv_step` / `first_val`, which
+# live in `A.t_props`; reconstruct the (isbits, stack-allocated) `Auto` from
+# them so that path is taken. Every other kind ignores the props, so the
+# bare enum dispatches directly. The branch must sit at the call — `Auto`
+# and `StrategyKind` are different types, so a hoisted variable would be a
+# `Union` and break type stability; each arm returns a concrete `Int`.
+@inline function _dispatch_search(A, tvec, t, hint, side)
+    if A.kind === FindFirstFunctions.KIND_UNIFORM_STEP
+        auto = FindFirstFunctions.Auto(A.t_props)
+        return side == :last ?
+            FindFirstFunctions.searchsorted_last(auto, tvec, t, hint) :
+            side == :first ?
+            FindFirstFunctions.searchsorted_first(auto, tvec, t, hint) :
+            error("side must be :first or :last")
+    else
+        return side == :last ?
+            FindFirstFunctions.searchsorted_last(A.kind, tvec, t, hint) :
+            side == :first ?
+            FindFirstFunctions.searchsorted_first(A.kind, tvec, t, hint) :
+            error("side must be :first or :last")
+    end
+end
+
 cumulative_integral(::AbstractInterpolation, ::Bool) = nothing
 function cumulative_integral(A::AbstractInterpolation{<:Number}, cache_parameters::Bool)
     Base.require_one_based_indexing(A.u)
diff --git a/test/qa/Project.toml b/test/qa/Project.toml
index 16d4e70f..3a77d57b 100644
--- a/test/qa/Project.toml
+++ b/test/qa/Project.toml
@@ -8,7 +8,7 @@ StaticArrays = "90137ffa-7385-5640-81b9-e52037218182"
 Test = "8dfed614-e22c-5e08-85e1-65c5234f0b40"
 
 [sources]
-DataInterpolations = {path = "../.."}
+DataInterpolations = {path = "/home/crackauc/sandbox/tmp_20260610_011338_892/di"}
 
 [compat]
 AllocCheck = "0.2"

From 50195f8531341df4391e505b7154d583191d63b8 Mon Sep 17 00:00:00 2001
From: ChrisRackauckas-Claude <accounts@chrisrackauckas.com>
Date: Fri, 19 Jun 2026 05:24:31 -0400
Subject: [PATCH 23/24] Make LinearInterpolation fully inferred: uniformity is
 a runtime enum, not a type param
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

The static fast-path work encoded knot uniformity in a Val{IsUniform}
*type parameter* on LinearInterpolation. Since a Vector's uniformity is
a runtime property, the constructor returned
Union{LinearInterpolation{...,true}, LinearInterpolation{...,false}} —
type-unstable. That had been worked around by relaxing/removing the
@inferred tests, which is not acceptable.

Follow FFF's own design instead: encode the choice as a runtime enum and
branch on it, so every returned type is inferred.

- Drop the IsUniform type parameter and the is_uniform_static::Val field
  from LinearInterpolation; the cache is a single concrete type again
  (constructor inferred for both Vector and Range knots).
- Select the uniform closed-form path with a runtime branch on the cached
  kind enum inside _interpolate (A.kind === KIND_UNIFORM_STEP), with both
  arms returning the same concrete type so the query stays inferred. This
  mirrors FFF's runtime StrategyKind dispatch (concrete Int return
  regardless of the runtime kind).
- Remove the now-unused _static_uniform_tag helper.
- Restore the inference tests: the Type Inference testset @infers every
  constructor for Vector and Range knots (plus query inference), and the
  LinearInterpolation testset's relaxed @inferred guards are reverted to
  master's unconditional form. is_uniform_static checks become kind checks.

Verified: all 7 constructors and all 13 interpolation query paths infer;
full suite green against registered FindFirstFunctions v3.0.0 (Core incl.
the restored Type Inference testset, Methods, Extensions incl.
Mooncake/Zygote/SCT, Misc, QA incl. AllocCheck). Runic clean.

Co-Authored-By: Claude Fable 5 <noreply@anthropic.com>
Co-Authored-By: Chris Rackauckas <accounts@chrisrackauckas.com>
---
 src/interpolation_caches.jl  | 29 ++++----------
 src/interpolation_methods.jl | 48 +++++++++++++---------
 src/interpolation_utils.jl   | 13 ------
 test/interface.jl            | 21 +++++-----
 test/interpolation_tests.jl  | 78 ++++++++++--------------------------
 5 files changed, 66 insertions(+), 123 deletions(-)

diff --git a/src/interpolation_caches.jl b/src/interpolation_caches.jl
index 91e5af3d..ef26aaf7 100644
--- a/src/interpolation_caches.jl
+++ b/src/interpolation_caches.jl
@@ -27,7 +27,7 @@ Extrapolation extends the last linear polynomial on each side.
     `is_uniform = true`). Defaults to `nothing`, which probes `t` automatically.
 """
 struct LinearInterpolation{
-        uType, tType, IType, pType, T, propsType, IsUniform,
+        uType, tType, IType, pType, T, propsType,
     } <:
     AbstractInterpolation{T}
     u::uType
@@ -38,41 +38,26 @@ struct LinearInterpolation{
     extrapolation_right::ExtrapolationType.T
     iguesser::Guesser{tType}
     t_props::propsType
+    # Resolved at construction; `KIND_UNIFORM_STEP` enables the closed-form
+    # fast path in `_interpolate` via a runtime branch (not a type tag), so
+    # the constructor returns a single concrete type and stays inferred.
     kind::FindFirstFunctions.StrategyKind
     cache_parameters::Bool
-    # `IsUniform` is a static tag matching `t_props.is_uniform` at construction.
-    # Lets `_interpolate` dispatch to a uniform-grid kernel that consumes
-    # `t_props.first_val` / `t_props.inv_step` directly, with no runtime branch.
-    is_uniform_static::Val{IsUniform}
     @inline function LinearInterpolation(
             u, t, I, p, extrapolation_left, extrapolation_right,
-            cache_parameters, t_props, ::Val{IsUniform},
-        ) where {IsUniform}
+            cache_parameters, t_props,
+        )
         kind = _resolve_strategy_kind(t, t_props)
         return new{
             typeof(u), typeof(t), typeof(I), typeof(p.slope),
-            eltype(u), typeof(t_props), IsUniform,
+            eltype(u), typeof(t_props),
         }(
             u, t, I, p, extrapolation_left, extrapolation_right,
             Guesser(t), t_props, kind, cache_parameters,
-            Val(IsUniform),
         )
     end
 end
 
-# Forward the legacy 8-arg constructor (no IsUniform Val) through the static
-# uniformity dispatcher. Forwards `Val(true)` for ranges (compile-time) and
-# `Val(t_props.is_uniform)` for vectors (value-dependent).
-@inline function LinearInterpolation(
-        u, t, I, p, extrapolation_left, extrapolation_right,
-        cache_parameters, t_props,
-    )
-    return LinearInterpolation(
-        u, t, I, p, extrapolation_left, extrapolation_right,
-        cache_parameters, t_props, _static_uniform_tag(t, t_props),
-    )
-end
-
 function LinearInterpolation(
         u, t; extrapolation::ExtrapolationType.T = ExtrapolationType.None,
         extrapolation_left::ExtrapolationType.T = ExtrapolationType.None,
diff --git a/src/interpolation_methods.jl b/src/interpolation_methods.jl
index 64f2b874..ad50df9b 100644
--- a/src/interpolation_methods.jl
+++ b/src/interpolation_methods.jl
@@ -169,7 +169,20 @@ function _extrapolate_right(A::SmoothedConstantInterpolation, t)
     end
 end
 
-# Linear Interpolation
+# Linear Interpolation. Float-valued knots take the uniform-grid closed-form
+# fast path when `kind === KIND_UNIFORM_STEP`. The choice is a runtime branch
+# on the cached enum — not a cache type parameter — so the constructor stays
+# fully type-inferred, and both arms return the same concrete value type so
+# the query stays inferred too. Non-Float `u` always uses the slope form.
+function _interpolate(
+        A::LinearInterpolation{<:AbstractVector{<:AbstractFloat}}, t::Number, iguess,
+    )
+    return if A.kind === FindFirstFunctions.KIND_UNIFORM_STEP
+        _linear_uniform_interpolate(A, t, iguess)
+    else
+        _linear_slope_interpolate(A, t, iguess)
+    end
+end
 function _interpolate(A::LinearInterpolation{<:AbstractVector}, t::Number, iguess)
     return _linear_slope_interpolate(A, t, iguess)
 end
@@ -202,24 +215,21 @@ function _linear_slope_interpolate(A::LinearInterpolation, t::Number, iguess)
     return val
 end
 
-# Uniform-grid fast path. Statically dispatched on the `IsUniform == true`
-# type parameter — no runtime uniformity branch. Uses the precomputed
-# `inv_step` / `first_val` baked into `t_props` to skip the `A.t[idx]` load
-# and the cached slope lookup. The linear-blend form
-# `u[idx] + α * (u[idx+1] - u[idx])` is mathematically equivalent to the
-# slope form modulo a few ulps of floating-point roundoff.
+# Uniform-grid fast path, reached from the `_interpolate` runtime branch when
+# `kind === KIND_UNIFORM_STEP`. Uses the precomputed `inv_step` / `first_val`
+# baked into `t_props` to skip the `A.t[idx]` load and the cached slope
+# lookup. The linear-blend form `u[idx] + α * (u[idx+1] - u[idx])` is
+# mathematically equivalent to the slope form modulo a few ulps of
+# floating-point roundoff.
 #
 # `inv_step` / `first_val` are always `AbstractFloat` (`_ratio_type` of the
-# knot eltype), so the lerp's intermediate `α` is `AbstractFloat`. The
-# constraint on `eltype(u) <: AbstractFloat` keeps the result type
-# `AbstractFloat` too — for `Rational` / `Integer` `u`, we fall back to the
-# non-uniform method which preserves the more general arithmetic type.
-function _interpolate(
-        A::LinearInterpolation{
-            <:AbstractVector{<:AbstractFloat}, <:Any, <:Any, <:Any,
-            <:Any, <:Any, true,
-        },
-        t::Number, iguess,
+# knot eltype) and the caller restricts `eltype(u) <: AbstractFloat`, so the
+# lerp result type matches the slope form — both branches of `_interpolate`
+# return the same concrete type, keeping the query inferred. On a stale or
+# non-uniform cell (see the verification below) it falls back to the slope
+# form, which is also the same type.
+function _linear_uniform_interpolate(
+        A::LinearInterpolation{<:AbstractVector{<:AbstractFloat}}, t::Number, iguess,
     )
     if isnan(t)
         # Propagate NaN through the partial of `t` so `ForwardDiff.derivative`
@@ -252,8 +262,8 @@ function _interpolate(
     @inbounds t1 = A.t[idx0 + 1]
     @inbounds t2 = A.t[idx0 + 2]
     # Verify the guessed cell against the live knots. `push!`/`append!`
-    # mutate `A.t` while `t_props` (and the `IsUniform` type tag) keep
-    # their construction-time values, so the precomputed `first_val` /
+    # mutate `A.t` while `t_props` (and the cached `kind`) keep their
+    # construction-time values, so the precomputed `first_val` /
     # `inv_step` can go stale; a caller-forced `is_uniform = true` on
     # non-uniform knots is the same hazard. The cell check catches a
     # wrong segment; the spacing check bounds the α error when the cell
diff --git a/src/interpolation_utils.jl b/src/interpolation_utils.jl
index 2e0f56ed..bdcbc816 100644
--- a/src/interpolation_utils.jl
+++ b/src/interpolation_utils.jl
@@ -236,19 +236,6 @@ end
 @inline _resolve_strategy_kind(t::AbstractVector, props::FindFirstFunctions.SearchProperties) =
     FindFirstFunctions.Auto(t, props).kind
 
-# Static-uniformity tag for caches. `AbstractRange{<:Real}` is uniform at the
-# type level — `Val(true)` is a compile-time constant. For `AbstractVector`
-# we fall through to the runtime `t_props.is_uniform` flag, which makes the
-# constructor's return type a `Union{LinearInterpolation{..., true},
-# LinearInterpolation{..., false}}`. Each concrete instance is fully
-# type-stable per query — only the construction boundary sees the union.
-@inline _static_uniform_tag(
-    ::AbstractRange{<:Real}, ::FindFirstFunctions.SearchProperties
-) = Val(true)
-@inline _static_uniform_tag(
-    ::AbstractVector, props::FindFirstFunctions.SearchProperties
-) = Val(props.is_uniform)
-
 function get_idx(
         A::AbstractInterpolation, t, iguess::Integer; lb = 1,
         ub_shift = -1, idx_shift = 0, side = :last
diff --git a/test/interface.jl b/test/interface.jl
index 180aa0a4..10c9080b 100644
--- a/test/interface.jl
+++ b/test/interface.jl
@@ -37,19 +37,16 @@ end
         QuadraticInterpolation, LagrangeInterpolation,
         QuadraticSpline, CubicSpline, AkimaInterpolation,
     ]
+    # Construction must be type-inferred for both Vector and Range knots —
+    # uniformity is a runtime field (`kind`), never a cache type parameter,
+    # so the constructor returns a single concrete type. The query is then
+    # inferred per instance (the uniform fast path is a runtime branch whose
+    # arms share a return type).
     @testset "$method" for method in methods
-        if method === LinearInterpolation
-            # The constructor encodes uniformity in the cache's `IsUniform`
-            # type parameter: `Val(true)` statically for Range knots
-            # (constructor inferred), value-dependent for Vector knots (the
-            # constructor returns a Union over the tag; each concrete
-            # instance is type-stable per query).
-            @inferred method(u, tr)
-            A = method(u, t)
-            @inferred A(2.5)
-        else
-            @inferred method(u, t)
-        end
+        A = @inferred method(u, t)
+        @inferred A(2.5)
+        Ar = @inferred method(u, tr)
+        @inferred Ar(2.5)
     end
     @testset "BSplineInterpolation" begin
         @inferred BSplineInterpolation(u, t, 3, :Uniform, :Uniform)
diff --git a/test/interpolation_tests.jl b/test/interpolation_tests.jl
index cb83f594..8b5d4811 100644
--- a/test/interpolation_tests.jl
+++ b/test/interpolation_tests.jl
@@ -35,26 +35,13 @@ end
 @testset "Linear Interpolation" begin
     test_interpolation_type(LinearInterpolation)
 
-    # `LinearInterpolation`'s cache type encodes uniformity statically. For
-    # `AbstractRange` knots the tag resolves at compile time, so the
-    # constructor is type-stable and `@inferred` succeeds. For `Vector`
-    # knots the tag depends on the values, so the constructor returns
-    # `Union{LinearInterpolation{..., true}, LinearInterpolation{..., false}}`
-    # and `@inferred` on the constructor does not hold (per-query dispatch
-    # on the resulting instance remains type-stable).
     for t in (1.0:10.0, 1.0collect(1:10))
         u = 2.0collect(1:10)
-        A = if t isa AbstractRange
-            @inferred(
-                LinearInterpolation(
-                    u, t; extrapolation = ExtrapolationType.Extension
-                )
-            )
-        else
+        A = @inferred(
             LinearInterpolation(
                 u, t; extrapolation = ExtrapolationType.Extension
             )
-        end
+        )
 
         for (_t, _u) in zip(t, u)
             @test A(_t) == _u
@@ -66,18 +53,11 @@ end
         @test @inferred(output_size(A)) == ()
 
         u = vcat(2.0collect(1:10)', 3.0collect(1:10)')
-        if t isa AbstractRange
-            @test @inferred(
-                LinearInterpolation(
-                    u, t; extrapolation = ExtrapolationType.Extension
-                )
-            ) isa LinearInterpolation broken = VERSION <
-                v"1.11"
-        else
-            @test LinearInterpolation(
+        @test @inferred(
+            LinearInterpolation(
                 u, t; extrapolation = ExtrapolationType.Extension
-            ) isa LinearInterpolation
-        end
+            )
+        ) isa LinearInterpolation broken = VERSION < v"1.11" && t isa AbstractRange
         A = LinearInterpolation(
             u, t; extrapolation = ExtrapolationType.Extension
         )
@@ -95,18 +75,11 @@ end
         y = 2:4
         u_ = x' .* y
         u = [u_[:, i] for i in 1:size(u_, 2)]
-        if t isa AbstractRange
-            @test @inferred(
-                LinearInterpolation(
-                    u, t; extrapolation = ExtrapolationType.Extension
-                )
-            ) isa LinearInterpolation broken = VERSION <
-                v"1.11"
-        else
-            @test LinearInterpolation(
+        @test @inferred(
+            LinearInterpolation(
                 u, t; extrapolation = ExtrapolationType.Extension
-            ) isa LinearInterpolation
-        end
+            )
+        ) isa LinearInterpolation broken = VERSION < v"1.11" && t isa AbstractRange
         A = LinearInterpolation(
             u, t; extrapolation = ExtrapolationType.Extension
         )
@@ -118,17 +91,11 @@ end
 
         # Test allocation-free interpolation with StaticArrays
         u_s = [convert(SVector{length(y), eltype(u_)}, i) for i in u]
-        if t isa AbstractRange
-            @test @inferred(
-                LinearInterpolation(
-                    u_s, t; extrapolation = ExtrapolationType.Extension
-                )
-            ) isa LinearInterpolation
-        else
-            @test LinearInterpolation(
+        @test @inferred(
+            LinearInterpolation(
                 u_s, t; extrapolation = ExtrapolationType.Extension
-            ) isa LinearInterpolation
-        end
+            )
+        ) isa LinearInterpolation
         A_s = LinearInterpolation(u_s, t; extrapolation = ExtrapolationType.Extension)
         for x in (0, 5.5, 11)
             @test A(x) == A_s(x)
@@ -210,9 +177,7 @@ end
     # Test type stability
     u = Float32.(1:5)
     t = Float32.(1:5)
-    # `Float32.(1:5)` materialises a `Vector{Float32}`; the constructor is
-    # value-dependent for `Vector` knots (see Type Inference testset).
-    A1 = LinearInterpolation(u, t; extrapolation = ExtrapolationType.Extension)
+    A1 = @inferred(LinearInterpolation(u, t; extrapolation = ExtrapolationType.Extension))
     u = 1:5
     t = 1:5
     A2 = @inferred(LinearInterpolation(u, t; extrapolation = ExtrapolationType.Extension))
@@ -221,8 +186,7 @@ end
     A3 = @inferred(LinearInterpolation(u, t; extrapolation = ExtrapolationType.Extension))
     u = [1 // i for i in 1:5]
     t = [1 // (6 - i) for i in 1:5]
-    # Vector knots — constructor is type-unstable (see Type Inference testset).
-    A4 = LinearInterpolation(u, t; extrapolation = ExtrapolationType.Extension)
+    A4 = @inferred(LinearInterpolation(u, t; extrapolation = ExtrapolationType.Extension))
 
     F32 = Float32(1)
     F64 = Float64(1)
@@ -416,7 +380,7 @@ end
         for t in (t_r, t_v)
             A = LinearInterpolation(u, t)
             @test A.t_props.is_uniform
-            @test A.is_uniform_static === Val(true)
+            @test A.kind === FindFirstFunctions.KIND_UNIFORM_STEP
 
             # Tolerance scaled to `length(t) * eps * max(|u|)`; the realistic
             # ulp gap at the per-segment scale is O(length(t)).
@@ -432,7 +396,7 @@ end
         t_nu = sort!(rand(StableRNG(0xcafef00d), n)) .* 10.0
         A_nu = LinearInterpolation(u, t_nu)
         @test !A_nu.t_props.is_uniform
-        @test A_nu.is_uniform_static === Val(false)
+        @test A_nu.kind !== FindFirstFunctions.KIND_UNIFORM_STEP
         qs_nu = sort!(rand(StableRNG(0x0b0bcafe), 5000)) .* (last(t_nu) - first(t_nu)) .+
             first(t_nu)
         for q in qs_nu
@@ -446,7 +410,7 @@ end
         t_trick[52:60] .= range(54.5, 60.0, length = 9)
         A_trick = LinearInterpolation(randn(StableRNG(0xdeadbeef), 101), t_trick)
         @test !A_trick.t_props.is_uniform
-        @test A_trick.is_uniform_static === Val(false)
+        @test A_trick.kind !== FindFirstFunctions.KIND_UNIFORM_STEP
 
         # Extension extrapolation reaches the fast path with t far outside
         # the knot span, where the closed-form float index exceeds
@@ -458,13 +422,13 @@ end
             @test isapprox(A_ext(q), slope_form_eval(A_ext, q); rtol = 1.0e-10)
         end
 
-        # push! mutates A.t while t_props (and the IsUniform type tag)
+        # push! mutates A.t while t_props (and the cached kind)
         # keep their construction-time values. The fast path must detect
         # the stale cell/spacing against the live knots and fall back
         # rather than silently interpolate with the stale inv_step.
         t_m = collect(0.0:1.0:10.0)
         A_m = LinearInterpolation(sin.(t_m), t_m)
-        @test A_m.is_uniform_static === Val(true)
+        @test A_m.kind === FindFirstFunctions.KIND_UNIFORM_STEP
         push!(A_m, -0.3, 10.5)   # breaks the uniform spacing (1.0 → 0.5)
         # Queries in the mutated region must fall back to the slope path
         # (exact match); queries in the untouched uniform region still

From f09c1b89ff1962c079320d9140886d376d2f6fc7 Mon Sep 17 00:00:00 2001
From: ChrisRackauckas-Claude <accounts@chrisrackauckas.com>
Date: Fri, 19 Jun 2026 11:22:06 -0400
Subject: [PATCH 24/24] Add a static lean fast path for AbstractRange knots
 (1.8x on range A(q))
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

The single runtime-kind-branch uniform path is right for Vector knots
(uniformity is a value property; a Vector can be push!-mutated or
caller-forced-uniform on jittered data, so it needs the live-knot
cell/spacing verification + slope fallback). But an AbstractRange is
uniform at the *type* level and is immutable + exactly spaced, so it can
take a leaner kernel — dispatched statically on typeof(t), which is
inference-safe (no value-dependent Union, unlike the old IsUniform tag).

Add _interpolate(::LinearInterpolation{<:AbstractVector{<:AbstractFloat},
<:AbstractRange}, ...) → _linear_uniform_range_interpolate, which:
  - skips the runtime kind branch (ranges are always KIND_UNIFORM_STEP),
  - skips the cell/spacing verification (a range can't go stale),
  - computes α directly from the float position (α = f - idx0), avoiding
    the two A.t[idx] range-arithmetic loads,
  - skips the vestigial iguesser store (the closed form never searches).
It keeps full NaN handling (NaN query → NaN derivative; NaN-adjacent u
resolved by exact-knot comparison), matching the other methods.

Vector knots keep the runtime-branch verified path unchanged; non-Float
u and non-uniform knots keep the slope form.

Measured per-query (n=10k, monomorphic loop): range A(q) 30.5 -> 17.0
ns/q; uniform Vector unchanged (18.4); non-uniform unchanged. Inference
stays clean (constructor + query inferred for both Range and Vector),
AD works through the kernel (Mooncake/Zygote/SCT green), and it is
allocation-free (AllocCheck). All 5 groups pass against registered
FindFirstFunctions v3.0.0.

Co-Authored-By: Claude Fable 5 <noreply@anthropic.com>
Co-Authored-By: Chris Rackauckas <accounts@chrisrackauckas.com>
---
 src/interpolation_methods.jl | 68 +++++++++++++++++++++++++++++++++---
 1 file changed, 63 insertions(+), 5 deletions(-)

diff --git a/src/interpolation_methods.jl b/src/interpolation_methods.jl
index ad50df9b..07a92cb1 100644
--- a/src/interpolation_methods.jl
+++ b/src/interpolation_methods.jl
@@ -169,11 +169,26 @@ function _extrapolate_right(A::SmoothedConstantInterpolation, t)
     end
 end
 
-# Linear Interpolation. Float-valued knots take the uniform-grid closed-form
-# fast path when `kind === KIND_UNIFORM_STEP`. The choice is a runtime branch
-# on the cached enum — not a cache type parameter — so the constructor stays
-# fully type-inferred, and both arms return the same concrete value type so
-# the query stays inferred too. Non-Float `u` always uses the slope form.
+# Linear Interpolation — two uniform fast paths, both inference-safe:
+#
+#   1. STATIC, for `AbstractRange` knots. A range is uniform at the *type*
+#      level (no value-dependent tag, so the constructor stays inferred) and
+#      is immutable + exactly spaced, so the lean closed form needs neither
+#      the runtime `kind` branch nor the cell/spacing verification, and it
+#      gets `α` straight from the float position without loading `A.t[idx]`.
+#   2. RUNTIME, for `Vector{<:AbstractFloat}` knots. Uniformity here is a
+#      value property, carried by the `kind` enum; the branch picks the
+#      verified closed form (a `Vector` can be `push!`-mutated or
+#      caller-forced-uniform on jittered data, so it must check the live
+#      knots and fall back). Both arms return the same concrete type.
+#
+# Non-Float `u`, and non-uniform knots, use the slope form.
+function _interpolate(
+        A::LinearInterpolation{<:AbstractVector{<:AbstractFloat}, <:AbstractRange},
+        t::Number, iguess,
+    )
+    return _linear_uniform_range_interpolate(A, t, iguess)
+end
 function _interpolate(
         A::LinearInterpolation{<:AbstractVector{<:AbstractFloat}}, t::Number, iguess,
     )
@@ -187,6 +202,49 @@ function _interpolate(A::LinearInterpolation{<:AbstractVector}, t::Number, igues
     return _linear_slope_interpolate(A, t, iguess)
 end
 
+# Lean uniform kernel for `AbstractRange` knots. No verification (a range is
+# immutable and exactly uniform) and no `A.t[idx]` load (`α` is the
+# fractional part of the float position `f`). NaN handling matches the other
+# methods: a NaN query propagates through the partial of `t` for correct
+# derivatives, and a NaN-adjacent `u` is resolved by exact-knot comparison.
+@inline function _linear_uniform_range_interpolate(
+        A::LinearInterpolation{<:AbstractVector{<:AbstractFloat}}, t::Number, iguess,
+    )
+    if isnan(t)
+        idx = firstindex(A.u)
+        u1 = oneunit(eltype(A.u))
+        slope = t / t * get_parameters(A, idx)
+        Δu = slope * (t - oneunit(eltype(A.t)))
+        return oftype(Δu, u1) + Δu
+    end
+    props = A.t_props
+    f = (t - props.first_val) * props.inv_step
+    n = length(A.t)
+    idx0 = if f < 0
+        0
+    elseif f > n - 2
+        n - 2
+    else
+        unsafe_trunc(Int, floor(f))
+    end
+    α = f - idx0
+    @inbounds u1 = A.u[idx0 + 1]
+    @inbounds u2 = A.u[idx0 + 2]
+    Δu = α * (u2 - u1)
+    if any(isnan.(Δu))
+        # `0 * NaN = NaN` poisons exact-knot queries when a neighbour is NaN;
+        # resolve by comparing the query to the bracketing knots directly.
+        @inbounds t1 = A.t[idx0 + 1]
+        @inbounds t2 = A.t[idx0 + 2]
+        if t == t2
+            return u2 + zero(Δu)
+        elseif t == t1
+            return u1 + zero(Δu)
+        end
+    end
+    return u1 + Δu
+end
+
 function _linear_slope_interpolate(A::LinearInterpolation, t::Number, iguess)
     if isnan(t)
         # For correct derivative with NaN