Experiment 025 — f32 vs f64 Precision Drift

Rendered from exp-025-precision-drift.ipynb

Experiment 025 — f32 vs f64 Precision Drift

Validates the analysis methodology for detecting f32→f64 precision drift in WDM (Warm Dense Matter) transport coefficient calculations via Green-Kubo integration of velocity autocorrelation functions. Core idea:

Synthetic VACF: C(t) = c0 * exp(-t/tau) with additive noise
Trapezoidal integration in f64 (reference) vs f32 accumulation (GPU-like)
Bias-variance decomposition of f32-f64 differences
Error-magnitude correlation (larger integrals → larger rounding drift) References: IEEE 754-2019, Higham (2002) Accuracy and Stability of Numerical Algorithms

Domain: Numerical Methods Faculty: WDM Reference: WDM float precision analysis

Data source: control/precision_drift/precision_drift.py + benchmark_*.json

This notebook is the publication-grade Python baseline for Experiment 025. The identical computations are validated in Rust (see validate_* binary) and delegated to barraCuda for GPU acceleration.

import json
import math
import sys
from pathlib import Path

import numpy as np
import matplotlib.pyplot as plt

# Wire path to groundSpring control/ for common utilities
CONTROL = Path('..') / '..' / 'control'
sys.path.insert(0, str(CONTROL))
from common import *  # noqa: F403 — validation harness

# Load benchmark data
benchmark_path = CONTROL / 'precision_drift' / 'benchmark_precision_drift.json'
with open(benchmark_path) as f:
    benchmark = json.load(f)

PASS_COLOR = '#2ecc71'
FAIL_COLOR = '#e74c3c'
INFO_COLOR = '#3498db'

print(f'Loaded benchmark: benchmark_precision_drift.json')
print(f'Provenance: {benchmark.get("_provenance", {})}')

Validation

Initialization

print("groundSpring Exp 025: f32 vs f64 Precision Drift")
print("  WDM transport coefficient Green-Kubo integration")

model = benchmark["model"]
exp = benchmark["expected_results"]

c0 = model["c0"]
dt = model["dt"]
d_dim = model["d_dim"]
n_steps = model["n_steps"]
tau_values = model["tau_values"]
noise_amplitude = model["noise_amplitude"]
n_realizations = model["n_realizations"]
seed = model["seed"]

rng = np.random.default_rng(seed)

Noiseless run for f64 vs analytical (check 1)

# Finite window: ∫₀ᵀ c0*exp(-t/τ) dt = c0*τ*(1 - exp(-T/τ))
t_max = (n_steps - 1) * dt
f64_noiseless_max_rel_err = 0.0
for tau in tau_values:
    vacf_clean = c0 * np.exp(-np.arange(n_steps, dtype=np.float64) * dt / tau)
    integral_f64_clean = float(np.trapezoid(vacf_clean, dx=dt))
    analytical_finite = c0 * tau * (1.0 - np.exp(-t_max / tau))
    if analytical_finite != 0:
        rel_err = abs(integral_f64_clean - analytical_finite) / analytical_finite
        f64_noiseless_max_rel_err = max(f64_noiseless_max_rel_err, rel_err)

Collect results across all tau and realizations (noisy)

all_integral_f64: list[float] = []
all_integral_f32: list[float] = []
all_analytical: list[float] = []
tau_per_realization: list[float] = []

for tau in tau_values:
    analytical_integral = c0 * tau

    integrals_f64: list[float] = []
    integrals_f32: list[float] = []
    rel_errors: list[float] = []

    for _ in range(n_realizations):
        vacf = synthetic_vacf_noisy(
            c0, tau, n_steps, dt, noise_amplitude, rng
        )
        integral_f64 = float(np.trapezoid(vacf, dx=dt))
        integral_f32 = green_kubo_f32_scalar(vacf, dt)

        all_integral_f64.append(integral_f64)
        all_integral_f32.append(integral_f32)
        all_analytical.append(analytical_integral)
        tau_per_realization.append(tau)

        integrals_f64.append(integral_f64)
        integrals_f32.append(integral_f32)
        if integral_f64 != 0:
            rel_errors.append((integral_f32 - integral_f64) / integral_f64)

    mean_f64 = float(np.mean(integrals_f64))
    std_f64 = float(np.std(integrals_f64))
    mean_rel = float(np.mean(rel_errors)) if rel_errors else 0.0
    print(
        f"\n  tau={tau:.1f}: f64 mean={mean_f64:.6f}, std={std_f64:.6f}, "
        f"mean_rel_err={mean_rel:.6f}"
    )

Derive global stats

all_relative_errors = [
    (all_integral_f32[i] - all_integral_f64[i]) / all_integral_f64[i]
    for i in range(len(all_integral_f64))
    if all_integral_f64[i] != 0
]
all_abs_errors = [
    abs(all_integral_f32[i] - all_integral_f64[i])
    for i in range(len(all_integral_f64))
    if all_integral_f64[i] != 0
]

Validation Checks

# Check 1: f64 max relative error vs analytical (noiseless VACF)
check_max(
    "f64 max relative error vs analytical (noiseless)",
    f64_noiseless_max_rel_err,
    exp["f64_analytical_max_error"],
)

# Check 2: f32 max relative error vs f64
f32_max_rel_err = max(abs(r) for r in all_relative_errors) if all_relative_errors else 0.0
check_max(
    "f32 max relative error vs f64",
    f32_max_rel_err,
    exp["f32_relative_error_max"],
)

# Check 3: Mean relative error (bias) in range
mean_rel_err = float(np.mean(all_relative_errors)) if all_relative_errors else 0.0
lo, hi = exp["mean_relative_error_range"]
check_range(
    "Mean relative error (bias detection) in range",
    mean_rel_err,
    lo,
    hi,
)

# Check 4: Bias fraction above minimum
errors = np.array(
    [
        all_integral_f32[i] - all_integral_f64[i]
        for i in range(len(all_integral_f64))
    ]
)
mbe = float(np.mean(errors))
rmse = float(np.sqrt(np.mean(errors**2)))
decomp = decompose_error(mbe, rmse)
check_min(
    "Bias fraction above minimum",
    decomp["bias_fraction"],
    exp["bias_fraction_min"],
)

# Check 5: Max absolute diffusion error (f32 vs f64, not vs analytical)
max_diff_err = 0.0
for i in range(len(all_integral_f64)):
    d_f64 = all_integral_f64[i] / d_dim
    d_f32 = all_integral_f32[i] / d_dim
    max_diff_err = max(max_diff_err, abs(d_f32 - d_f64))
check_max(
    "Max absolute diffusion error (f32 vs f64)",
    max_diff_err,
    exp["max_diffusion_absolute_error"],
)

# Check 6: Error-magnitude correlation (|f32-f64| vs expected integral c0*tau)
abs_errors_arr = np.array(all_abs_errors)
expected_magnitudes = np.array(
    [c0 * tau_per_realization[i] for i in range(len(all_integral_f64)) if all_integral_f64[i] != 0]
)
if len(abs_errors_arr) >= 2 and len(abs_errors_arr) == len(expected_magnitudes):
    corr = float(np.corrcoef(abs_errors_arr, expected_magnitudes)[0, 1])
    if np.isnan(corr):
        corr = 0.0
else:
    corr = 0.0
check_min(
    "Error-magnitude correlation (larger integrals → larger errors)",
    corr,
    exp["error_magnitude_correlation_min"],
)

# Check 7: Relative error std bounded
rel_err_std = float(np.std(all_relative_errors)) if all_relative_errors else 0.0
check_max(
    "Relative error std",
    rel_err_std,
    exp["relative_error_std_max"],
)

# Results: {pass_count()}/{total_count()} checks passed
print_summary("Exp 025: f32 vs f64 Precision Drift")

Visualization

# Publication-grade summary chart for Exp 025
fig, ax = plt.subplots(figsize=(8, 4))

p, f_count, t = pass_count(), fail_count(), total_count()
ax.barh(['Pass', 'Fail'], [p, f_count], color=[PASS_COLOR, FAIL_COLOR])
ax.set_xlim(0, max(t * 1.15, 1))
ax.set_title('Exp 025: f32 vs f64 Precision Drift — Validation Results')
ax.set_xlabel('Check Count')
for i, v in enumerate([p, f_count]):
    if v > 0:
        ax.text(v + 0.3, i, str(v), va='center', fontweight='bold')

plt.tight_layout()
plt.savefig(f'/tmp/groundspring_exp025.png', dpi=150, bbox_inches='tight')
plt.show()
print(f'\nResult: {p}/{t} PASS, {f_count}/{t} FAIL')

Provenance & Summary

Field	Value
Experiment	025 — f32 vs f64 Precision Drift
Domain	Numerical Methods
Reference	WDM float precision analysis
Faculty	WDM
Python baseline	`control/precision_drift/precision_drift.py`
Benchmark JSON	`control/precision_drift/benchmark_precision_drift.json`
Rust validator	`validate_*` binary (exit-code protocol)
Rust speedup	See benchmark comparison notebook
License	AGPL-3.0-or-later

Provenance chain: Python baseline → Rust validation → barraCuda GPU → metalForge cross-substrate → primal IPC composition

See primals.eco for rendered lab notebooks.