diff --git a/audit/internal/platform/benchmark_report.go b/audit/internal/platform/benchmark_report.go index 54487f1..b4cadc2 100644 --- a/audit/internal/platform/benchmark_report.go +++ b/audit/internal/platform/benchmark_report.go @@ -86,13 +86,14 @@ func renderBenchmarkReportWithCharts(result NvidiaBenchmarkResult) string { // ── Methodology ─────────────────────────────────────────────────────────── b.WriteString("## Methodology\n\n") - fmt.Fprintf(&b, "- Profile `%s` uses standardized baseline -> warmup -> steady-state -> interconnect phases.\n", result.BenchmarkProfile) + fmt.Fprintf(&b, "- Profile `%s` uses standardized baseline → warmup → steady-state → interconnect phases.\n", result.BenchmarkProfile) b.WriteString("- Single-GPU compute score comes from `bee-gpu-burn` on the cuBLASLt path when available.\n") - b.WriteString("- Thermal and power limits are inferred from NVIDIA clock-event counters plus sustained telemetry.\n") + b.WriteString("- GPUs run at their default power limits — no pre-benchmark power calibration is performed.\n") + b.WriteString("- Throttling and thermal state are inferred from NVIDIA clock-event counters and sustained telemetry.\n") b.WriteString("- `result.json` is the canonical machine-readable source for the run.\n\n") b.WriteString("**Compute score** is derived from two phases:\n\n") b.WriteString("- **Synthetic** — each precision type (int8, fp8, fp16, fp32, fp64, fp4) runs alone for a dedicated window. ") - b.WriteString("Measures peak throughput with the full GPU dedicated to one kernel type. ") + b.WriteString("Measures peak throughput with the full GPU memory budget dedicated to one kernel type. ") b.WriteString("Each result is normalised to fp32-equivalent TOPS using precision weights: ") b.WriteString("fp64 ×2.0 · fp32 ×1.0 · fp16 ×0.5 · int8 ×0.25 · fp8 ×0.25 · fp4 ×0.125.\n") b.WriteString("- **Mixed** — all precision types run simultaneously (combined phase). ") @@ -100,6 +101,11 @@ func renderBenchmarkReportWithCharts(result NvidiaBenchmarkResult) string { b.WriteString("**Formula:** `Compute = Synthetic × (1 + MixedEfficiency × 0.3)`\n\n") b.WriteString("where `MixedEfficiency = Mixed / Synthetic`. A GPU that sustains 90 % throughput under mixed load ") b.WriteString("receives a +27 % bonus over its synthetic score; one that drops to 60 % receives +18 %.\n\n") + b.WriteString("**Platform power score** — after all single-GPU runs, a ramp-up phase adds GPUs one by one (k=2..N) ") + b.WriteString("and measures total Synthetic TOPS. Scalability for step k = `k_total_TOPS / (k × best_single_TOPS) × 100`. ") + b.WriteString("`PlatformPowerScore` = mean scalability across all ramp steps. 100 % means linear scaling.\n\n") + b.WriteString("**PowerSustainScore** — measures how close the GPU ran to its rated TDP during steady-state load. ") + b.WriteString("Uses steady-state average power as the reference (no external calibration needed).\n\n") b.WriteString("**Composite score** = `Compute × quality_factor` where quality factors in power sustain, thermal sustain, stability, and interconnect.\n\n") // ── Scorecard table ─────────────────────────────────────────────────────── @@ -174,13 +180,13 @@ func renderBenchmarkReportWithCharts(result NvidiaBenchmarkResult) string { fmt.Fprintf(&b, "- **Power limit:** %.0f W (default %.0f W)\n", gpu.PowerLimitW, gpu.DefaultPowerLimitW) } if gpu.PowerLimitDerated { - fmt.Fprintf(&b, "- **Power limit derating:** active after %d targeted_power attempt(s)\n", gpu.PowerCalibrationTries) + fmt.Fprintf(&b, "- **Power limit derating:** active (reduced limit %.0f W)\n", gpu.PowerLimitW) } if gpu.CalibratedPeakPowerW > 0 { if gpu.CalibratedPeakTempC > 0 { - fmt.Fprintf(&b, "- **Power calibration (`dcgmi targeted_power`):** %.0f W p95 at %.1f °C p95\n", gpu.CalibratedPeakPowerW, gpu.CalibratedPeakTempC) + fmt.Fprintf(&b, "- **Calibrated peak power:** %.0f W p95 at %.1f °C p95\n", gpu.CalibratedPeakPowerW, gpu.CalibratedPeakTempC) } else { - fmt.Fprintf(&b, "- **Power calibration (`dcgmi targeted_power`):** %.0f W p95\n", gpu.CalibratedPeakPowerW) + fmt.Fprintf(&b, "- **Calibrated peak power:** %.0f W p95\n", gpu.CalibratedPeakPowerW) } } if gpu.LockedGraphicsClockMHz > 0 {