From 842fa924386e2e9c317c643ddbe6daef8e564976 Mon Sep 17 00:00:00 2001 From: Mikhail Chusavitin Date: Fri, 17 Apr 2026 13:39:02 +0300 Subject: [PATCH] commit results --- perf/perf-20260416-052102/result.json | 2286 ++++++++++++++++++++++ perf/perf-20260416-231014/result.json | 2378 +++++++++++++++++++++++ perf/perf-20260417-050338/result.json | 2376 ++++++++++++++++++++++ perf/perf-20260417-154119/result.json | 1840 ++++++++++++++++++ power/power-20260414-202612/result.json | 42 + power/power-20260414-203047/result.json | 74 + power/power-20260414-203715/result.json | 106 + power/power-20260414-204624/result.json | 141 ++ power/power-20260416-044811/result.json | 240 +++ power/power-20260416-053129/result.json | 240 +++ power/power-20260416-223651/result.json | 248 +++ power/power-20260417-150143/result.json | 248 +++ 12 files changed, 10219 insertions(+) create mode 100644 perf/perf-20260416-052102/result.json create mode 100644 perf/perf-20260416-231014/result.json create mode 100644 perf/perf-20260417-050338/result.json create mode 100644 perf/perf-20260417-154119/result.json create mode 100644 power/power-20260414-202612/result.json create mode 100644 power/power-20260414-203047/result.json create mode 100644 power/power-20260414-203715/result.json create mode 100644 power/power-20260414-204624/result.json create mode 100644 power/power-20260416-044811/result.json create mode 100644 power/power-20260416-053129/result.json create mode 100644 power/power-20260416-223651/result.json create mode 100644 power/power-20260417-150143/result.json diff --git a/perf/perf-20260416-052102/result.json b/perf/perf-20260416-052102/result.json new file mode 100644 index 0000000..59ee0d9 --- /dev/null +++ b/perf/perf-20260416-052102/result.json @@ -0,0 +1,2286 @@ +{ + "benchmark_version": "2", + "generated_at": "2026-04-16T05:21:02.2190505Z", + "hostname": "debian", + "server_model": "G5500 V7", + "benchmark_profile": "standard", + "parallel_gpus": true, + "ramp_total": 8, + "ramp_run_id": "ramp-20260416-043044", + "overall_status": "FAILED", + "selected_gpu_indices": [ + 0, + 1, + 2, + 3, + 4, + 5, + 6, + 7 + ], + "findings": [ + "0 of 8 GPU(s) passed the benchmark.", + "GPU 0 had incomplete precision coverage: fp64:FAILED, fp4:FAILED.", + "GPU 1 had incomplete precision coverage: fp64:FAILED, fp4:FAILED.", + "GPU 2 had incomplete precision coverage: fp64:FAILED, fp4:FAILED.", + "GPU 3 had incomplete precision coverage: fp64:FAILED, fp4:FAILED.", + "GPU 4 had incomplete precision coverage: fp64:FAILED, fp4:FAILED.", + "GPU 5 had incomplete precision coverage: fp64:FAILED, fp4:FAILED.", + "GPU 6 had incomplete precision coverage: fp64:FAILED, fp4:FAILED.", + "GPU 7 had incomplete precision coverage: fp64:FAILED, fp4:FAILED.", + "Multi-GPU all_reduce max bus bandwidth: 3.9 GB/s." + ], + "normalization": { + "status": "full", + "gpus": [ + { + "index": 0, + "persistence_mode": "applied", + "gpu_clock_lock_mhz": 2430, + "gpu_clock_lock_status": "applied", + "memory_clock_lock_mhz": 12481, + "memory_clock_lock_status": "applied" + }, + { + "index": 1, + "persistence_mode": "applied", + "gpu_clock_lock_mhz": 2430, + "gpu_clock_lock_status": "applied", + "memory_clock_lock_mhz": 12481, + "memory_clock_lock_status": "applied" + }, + { + "index": 2, + "persistence_mode": "applied", + "gpu_clock_lock_mhz": 2430, + "gpu_clock_lock_status": "applied", + "memory_clock_lock_mhz": 12481, + "memory_clock_lock_status": "applied" + }, + { + "index": 3, + "persistence_mode": "applied", + "gpu_clock_lock_mhz": 2430, + "gpu_clock_lock_status": "applied", + "memory_clock_lock_mhz": 12481, + "memory_clock_lock_status": "applied" + }, + { + "index": 4, + "persistence_mode": "applied", + "gpu_clock_lock_mhz": 2430, + "gpu_clock_lock_status": "applied", + "memory_clock_lock_mhz": 12481, + "memory_clock_lock_status": "applied" + }, + { + "index": 5, + "persistence_mode": "applied", + "gpu_clock_lock_mhz": 2430, + "gpu_clock_lock_status": "applied", + "memory_clock_lock_mhz": 12481, + "memory_clock_lock_status": "applied" + }, + { + "index": 6, + "persistence_mode": "applied", + "gpu_clock_lock_mhz": 2430, + "gpu_clock_lock_status": "applied", + "memory_clock_lock_mhz": 12481, + "memory_clock_lock_status": "applied" + }, + { + "index": 7, + "persistence_mode": "applied", + "gpu_clock_lock_mhz": 2430, + "gpu_clock_lock_status": "applied", + "memory_clock_lock_mhz": 12481, + "memory_clock_lock_status": "applied" + } + ] + }, + "host_config": { + "cpu_model": "INTEL(R) XEON(R) GOLD 6530", + "cpu_sockets": 2, + "cpu_cores": 64, + "cpu_threads": 128, + "mem_total_gib": 125.36545181274414 + }, + "cpu_load": { + "avg_pct": 4.2, + "max_pct": 8.4, + "p95_pct": 7.9, + "samples": 62, + "status": "ok" + }, + "cooling": { + "available": true, + "avg_fan_rpm": 14154.940277777778, + "notes": [ + "fan duty cycle unavailable on this host; RPM-only fan telemetry was collected" + ] + }, + "gpus": [ + { + "index": 0, + "uuid": "GPU-8281bc14-c076-e306-75b1-e91596be45e7", + "name": "NVIDIA RTX PRO 6000 Blackwell Server Edition", + "bus_id": "00000000:4B:00.0", + "vbios": "98.02.67.00.0A", + "status": "PARTIAL", + "power_limit_w": 600, + "default_power_limit_w": 600, + "max_graphics_clock_mhz": 2430, + "max_memory_clock_mhz": 12481, + "locked_graphics_clock_mhz": 2430, + "locked_memory_clock_mhz": 12481, + "baseline": { + "duration_sec": 15.849643133, + "samples": 4, + "avg_temp_c": 57, + "p95_temp_c": 58.85, + "avg_power_w": 96.22, + "p95_power_w": 98.126, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 0, + "avg_mem_usage_pct": 0, + "clock_cv_pct": 0, + "power_cv_pct": 1.5019915264964885, + "temp_cv_pct": 2.773927772077526, + "clock_drift_pct": 0 + }, + "steady": { + "duration_sec": 373.111930521, + "samples": 4, + "avg_temp_c": 51, + "p95_temp_c": 51.85, + "avg_power_w": 91.355, + "p95_power_w": 92.31299999999999, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 0, + "avg_mem_usage_pct": 0, + "clock_cv_pct": 0, + "power_cv_pct": 0.7733045860923672, + "temp_cv_pct": 1.386483884679505, + "clock_drift_pct": 0 + }, + "precision_steady": [ + { + "precision": "int8", + "status": "OK", + "steady": { + "duration_sec": 59.248277208, + "samples": 17, + "avg_temp_c": 72, + "p95_temp_c": 75, + "avg_power_w": 529.4629411764705, + "p95_power_w": 553.928, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 39, + "clock_cv_pct": 0, + "power_cv_pct": 12.497271117943772, + "temp_cv_pct": 5.8732682207880496, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 1309.9208810692608, + "weighted_teraops_per_sec": 327.4802202673152, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + }, + { + "precision": "fp8", + "status": "OK", + "steady": { + "duration_sec": 114.243796414, + "samples": 22, + "avg_temp_c": 73.54545454545455, + "p95_temp_c": 74, + "avg_power_w": 535.1590909090908, + "p95_power_w": 552.91, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 29.90909090909091, + "clock_cv_pct": 0, + "power_cv_pct": 3.6202719707043056, + "temp_cv_pct": 0.6770365358531101, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 923.749016666112, + "weighted_teraops_per_sec": 230.937254166528, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + }, + { + "precision": "fp16", + "status": "OK", + "steady": { + "duration_sec": 176.160171192, + "samples": 13, + "avg_temp_c": 72.15384615384616, + "p95_temp_c": 73, + "avg_power_w": 512.2153846153847, + "p95_power_w": 514.4499999999999, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 23.307692307692307, + "clock_cv_pct": 0, + "power_cv_pct": 0.5924890406655379, + "temp_cv_pct": 0.7386144168737215, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 607.5168247338326, + "weighted_teraops_per_sec": 303.7584123669163, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + }, + { + "precision": "fp32", + "status": "OK", + "steady": { + "duration_sec": 239.404420095, + "samples": 21, + "avg_temp_c": 71.80952380952381, + "p95_temp_c": 72, + "avg_power_w": 513.3733333333334, + "p95_power_w": 514.91, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 32.80952380952381, + "clock_cv_pct": 0, + "power_cv_pct": 0.5219290159565562, + "temp_cv_pct": 0.5468309848299284, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 424.4014891008, + "weighted_teraops_per_sec": 424.4014891008, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + }, + { + "precision": "fp64", + "status": "FAILED", + "steady": { + "duration_sec": 299.580549419, + "samples": 17, + "avg_temp_c": 71, + "p95_temp_c": 71, + "avg_power_w": 507.62588235294123, + "p95_power_w": 508.52, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 33.11764705882353, + "clock_cv_pct": 0, + "power_cv_pct": 0.11538475287053507, + "temp_cv_pct": 0, + "clock_drift_pct": 0 + }, + "ecc": { + "corrected": 0, + "uncorrected": 0 + }, + "notes": "precision phase failed" + }, + { + "precision": "fp4", + "status": "FAILED", + "steady": { + "duration_sec": 358.09705093, + "samples": 21, + "avg_temp_c": 68.61904761904762, + "p95_temp_c": 71, + "avg_power_w": 431.39571428571423, + "p95_power_w": 508.26, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 80.95238095238095, + "avg_mem_usage_pct": 25.523809523809526, + "clock_cv_pct": 0, + "power_cv_pct": 36.360837367320755, + "temp_cv_pct": 7.216542968136386, + "clock_drift_pct": 0 + }, + "ecc": { + "corrected": 0, + "uncorrected": 0 + }, + "notes": "precision phase failed" + } + ], + "precision_failures": [ + "fp64:FAILED", + "fp4:FAILED" + ], + "cooldown": { + "duration_sec": 0, + "samples": 0, + "avg_temp_c": 0, + "p95_temp_c": 0, + "avg_power_w": 0, + "p95_power_w": 0, + "avg_graphics_clock_mhz": 0, + "p95_graphics_clock_mhz": 0, + "avg_memory_clock_mhz": 0, + "p95_memory_clock_mhz": 0, + "avg_usage_pct": 0, + "avg_mem_usage_pct": 0, + "clock_cv_pct": 0, + "power_cv_pct": 0, + "temp_cv_pct": 0, + "clock_drift_pct": 0 + }, + "throttle_counters": { + "sw_power_cap_us": 0, + "sw_thermal_slowdown_us": 0, + "sync_boost_us": 0, + "hw_thermal_slowdown_us": 0, + "hw_power_brake_slowdown_us": 0 + }, + "ecc": { + "corrected": 0, + "uncorrected": 0 + }, + "scores": { + "compute_score": 1286.5773759015594, + "synthetic_score": 1286.5773759015594, + "power_sustain_score": 74.65966038426298, + "thermal_sustain_score": 95.84054834596148, + "stability_score": 100, + "thermal_throttle_pct": 0, + "power_cap_throttle_pct": 0, + "temp_headroom_c": 38.15, + "interconnect_score": 3.93, + "server_quality_score": 91.15006261906734, + "composite_score": 1286.5773759015594 + }, + "notes": [ + "parallel warmup failed: exit status 1" + ] + }, + { + "index": 1, + "uuid": "GPU-a66d6d68-9870-dfe0-1823-b38a141c21ae", + "name": "NVIDIA RTX PRO 6000 Blackwell Server Edition", + "bus_id": "00000000:4C:00.0", + "vbios": "98.02.67.00.0A", + "status": "PARTIAL", + "power_limit_w": 600, + "default_power_limit_w": 600, + "max_graphics_clock_mhz": 2430, + "max_memory_clock_mhz": 12481, + "locked_graphics_clock_mhz": 2430, + "locked_memory_clock_mhz": 12481, + "baseline": { + "duration_sec": 15.849643133, + "samples": 4, + "avg_temp_c": 58.5, + "p95_temp_c": 59.85, + "avg_power_w": 94.40750000000001, + "p95_power_w": 96.1075, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 0, + "avg_mem_usage_pct": 0, + "clock_cv_pct": 0, + "power_cv_pct": 1.328010909383179, + "temp_cv_pct": 1.9111692115382817, + "clock_drift_pct": 0 + }, + "steady": { + "duration_sec": 373.111930521, + "samples": 4, + "avg_temp_c": 53.25, + "p95_temp_c": 53.85, + "avg_power_w": 90.3175, + "p95_power_w": 90.9165, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 0, + "avg_mem_usage_pct": 0, + "clock_cv_pct": 0, + "power_cv_pct": 0.5192883573918129, + "temp_cv_pct": 0.813169393224825, + "clock_drift_pct": 0 + }, + "precision_steady": [ + { + "precision": "int8", + "status": "OK", + "steady": { + "duration_sec": 59.248277208, + "samples": 17, + "avg_temp_c": 73.47058823529412, + "p95_temp_c": 76, + "avg_power_w": 532.3541176470588, + "p95_power_w": 555.658, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 38.11764705882353, + "clock_cv_pct": 0, + "power_cv_pct": 14.307554722478269, + "temp_cv_pct": 5.585005613000892, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 1309.9208810692608, + "weighted_teraops_per_sec": 327.4802202673152, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + }, + { + "precision": "fp8", + "status": "OK", + "steady": { + "duration_sec": 114.243796414, + "samples": 22, + "avg_temp_c": 75, + "p95_temp_c": 75, + "avg_power_w": 537.2013636363637, + "p95_power_w": 554.6, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 29.40909090909091, + "clock_cv_pct": 0, + "power_cv_pct": 3.5141873681220037, + "temp_cv_pct": 0, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 923.749016666112, + "weighted_teraops_per_sec": 230.937254166528, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + }, + { + "precision": "fp16", + "status": "OK", + "steady": { + "duration_sec": 176.160171192, + "samples": 13, + "avg_temp_c": 73.84615384615384, + "p95_temp_c": 74.4, + "avg_power_w": 518.3176923076923, + "p95_power_w": 526.056, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 23.307692307692307, + "clock_cv_pct": 0, + "power_cv_pct": 0.9687335115374177, + "temp_cv_pct": 0.7216878364870324, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 607.5168247338326, + "weighted_teraops_per_sec": 303.7584123669163, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + }, + { + "precision": "fp32", + "status": "OK", + "steady": { + "duration_sec": 239.404420095, + "samples": 21, + "avg_temp_c": 73.95238095238095, + "p95_temp_c": 74, + "avg_power_w": 524.8838095238095, + "p95_power_w": 527.03, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 32.714285714285715, + "clock_cv_pct": 0, + "power_cv_pct": 0.6950004038040529, + "temp_cv_pct": 0.28796754378619316, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 424.4014891008, + "weighted_teraops_per_sec": 424.4014891008, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + }, + { + "precision": "fp64", + "status": "FAILED", + "steady": { + "duration_sec": 299.580549419, + "samples": 17, + "avg_temp_c": 73.23529411764706, + "p95_temp_c": 74, + "avg_power_w": 517.9717647058823, + "p95_power_w": 519.466, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 32.529411764705884, + "clock_cv_pct": 0, + "power_cv_pct": 0.19801583726916133, + "temp_cv_pct": 0.5792050241709219, + "clock_drift_pct": 0 + }, + "ecc": { + "corrected": 0, + "uncorrected": 0 + }, + "notes": "precision phase failed" + }, + { + "precision": "fp4", + "status": "FAILED", + "steady": { + "duration_sec": 358.09705093, + "samples": 21, + "avg_temp_c": 70.9047619047619, + "p95_temp_c": 74, + "avg_power_w": 439.3480952380952, + "p95_power_w": 518.19, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 85.71428571428571, + "avg_mem_usage_pct": 25.095238095238095, + "clock_cv_pct": 0, + "power_cv_pct": 36.60839658818766, + "temp_cv_pct": 6.894208274981244, + "clock_drift_pct": 0 + }, + "ecc": { + "corrected": 0, + "uncorrected": 0 + }, + "notes": "precision phase failed" + } + ], + "precision_failures": [ + "fp64:FAILED", + "fp4:FAILED" + ], + "cooldown": { + "duration_sec": 0, + "samples": 0, + "avg_temp_c": 0, + "p95_temp_c": 0, + "avg_power_w": 0, + "p95_power_w": 0, + "avg_graphics_clock_mhz": 0, + "p95_graphics_clock_mhz": 0, + "avg_memory_clock_mhz": 0, + "p95_memory_clock_mhz": 0, + "avg_usage_pct": 0, + "avg_mem_usage_pct": 0, + "clock_cv_pct": 0, + "power_cv_pct": 0, + "temp_cv_pct": 0, + "clock_drift_pct": 0 + }, + "throttle_counters": { + "sw_power_cap_us": 0, + "sw_thermal_slowdown_us": 0, + "sync_boost_us": 0, + "hw_thermal_slowdown_us": 0, + "hw_power_brake_slowdown_us": 0 + }, + "ecc": { + "corrected": 0, + "uncorrected": 0 + }, + "scores": { + "compute_score": 1286.5773759015594, + "synthetic_score": 1286.5773759015594, + "power_sustain_score": 73.49158741172788, + "thermal_sustain_score": 97.56049182032552, + "stability_score": 100, + "thermal_throttle_pct": 0, + "power_cap_throttle_pct": 0, + "temp_headroom_c": 36.15, + "interconnect_score": 3.93, + "server_quality_score": 91.31562376961601, + "composite_score": 1286.5773759015594 + }, + "notes": [ + "parallel warmup failed: exit status 1" + ] + }, + { + "index": 2, + "uuid": "GPU-82b32f5b-5fca-9674-a845-cfd5da365d09", + "name": "NVIDIA RTX PRO 6000 Blackwell Server Edition", + "bus_id": "00000000:4E:00.0", + "vbios": "98.02.67.00.0A", + "status": "PARTIAL", + "power_limit_w": 600, + "default_power_limit_w": 600, + "max_graphics_clock_mhz": 2430, + "max_memory_clock_mhz": 12481, + "locked_graphics_clock_mhz": 2430, + "locked_memory_clock_mhz": 12481, + "baseline": { + "duration_sec": 15.849643133, + "samples": 4, + "avg_temp_c": 57.5, + "p95_temp_c": 58.85, + "avg_power_w": 97.86499999999998, + "p95_power_w": 99.59949999999999, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 0, + "avg_mem_usage_pct": 0, + "clock_cv_pct": 0, + "power_cv_pct": 1.4553702270844329, + "temp_cv_pct": 1.9444069369563388, + "clock_drift_pct": 0 + }, + "steady": { + "duration_sec": 373.111930521, + "samples": 4, + "avg_temp_c": 52.5, + "p95_temp_c": 53.7, + "avg_power_w": 94.0425, + "p95_power_w": 94.9945, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 0, + "avg_mem_usage_pct": 0, + "clock_cv_pct": 0, + "power_cv_pct": 0.7464443126388652, + "temp_cv_pct": 1.649572197684645, + "clock_drift_pct": 0 + }, + "precision_steady": [ + { + "precision": "int8", + "status": "OK", + "steady": { + "duration_sec": 59.248277208, + "samples": 17, + "avg_temp_c": 72.17647058823529, + "p95_temp_c": 75, + "avg_power_w": 534.7517647058822, + "p95_power_w": 563.6859999999999, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 39, + "clock_cv_pct": 0, + "power_cv_pct": 16.653238714859476, + "temp_cv_pct": 5.824798169586192, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 1309.9208810692608, + "weighted_teraops_per_sec": 327.4802202673152, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + }, + { + "precision": "fp8", + "status": "OK", + "steady": { + "duration_sec": 114.243796414, + "samples": 22, + "avg_temp_c": 74.4090909090909, + "p95_temp_c": 75, + "avg_power_w": 545.8972727272726, + "p95_power_w": 563.7080000000001, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 29.454545454545453, + "clock_cv_pct": 0, + "power_cv_pct": 3.5377165303237597, + "temp_cv_pct": 0.6607607713128876, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 923.749016666112, + "weighted_teraops_per_sec": 230.937254166528, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + }, + { + "precision": "fp16", + "status": "OK", + "steady": { + "duration_sec": 176.160171192, + "samples": 13, + "avg_temp_c": 73.6923076923077, + "p95_temp_c": 74, + "avg_power_w": 525.6192307692307, + "p95_power_w": 530.63, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 22.923076923076923, + "clock_cv_pct": 0, + "power_cv_pct": 0.608774842413476, + "temp_cv_pct": 0.6263048016701461, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 607.5168247338326, + "weighted_teraops_per_sec": 303.7584123669163, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + }, + { + "precision": "fp32", + "status": "OK", + "steady": { + "duration_sec": 239.404420095, + "samples": 21, + "avg_temp_c": 73.33333333333333, + "p95_temp_c": 74, + "avg_power_w": 531.1885714285715, + "p95_power_w": 536.36, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 33.285714285714285, + "clock_cv_pct": 0, + "power_cv_pct": 0.8605826463854318, + "temp_cv_pct": 0.6428243465332251, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 424.4014891008, + "weighted_teraops_per_sec": 424.4014891008, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + }, + { + "precision": "fp64", + "status": "FAILED", + "steady": { + "duration_sec": 299.580549419, + "samples": 17, + "avg_temp_c": 73, + "p95_temp_c": 73, + "avg_power_w": 522.3964705882354, + "p95_power_w": 523.258, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 32.76470588235294, + "clock_cv_pct": 0, + "power_cv_pct": 0.1318213063218618, + "temp_cv_pct": 0, + "clock_drift_pct": 0 + }, + "ecc": { + "corrected": 0, + "uncorrected": 0 + }, + "notes": "precision phase failed" + }, + { + "precision": "fp4", + "status": "FAILED", + "steady": { + "duration_sec": 358.09705093, + "samples": 21, + "avg_temp_c": 70.57142857142857, + "p95_temp_c": 73, + "avg_power_w": 445.0742857142856, + "p95_power_w": 523.65, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 85.71428571428571, + "avg_mem_usage_pct": 25.238095238095237, + "clock_cv_pct": 0, + "power_cv_pct": 36.13635716216825, + "temp_cv_pct": 7.232889174554178, + "clock_drift_pct": 0 + }, + "ecc": { + "corrected": 0, + "uncorrected": 0 + }, + "notes": "precision phase failed" + } + ], + "precision_failures": [ + "fp64:FAILED", + "fp4:FAILED" + ], + "cooldown": { + "duration_sec": 0, + "samples": 0, + "avg_temp_c": 0, + "p95_temp_c": 0, + "avg_power_w": 0, + "p95_power_w": 0, + "avg_graphics_clock_mhz": 0, + "p95_graphics_clock_mhz": 0, + "avg_memory_clock_mhz": 0, + "p95_memory_clock_mhz": 0, + "avg_usage_pct": 0, + "avg_mem_usage_pct": 0, + "clock_cv_pct": 0, + "power_cv_pct": 0, + "temp_cv_pct": 0, + "clock_drift_pct": 0 + }, + "throttle_counters": { + "sw_power_cap_us": 0, + "sw_thermal_slowdown_us": 0, + "sync_boost_us": 0, + "hw_thermal_slowdown_us": 0, + "hw_power_brake_slowdown_us": 0 + }, + "ecc": { + "corrected": 0, + "uncorrected": 0 + }, + "scores": { + "compute_score": 1286.5773759015594, + "synthetic_score": 1286.5773759015594, + "power_sustain_score": 72.43726631318134, + "thermal_sustain_score": 95.05128340694607, + "stability_score": 100, + "thermal_throttle_pct": 0, + "power_cap_throttle_pct": 0, + "temp_headroom_c": 36.3, + "interconnect_score": 3.93, + "server_quality_score": 90.24656491603822, + "composite_score": 1286.5773759015594 + }, + "notes": [ + "parallel warmup failed: exit status 1" + ] + }, + { + "index": 3, + "uuid": "GPU-c88562a9-54cd-c3cf-c3fc-ef6c68ce5228", + "name": "NVIDIA RTX PRO 6000 Blackwell Server Edition", + "bus_id": "00000000:4F:00.0", + "vbios": "98.02.67.00.0A", + "status": "PARTIAL", + "power_limit_w": 600, + "default_power_limit_w": 600, + "max_graphics_clock_mhz": 2430, + "max_memory_clock_mhz": 12481, + "locked_graphics_clock_mhz": 2430, + "locked_memory_clock_mhz": 12481, + "baseline": { + "duration_sec": 15.849643133, + "samples": 4, + "avg_temp_c": 57.5, + "p95_temp_c": 58.85, + "avg_power_w": 93.04750000000001, + "p95_power_w": 95.244, + "avg_graphics_clock_mhz": 2426, + "p95_graphics_clock_mhz": 2430, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 0, + "avg_mem_usage_pct": 0, + "clock_cv_pct": 0.16488046166529266, + "power_cv_pct": 1.7541716203548638, + "temp_cv_pct": 1.9444069369563388, + "clock_drift_pct": 0 + }, + "steady": { + "duration_sec": 373.111930521, + "samples": 4, + "avg_temp_c": 53.75, + "p95_temp_c": 54.85, + "avg_power_w": 90.64500000000001, + "p95_power_w": 91.8855, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 0, + "avg_mem_usage_pct": 0, + "clock_cv_pct": 0, + "power_cv_pct": 1.0070181373890594, + "temp_cv_pct": 1.542616181560651, + "clock_drift_pct": 0 + }, + "precision_steady": [ + { + "precision": "int8", + "status": "OK", + "steady": { + "duration_sec": 59.248277208, + "samples": 17, + "avg_temp_c": 73.41176470588235, + "p95_temp_c": 76.2, + "avg_power_w": 531.6388235294116, + "p95_power_w": 560.468, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 99.70588235294117, + "avg_mem_usage_pct": 38.88235294117647, + "clock_cv_pct": 0, + "power_cv_pct": 17.55567073201338, + "temp_cv_pct": 6.441231253353008, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 1309.9208810692608, + "weighted_teraops_per_sec": 327.4802202673152, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + }, + { + "precision": "fp8", + "status": "OK", + "steady": { + "duration_sec": 114.243796414, + "samples": 22, + "avg_temp_c": 75.86363636363636, + "p95_temp_c": 76, + "avg_power_w": 542.4795454545455, + "p95_power_w": 560.0174999999999, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 29.90909090909091, + "clock_cv_pct": 0, + "power_cv_pct": 3.5091137269134984, + "temp_cv_pct": 0.4523567666429449, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 923.749016666112, + "weighted_teraops_per_sec": 230.937254166528, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + }, + { + "precision": "fp16", + "status": "OK", + "steady": { + "duration_sec": 176.160171192, + "samples": 13, + "avg_temp_c": 74.6923076923077, + "p95_temp_c": 75, + "avg_power_w": 523.6015384615384, + "p95_power_w": 531.63, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 23.307692307692307, + "clock_cv_pct": 0, + "power_cv_pct": 0.9847290970046302, + "temp_cv_pct": 0.6179196704428425, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 607.5168247338326, + "weighted_teraops_per_sec": 303.7584123669163, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + }, + { + "precision": "fp32", + "status": "OK", + "steady": { + "duration_sec": 239.404420095, + "samples": 21, + "avg_temp_c": 74.85714285714286, + "p95_temp_c": 75, + "avg_power_w": 531.0157142857142, + "p95_power_w": 533.06, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 33.285714285714285, + "clock_cv_pct": 0, + "power_cv_pct": 0.5795811485328938, + "temp_cv_pct": 0.4674598745769424, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 424.4014891008, + "weighted_teraops_per_sec": 424.4014891008, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + }, + { + "precision": "fp64", + "status": "FAILED", + "steady": { + "duration_sec": 299.580549419, + "samples": 17, + "avg_temp_c": 74, + "p95_temp_c": 74, + "avg_power_w": 524.1370588235294, + "p95_power_w": 525.092, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 32.35294117647059, + "clock_cv_pct": 0, + "power_cv_pct": 0.13435809987867442, + "temp_cv_pct": 0, + "clock_drift_pct": 0 + }, + "ecc": { + "corrected": 0, + "uncorrected": 0 + }, + "notes": "precision phase failed" + }, + { + "precision": "fp4", + "status": "FAILED", + "steady": { + "duration_sec": 358.09705093, + "samples": 21, + "avg_temp_c": 71.61904761904762, + "p95_temp_c": 74, + "avg_power_w": 445.3409523809524, + "p95_power_w": 524.91, + "avg_graphics_clock_mhz": 2422.7619047619046, + "p95_graphics_clock_mhz": 2430, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 85.71428571428571, + "avg_mem_usage_pct": 26.238095238095237, + "clock_cv_pct": 0.096928558559204, + "power_cv_pct": 36.55528196225396, + "temp_cv_pct": 6.967755189526102, + "clock_drift_pct": 0 + }, + "ecc": { + "corrected": 0, + "uncorrected": 0 + }, + "notes": "precision phase failed" + } + ], + "precision_failures": [ + "fp64:FAILED", + "fp4:FAILED" + ], + "cooldown": { + "duration_sec": 0, + "samples": 0, + "avg_temp_c": 0, + "p95_temp_c": 0, + "avg_power_w": 0, + "p95_power_w": 0, + "avg_graphics_clock_mhz": 0, + "p95_graphics_clock_mhz": 0, + "avg_memory_clock_mhz": 0, + "p95_memory_clock_mhz": 0, + "avg_usage_pct": 0, + "avg_mem_usage_pct": 0, + "clock_cv_pct": 0, + "power_cv_pct": 0, + "temp_cv_pct": 0, + "clock_drift_pct": 0 + }, + "throttle_counters": { + "sw_power_cap_us": 0, + "sw_thermal_slowdown_us": 0, + "sync_boost_us": 0, + "hw_thermal_slowdown_us": 0, + "hw_power_brake_slowdown_us": 0 + }, + "ecc": { + "corrected": 0, + "uncorrected": 0 + }, + "scores": { + "compute_score": 1286.5773759015594, + "synthetic_score": 1286.5773759015594, + "power_sustain_score": 71.95160693116179, + "thermal_sustain_score": 95.37215145531805, + "stability_score": 100, + "thermal_throttle_pct": 0, + "power_cap_throttle_pct": 0, + "temp_headroom_c": 35.15, + "interconnect_score": 3.93, + "server_quality_score": 90.19712751594395, + "composite_score": 1286.5773759015594 + }, + "notes": [ + "parallel warmup failed: exit status 1" + ] + }, + { + "index": 4, + "uuid": "GPU-19d64ace-f127-d9a8-1999-ffe37453b930", + "name": "NVIDIA RTX PRO 6000 Blackwell Server Edition", + "bus_id": "00000000:CB:00.0", + "vbios": "98.02.67.00.0A", + "status": "PARTIAL", + "power_limit_w": 600, + "default_power_limit_w": 600, + "max_graphics_clock_mhz": 2430, + "max_memory_clock_mhz": 12481, + "locked_graphics_clock_mhz": 2430, + "locked_memory_clock_mhz": 12481, + "baseline": { + "duration_sec": 15.849643133, + "samples": 4, + "avg_temp_c": 53.75, + "p95_temp_c": 55.7, + "avg_power_w": 91.32, + "p95_power_w": 92.6295, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 0, + "avg_mem_usage_pct": 0, + "clock_cv_pct": 0, + "power_cv_pct": 1.077804406758076, + "temp_cv_pct": 2.75166501539517, + "clock_drift_pct": 0 + }, + "steady": { + "duration_sec": 373.111930521, + "samples": 4, + "avg_temp_c": 48.75, + "p95_temp_c": 49.85, + "avg_power_w": 87.87, + "p95_power_w": 88.926, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 0, + "avg_mem_usage_pct": 0, + "clock_cv_pct": 0, + "power_cv_pct": 0.8673066522479822, + "temp_cv_pct": 1.700833225823282, + "clock_drift_pct": 0 + }, + "precision_steady": [ + { + "precision": "int8", + "status": "OK", + "steady": { + "duration_sec": 59.248277208, + "samples": 17, + "avg_temp_c": 67.3529411764706, + "p95_temp_c": 70.2, + "avg_power_w": 517.0629411764705, + "p95_power_w": 547.5780000000001, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 94.11764705882354, + "avg_mem_usage_pct": 36.705882352941174, + "clock_cv_pct": 0, + "power_cv_pct": 20.706808896232186, + "temp_cv_pct": 8.67139401257915, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 1309.5066113409025, + "weighted_teraops_per_sec": 327.3766528352256, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + }, + { + "precision": "fp8", + "status": "OK", + "steady": { + "duration_sec": 114.243796414, + "samples": 22, + "avg_temp_c": 69.86363636363636, + "p95_temp_c": 70, + "avg_power_w": 516.8804545454545, + "p95_power_w": 546.919, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 29.90909090909091, + "clock_cv_pct": 0, + "power_cv_pct": 12.638970766807272, + "temp_cv_pct": 0.4912058838822869, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 923.749016666112, + "weighted_teraops_per_sec": 230.937254166528, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + }, + { + "precision": "fp16", + "status": "OK", + "steady": { + "duration_sec": 176.160171192, + "samples": 13, + "avg_temp_c": 68.76923076923077, + "p95_temp_c": 69, + "avg_power_w": 511.02461538461534, + "p95_power_w": 518.8140000000001, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 23.307692307692307, + "clock_cv_pct": 0, + "power_cv_pct": 0.9994438912853532, + "temp_cv_pct": 0.6126650531377696, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 607.5168247338326, + "weighted_teraops_per_sec": 303.7584123669163, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + }, + { + "precision": "fp32", + "status": "OK", + "steady": { + "duration_sec": 239.404420095, + "samples": 21, + "avg_temp_c": 69, + "p95_temp_c": 69, + "avg_power_w": 518.3838095238094, + "p95_power_w": 520.48, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 32.714285714285715, + "clock_cv_pct": 0, + "power_cv_pct": 0.5866792968543877, + "temp_cv_pct": 0, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 424.4014891008, + "weighted_teraops_per_sec": 424.4014891008, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + }, + { + "precision": "fp64", + "status": "FAILED", + "steady": { + "duration_sec": 299.580549419, + "samples": 17, + "avg_temp_c": 69, + "p95_temp_c": 69, + "avg_power_w": 511.9747058823529, + "p95_power_w": 513.6460000000001, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 32.294117647058826, + "clock_cv_pct": 0, + "power_cv_pct": 0.17039663044581294, + "temp_cv_pct": 0, + "clock_drift_pct": 0 + }, + "ecc": { + "corrected": 0, + "uncorrected": 0 + }, + "notes": "precision phase failed" + }, + { + "precision": "fp4", + "status": "FAILED", + "steady": { + "duration_sec": 358.09705093, + "samples": 21, + "avg_temp_c": 66.71428571428571, + "p95_temp_c": 69, + "avg_power_w": 445.00666666666666, + "p95_power_w": 514.14, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 80.95238095238095, + "avg_mem_usage_pct": 26.38095238095238, + "clock_cv_pct": 0, + "power_cv_pct": 33.13978733208857, + "temp_cv_pct": 7.168385400007874, + "clock_drift_pct": 0 + }, + "ecc": { + "corrected": 0, + "uncorrected": 0 + }, + "notes": "precision phase failed" + } + ], + "precision_failures": [ + "fp64:FAILED", + "fp4:FAILED" + ], + "cooldown": { + "duration_sec": 0, + "samples": 0, + "avg_temp_c": 0, + "p95_temp_c": 0, + "avg_power_w": 0, + "p95_power_w": 0, + "avg_graphics_clock_mhz": 0, + "p95_graphics_clock_mhz": 0, + "avg_memory_clock_mhz": 0, + "p95_memory_clock_mhz": 0, + "avg_usage_pct": 0, + "avg_mem_usage_pct": 0, + "clock_cv_pct": 0, + "power_cv_pct": 0, + "temp_cv_pct": 0, + "clock_drift_pct": 0 + }, + "throttle_counters": { + "sw_power_cap_us": 0, + "sw_thermal_slowdown_us": 0, + "sync_boost_us": 0, + "hw_thermal_slowdown_us": 0, + "hw_power_brake_slowdown_us": 0 + }, + "ecc": { + "corrected": 0, + "uncorrected": 0 + }, + "scores": { + "compute_score": 1286.47380846947, + "synthetic_score": 1286.47380846947, + "power_sustain_score": 65.8789565931432, + "thermal_sustain_score": 94.89750032253015, + "stability_score": 100, + "thermal_throttle_pct": 0, + "power_cap_throttle_pct": 0, + "temp_headroom_c": 40.15, + "interconnect_score": 3.93, + "server_quality_score": 88.23293707470201, + "composite_score": 1286.47380846947 + }, + "notes": [ + "parallel warmup failed: exit status 1" + ] + }, + { + "index": 5, + "uuid": "GPU-8d5d3b52-6221-c572-e4dc-3eb34699d5a4", + "name": "NVIDIA RTX PRO 6000 Blackwell Server Edition", + "bus_id": "00000000:CC:00.0", + "vbios": "98.02.67.00.0A", + "status": "PARTIAL", + "power_limit_w": 600, + "default_power_limit_w": 600, + "max_graphics_clock_mhz": 2430, + "max_memory_clock_mhz": 12481, + "locked_graphics_clock_mhz": 2430, + "locked_memory_clock_mhz": 12481, + "baseline": { + "duration_sec": 15.849643133, + "samples": 4, + "avg_temp_c": 55.75, + "p95_temp_c": 57.7, + "avg_power_w": 94.8075, + "p95_power_w": 96.23949999999999, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 0, + "avg_mem_usage_pct": 0, + "clock_cv_pct": 0, + "power_cv_pct": 1.2016816336494958, + "temp_cv_pct": 2.6529505753809937, + "clock_drift_pct": 0 + }, + "steady": { + "duration_sec": 373.111930521, + "samples": 4, + "avg_temp_c": 51.75, + "p95_temp_c": 52.85, + "avg_power_w": 91.56500000000001, + "p95_power_w": 92.773, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 0, + "avg_mem_usage_pct": 0, + "clock_cv_pct": 0, + "power_cv_pct": 1.0024481033157138, + "temp_cv_pct": 1.6022341982393236, + "clock_drift_pct": 0 + }, + "precision_steady": [ + { + "precision": "int8", + "status": "OK", + "steady": { + "duration_sec": 59.248277208, + "samples": 17, + "avg_temp_c": 70.70588235294117, + "p95_temp_c": 74, + "avg_power_w": 525.3429411764706, + "p95_power_w": 559.22, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 94.11764705882354, + "avg_mem_usage_pct": 36.705882352941174, + "clock_cv_pct": 0, + "power_cv_pct": 20.72463101487948, + "temp_cv_pct": 8.795845351101212, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 1309.9208810692608, + "weighted_teraops_per_sec": 327.4802202673152, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + }, + { + "precision": "fp8", + "status": "OK", + "steady": { + "duration_sec": 114.243796414, + "samples": 22, + "avg_temp_c": 73, + "p95_temp_c": 73, + "avg_power_w": 527.6845454545455, + "p95_power_w": 558.0785000000001, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 29.90909090909091, + "clock_cv_pct": 0, + "power_cv_pct": 12.657841089839653, + "temp_cv_pct": 0, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 923.749016666112, + "weighted_teraops_per_sec": 230.937254166528, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + }, + { + "precision": "fp16", + "status": "OK", + "steady": { + "duration_sec": 176.160171192, + "samples": 13, + "avg_temp_c": 71.84615384615384, + "p95_temp_c": 73, + "avg_power_w": 520.23, + "p95_power_w": 524.516, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 23.307692307692307, + "clock_cv_pct": 0, + "power_cv_pct": 0.5328033905788797, + "temp_cv_pct": 0.9210198358718016, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 607.5168247338326, + "weighted_teraops_per_sec": 303.7584123669163, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + }, + { + "precision": "fp32", + "status": "OK", + "steady": { + "duration_sec": 239.404420095, + "samples": 21, + "avg_temp_c": 71.76190476190476, + "p95_temp_c": 72, + "avg_power_w": 523.4190476190478, + "p95_power_w": 525.7, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 32.57142857142857, + "clock_cv_pct": 0, + "power_cv_pct": 0.7127917296632327, + "temp_cv_pct": 0.5935150570669648, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 424.4014891008, + "weighted_teraops_per_sec": 424.4014891008, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + }, + { + "precision": "fp64", + "status": "FAILED", + "steady": { + "duration_sec": 299.580549419, + "samples": 17, + "avg_temp_c": 71, + "p95_temp_c": 71, + "avg_power_w": 516.5452941176471, + "p95_power_w": 517.524, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 31.705882352941178, + "clock_cv_pct": 0, + "power_cv_pct": 0.12728811595850442, + "temp_cv_pct": 0, + "clock_drift_pct": 0 + }, + "ecc": { + "corrected": 0, + "uncorrected": 0 + }, + "notes": "precision phase failed" + }, + { + "precision": "fp4", + "status": "FAILED", + "steady": { + "duration_sec": 358.09705093, + "samples": 21, + "avg_temp_c": 68.76190476190476, + "p95_temp_c": 71, + "avg_power_w": 454.16999999999996, + "p95_power_w": 517.4, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 82.38095238095238, + "avg_mem_usage_pct": 26.857142857142858, + "clock_cv_pct": 0, + "power_cv_pct": 31.52423033829762, + "temp_cv_pct": 6.863995397985521, + "clock_drift_pct": 0 + }, + "ecc": { + "corrected": 0, + "uncorrected": 0 + }, + "notes": "precision phase failed" + } + ], + "precision_failures": [ + "fp64:FAILED", + "fp4:FAILED" + ], + "cooldown": { + "duration_sec": 0, + "samples": 0, + "avg_temp_c": 0, + "p95_temp_c": 0, + "avg_power_w": 0, + "p95_power_w": 0, + "avg_graphics_clock_mhz": 0, + "p95_graphics_clock_mhz": 0, + "avg_memory_clock_mhz": 0, + "p95_memory_clock_mhz": 0, + "avg_usage_pct": 0, + "avg_mem_usage_pct": 0, + "clock_cv_pct": 0, + "power_cv_pct": 0, + "temp_cv_pct": 0, + "clock_drift_pct": 0 + }, + "throttle_counters": { + "sw_power_cap_us": 0, + "sw_thermal_slowdown_us": 0, + "sync_boost_us": 0, + "hw_thermal_slowdown_us": 0, + "hw_power_brake_slowdown_us": 0 + }, + "ecc": { + "corrected": 0, + "uncorrected": 0 + }, + "scores": { + "compute_score": 1286.5773759015594, + "synthetic_score": 1286.5773759015594, + "power_sustain_score": 66.86020716039133, + "thermal_sustain_score": 95.19329740528202, + "stability_score": 100, + "thermal_throttle_pct": 0, + "power_cap_throttle_pct": 0, + "temp_headroom_c": 37.15, + "interconnect_score": 3.93, + "server_quality_score": 88.616051369702, + "composite_score": 1286.5773759015594 + }, + "notes": [ + "parallel warmup failed: exit status 1" + ] + }, + { + "index": 6, + "uuid": "GPU-a23c67ec-a8e2-7ebf-2593-79d73ec889a6", + "name": "NVIDIA RTX PRO 6000 Blackwell Server Edition", + "bus_id": "00000000:CE:00.0", + "vbios": "98.02.67.00.0A", + "status": "PARTIAL", + "power_limit_w": 600, + "default_power_limit_w": 600, + "max_graphics_clock_mhz": 2430, + "max_memory_clock_mhz": 12481, + "locked_graphics_clock_mhz": 2430, + "locked_memory_clock_mhz": 12481, + "baseline": { + "duration_sec": 15.849643133, + "samples": 4, + "avg_temp_c": 55.5, + "p95_temp_c": 56.85, + "avg_power_w": 97.43, + "p95_power_w": 104.186, + "avg_graphics_clock_mhz": 1876.5, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 0, + "avg_mem_usage_pct": 0, + "clock_cv_pct": 50.350850814219164, + "power_cv_pct": 4.96066081944206, + "temp_cv_pct": 2.0144756554052163, + "clock_drift_pct": 0 + }, + "steady": { + "duration_sec": 373.111930521, + "samples": 4, + "avg_temp_c": 50.75, + "p95_temp_c": 51.85, + "avg_power_w": 91.47749999999999, + "p95_power_w": 92.5095, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 0, + "avg_mem_usage_pct": 0, + "clock_cv_pct": 0, + "power_cv_pct": 0.808327874380238, + "temp_cv_pct": 1.63380531544601, + "clock_drift_pct": 0 + }, + "precision_steady": [ + { + "precision": "int8", + "status": "OK", + "steady": { + "duration_sec": 59.248277208, + "samples": 17, + "avg_temp_c": 68.88235294117646, + "p95_temp_c": 72, + "avg_power_w": 517.9229411764705, + "p95_power_w": 548.558, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 94.11764705882354, + "avg_mem_usage_pct": 36.705882352941174, + "clock_cv_pct": 0, + "power_cv_pct": 20.667662016727217, + "temp_cv_pct": 8.836020696668033, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 1309.9208810692608, + "weighted_teraops_per_sec": 327.4802202673152, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + }, + { + "precision": "fp8", + "status": "OK", + "steady": { + "duration_sec": 114.243796414, + "samples": 22, + "avg_temp_c": 71, + "p95_temp_c": 71, + "avg_power_w": 521.1122727272727, + "p95_power_w": 548.4375, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 98.77272727272727, + "avg_mem_usage_pct": 29.90909090909091, + "clock_cv_pct": 0, + "power_cv_pct": 10.254259721288367, + "temp_cv_pct": 0, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 923.749016666112, + "weighted_teraops_per_sec": 230.937254166528, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + }, + { + "precision": "fp16", + "status": "OK", + "steady": { + "duration_sec": 176.160171192, + "samples": 13, + "avg_temp_c": 70.53846153846153, + "p95_temp_c": 71, + "avg_power_w": 512.773076923077, + "p95_power_w": 520.924, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 23.307692307692307, + "clock_cv_pct": 0, + "power_cv_pct": 1.012015246221984, + "temp_cv_pct": 0.7067329005897339, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 607.5168247338326, + "weighted_teraops_per_sec": 303.7584123669163, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + }, + { + "precision": "fp32", + "status": "OK", + "steady": { + "duration_sec": 239.404420095, + "samples": 21, + "avg_temp_c": 70.42857142857143, + "p95_temp_c": 71, + "avg_power_w": 519.8085714285714, + "p95_power_w": 522.03, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 32.95238095238095, + "clock_cv_pct": 0, + "power_cv_pct": 0.6870226571499158, + "temp_cv_pct": 0.702657528425508, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 424.4014891008, + "weighted_teraops_per_sec": 424.4014891008, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + }, + { + "precision": "fp64", + "status": "FAILED", + "steady": { + "duration_sec": 299.580549419, + "samples": 17, + "avg_temp_c": 70, + "p95_temp_c": 70, + "avg_power_w": 512.3382352941177, + "p95_power_w": 514.47, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 32.64705882352941, + "clock_cv_pct": 0, + "power_cv_pct": 0.2509119157816844, + "temp_cv_pct": 0, + "clock_drift_pct": 0 + }, + "ecc": { + "corrected": 0, + "uncorrected": 0 + }, + "notes": "precision phase failed" + }, + { + "precision": "fp4", + "status": "FAILED", + "steady": { + "duration_sec": 358.09705093, + "samples": 21, + "avg_temp_c": 67.76190476190476, + "p95_temp_c": 70, + "avg_power_w": 451.6680952380952, + "p95_power_w": 514.65, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 84.76190476190476, + "avg_mem_usage_pct": 27.476190476190474, + "clock_cv_pct": 0, + "power_cv_pct": 31.429038464368887, + "temp_cv_pct": 6.965291183900979, + "clock_drift_pct": 0 + }, + "ecc": { + "corrected": 0, + "uncorrected": 0 + }, + "notes": "precision phase failed" + } + ], + "precision_failures": [ + "fp64:FAILED", + "fp4:FAILED" + ], + "cooldown": { + "duration_sec": 0, + "samples": 0, + "avg_temp_c": 0, + "p95_temp_c": 0, + "avg_power_w": 0, + "p95_power_w": 0, + "avg_graphics_clock_mhz": 0, + "p95_graphics_clock_mhz": 0, + "avg_memory_clock_mhz": 0, + "p95_memory_clock_mhz": 0, + "avg_usage_pct": 0, + "avg_mem_usage_pct": 0, + "clock_cv_pct": 0, + "power_cv_pct": 0, + "temp_cv_pct": 0, + "clock_drift_pct": 0 + }, + "throttle_counters": { + "sw_power_cap_us": 0, + "sw_thermal_slowdown_us": 0, + "sync_boost_us": 0, + "hw_thermal_slowdown_us": 0, + "hw_power_brake_slowdown_us": 0 + }, + "ecc": { + "corrected": 0, + "uncorrected": 0 + }, + "scores": { + "compute_score": 1286.5773759015594, + "synthetic_score": 1286.5773759015594, + "power_sustain_score": 67.84954498923098, + "thermal_sustain_score": 95.09858405366197, + "stability_score": 100, + "thermal_throttle_pct": 0, + "power_cap_throttle_pct": 0, + "temp_headroom_c": 38.15, + "interconnect_score": 3.93, + "server_quality_score": 88.88443871286789, + "composite_score": 1286.5773759015594 + }, + "notes": [ + "parallel warmup failed: exit status 1" + ] + }, + { + "index": 7, + "uuid": "GPU-f9d537b7-86a1-407c-c137-3bc30fb8c2e8", + "name": "NVIDIA RTX PRO 6000 Blackwell Server Edition", + "bus_id": "00000000:CF:00.0", + "vbios": "98.02.67.00.0A", + "status": "PARTIAL", + "power_limit_w": 600, + "default_power_limit_w": 600, + "max_graphics_clock_mhz": 2430, + "max_memory_clock_mhz": 12481, + "locked_graphics_clock_mhz": 2430, + "locked_memory_clock_mhz": 12481, + "baseline": { + "duration_sec": 15.849643133, + "samples": 4, + "avg_temp_c": 56.75, + "p95_temp_c": 58, + "avg_power_w": 82.74249999999999, + "p95_power_w": 92.2765, + "avg_graphics_clock_mhz": 1861.5, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 0, + "avg_mem_usage_pct": 0, + "clock_cv_pct": 52.152268473937994, + "power_cv_pct": 19.097161530659708, + "temp_cv_pct": 2.2890539307077673, + "clock_drift_pct": 0 + }, + "steady": { + "duration_sec": 373.111930521, + "samples": 4, + "avg_temp_c": 52.5, + "p95_temp_c": 53.7, + "avg_power_w": 89.30749999999999, + "p95_power_w": 90.23949999999999, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 0, + "avg_mem_usage_pct": 0, + "clock_cv_pct": 0, + "power_cv_pct": 0.7464629460625359, + "temp_cv_pct": 1.649572197684645, + "clock_drift_pct": 0 + }, + "precision_steady": [ + { + "precision": "int8", + "status": "OK", + "steady": { + "duration_sec": 59.248277208, + "samples": 17, + "avg_temp_c": 70.76470588235294, + "p95_temp_c": 74, + "avg_power_w": 518.3476470588236, + "p95_power_w": 549.02, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 94.11764705882354, + "avg_mem_usage_pct": 37.64705882352941, + "clock_cv_pct": 0, + "power_cv_pct": 20.73285229327504, + "temp_cv_pct": 8.541324100724525, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 1309.9208810692608, + "weighted_teraops_per_sec": 327.4802202673152, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + }, + { + "precision": "fp8", + "status": "OK", + "steady": { + "duration_sec": 114.243796414, + "samples": 22, + "avg_temp_c": 73, + "p95_temp_c": 73, + "avg_power_w": 521.6977272727272, + "p95_power_w": 548.938, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 30.454545454545453, + "clock_cv_pct": 0, + "power_cv_pct": 9.827197312111167, + "temp_cv_pct": 0, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 923.749016666112, + "weighted_teraops_per_sec": 230.937254166528, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + }, + { + "precision": "fp16", + "status": "OK", + "steady": { + "duration_sec": 176.160171192, + "samples": 13, + "avg_temp_c": 72.15384615384616, + "p95_temp_c": 73, + "avg_power_w": 512.693076923077, + "p95_power_w": 520.216, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 23.923076923076923, + "clock_cv_pct": 0, + "power_cv_pct": 0.954148965153683, + "temp_cv_pct": 0.7386144168737215, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 607.5168247338326, + "weighted_teraops_per_sec": 303.7584123669163, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + }, + { + "precision": "fp32", + "status": "OK", + "steady": { + "duration_sec": 239.404420095, + "samples": 21, + "avg_temp_c": 72, + "p95_temp_c": 72, + "avg_power_w": 519.4690476190476, + "p95_power_w": 521.45, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 34.42857142857143, + "clock_cv_pct": 0, + "power_cv_pct": 0.648538387021549, + "temp_cv_pct": 0, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 424.4014891008, + "weighted_teraops_per_sec": 424.4014891008, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + }, + { + "precision": "fp64", + "status": "FAILED", + "steady": { + "duration_sec": 299.580549419, + "samples": 17, + "avg_temp_c": 72, + "p95_temp_c": 72, + "avg_power_w": 512.9158823529411, + "p95_power_w": 514.176, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 32.11764705882353, + "clock_cv_pct": 0, + "power_cv_pct": 0.1693223361361277, + "temp_cv_pct": 0, + "clock_drift_pct": 0 + }, + "ecc": { + "corrected": 0, + "uncorrected": 0 + }, + "notes": "precision phase failed" + }, + { + "precision": "fp4", + "status": "FAILED", + "steady": { + "duration_sec": 358.09705093, + "samples": 21, + "avg_temp_c": 69.71428571428571, + "p95_temp_c": 72, + "avg_power_w": 449.73476190476185, + "p95_power_w": 514.03, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 80.95238095238095, + "avg_mem_usage_pct": 25.476190476190474, + "clock_cv_pct": 0, + "power_cv_pct": 32.36223879879783, + "temp_cv_pct": 6.859909798778027, + "clock_drift_pct": 0 + }, + "ecc": { + "corrected": 0, + "uncorrected": 0 + }, + "notes": "precision phase failed" + } + ], + "precision_failures": [ + "fp64:FAILED", + "fp4:FAILED" + ], + "cooldown": { + "duration_sec": 0, + "samples": 0, + "avg_temp_c": 0, + "p95_temp_c": 0, + "avg_power_w": 0, + "p95_power_w": 0, + "avg_graphics_clock_mhz": 0, + "p95_graphics_clock_mhz": 0, + "avg_memory_clock_mhz": 0, + "p95_memory_clock_mhz": 0, + "avg_usage_pct": 0, + "avg_mem_usage_pct": 0, + "clock_cv_pct": 0, + "power_cv_pct": 0, + "temp_cv_pct": 0, + "clock_drift_pct": 0 + }, + "throttle_counters": { + "sw_power_cap_us": 0, + "sw_thermal_slowdown_us": 0, + "sync_boost_us": 0, + "hw_thermal_slowdown_us": 0, + "hw_power_brake_slowdown_us": 0 + }, + "ecc": { + "corrected": 0, + "uncorrected": 0 + }, + "scores": { + "compute_score": 1286.5773759015594, + "synthetic_score": 1286.5773759015594, + "power_sustain_score": 67.65285095375229, + "thermal_sustain_score": 95.05128340694607, + "stability_score": 100, + "thermal_throttle_pct": 0, + "power_cap_throttle_pct": 0, + "temp_headroom_c": 36.3, + "interconnect_score": 3.93, + "server_quality_score": 88.8112403082095, + "composite_score": 1286.5773759015594 + }, + "notes": [ + "parallel warmup failed: exit status 1" + ] + } + ], + "interconnect": { + "status": "OK", + "attempted": true, + "supported": true, + "selected_gpu_indices": [ + 0, + 1, + 2, + 3, + 4, + 5, + 6, + 7 + ], + "avg_algbw_gbps": 2.2150000000000003, + "max_algbw_gbps": 2.25, + "avg_busbw_gbps": 3.8725, + "max_busbw_gbps": 3.93 + }, + "server_power": { + "available": false, + "notes": [ + "IPMI power reading unavailable; server-side power characterization skipped" + ] + } +} \ No newline at end of file diff --git a/perf/perf-20260416-231014/result.json b/perf/perf-20260416-231014/result.json new file mode 100644 index 0000000..af74918 --- /dev/null +++ b/perf/perf-20260416-231014/result.json @@ -0,0 +1,2378 @@ +{ + "benchmark_version": "2", + "generated_at": "2026-04-16T23:10:14.868165987Z", + "hostname": "debian", + "server_model": "G5500 V7", + "benchmark_profile": "stability", + "parallel_gpus": true, + "ramp_total": 8, + "ramp_run_id": "ramp-20260416-195801", + "overall_status": "OK", + "selected_gpu_indices": [ + 0, + 1, + 2, + 3, + 4, + 5, + 6, + 7 + ], + "findings": [ + "All 8 GPU(s) passed the benchmark.", + "GPU 0 held clocks without observable throttle counters during steady state.", + "GPU 1 held clocks without observable throttle counters during steady state.", + "GPU 2 held clocks without observable throttle counters during steady state.", + "GPU 3 held clocks without observable throttle counters during steady state.", + "GPU 4 held clocks without observable throttle counters during steady state.", + "GPU 5 held clocks without observable throttle counters during steady state.", + "GPU 6 held clocks without observable throttle counters during steady state.", + "GPU 7 held clocks without observable throttle counters during steady state.", + "Multi-GPU all_reduce max bus bandwidth: 3.9 GB/s." + ], + "normalization": { + "status": "full", + "gpus": [ + { + "index": 0, + "persistence_mode": "applied", + "gpu_clock_lock_mhz": 2430, + "gpu_clock_lock_status": "applied", + "memory_clock_lock_mhz": 12481, + "memory_clock_lock_status": "applied" + }, + { + "index": 1, + "persistence_mode": "applied", + "gpu_clock_lock_mhz": 2430, + "gpu_clock_lock_status": "applied", + "memory_clock_lock_mhz": 12481, + "memory_clock_lock_status": "applied" + }, + { + "index": 2, + "persistence_mode": "applied", + "gpu_clock_lock_mhz": 2430, + "gpu_clock_lock_status": "applied", + "memory_clock_lock_mhz": 12481, + "memory_clock_lock_status": "applied" + }, + { + "index": 3, + "persistence_mode": "applied", + "gpu_clock_lock_mhz": 2430, + "gpu_clock_lock_status": "applied", + "memory_clock_lock_mhz": 12481, + "memory_clock_lock_status": "applied" + }, + { + "index": 4, + "persistence_mode": "applied", + "gpu_clock_lock_mhz": 2430, + "gpu_clock_lock_status": "applied", + "memory_clock_lock_mhz": 12481, + "memory_clock_lock_status": "applied" + }, + { + "index": 5, + "persistence_mode": "applied", + "gpu_clock_lock_mhz": 2430, + "gpu_clock_lock_status": "applied", + "memory_clock_lock_mhz": 12481, + "memory_clock_lock_status": "applied" + }, + { + "index": 6, + "persistence_mode": "applied", + "gpu_clock_lock_mhz": 2430, + "gpu_clock_lock_status": "applied", + "memory_clock_lock_mhz": 12481, + "memory_clock_lock_status": "applied" + }, + { + "index": 7, + "persistence_mode": "applied", + "gpu_clock_lock_mhz": 2430, + "gpu_clock_lock_status": "applied", + "memory_clock_lock_mhz": 12481, + "memory_clock_lock_status": "applied" + } + ] + }, + "host_config": { + "cpu_model": "INTEL(R) XEON(R) GOLD 6530", + "cpu_sockets": 2, + "cpu_cores": 64, + "cpu_threads": 128, + "mem_total_gib": 125.36545181274414 + }, + "cpu_load": { + "avg_pct": 5.9, + "max_pct": 6.8, + "p95_pct": 6.5, + "samples": 547, + "status": "ok" + }, + "cooling": { + "available": true, + "avg_fan_rpm": 16157.092741935483, + "fan_duty_cycle_available": true, + "fan_duty_cycle_estimated": true, + "avg_fan_duty_cycle_pct": 95.04172201137726, + "p95_fan_duty_cycle_pct": 97.52316176470589, + "notes": [ + "fan duty cycle is estimated from the highest fan RPM observed since boot; treat it as an approximation, not a direct PWM reading" + ] + }, + "gpus": [ + { + "index": 0, + "uuid": "GPU-8281bc14-c076-e306-75b1-e91596be45e7", + "name": "NVIDIA RTX PRO 6000 Blackwell Server Edition", + "bus_id": "00000000:4B:00.0", + "vbios": "98.02.67.00.0A", + "compute_capability": "12.0", + "backend": "cublasLt", + "status": "OK", + "power_limit_w": 600, + "default_power_limit_w": 600, + "max_graphics_clock_mhz": 2430, + "max_memory_clock_mhz": 12481, + "locked_graphics_clock_mhz": 2430, + "locked_memory_clock_mhz": 12481, + "baseline": { + "duration_sec": 32.806791721, + "samples": 12, + "avg_temp_c": 53.083333333333336, + "p95_temp_c": 58.45, + "avg_power_w": 92.49833333333333, + "p95_power_w": 96.8575, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 0, + "avg_mem_usage_pct": 0, + "clock_cv_pct": 0, + "power_cv_pct": 2.8724058393529, + "temp_cv_pct": 6.02915678796594, + "clock_drift_pct": 0 + }, + "steady": { + "duration_sec": 5022.123737104, + "samples": 1332, + "avg_temp_c": 75.45495495495496, + "p95_temp_c": 77, + "avg_power_w": 526.1626201201198, + "p95_power_w": 539.029, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 97.75150150150151, + "avg_mem_usage_pct": 37.91591591591592, + "clock_cv_pct": 0, + "power_cv_pct": 12.247749716308393, + "temp_cv_pct": 4.44477036768478, + "clock_drift_pct": 0 + }, + "precision_steady": [ + { + "precision": "int8", + "status": "OK", + "steady": { + "duration_sec": 299.955727617, + "samples": 110, + "avg_temp_c": 74.04545454545455, + "p95_temp_c": 76, + "avg_power_w": 549.7471818181817, + "p95_power_w": 556.7, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 39, + "clock_cv_pct": 0, + "power_cv_pct": 5.058044906001502, + "temp_cv_pct": 4.154159865661651, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 964.2542197270119, + "weighted_teraops_per_sec": 241.06355493175298, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + }, + { + "precision": "fp8", + "status": "OK", + "steady": { + "duration_sec": 595.043677476, + "samples": 102, + "avg_temp_c": 73.73529411764706, + "p95_temp_c": 76, + "avg_power_w": 517.4978431372551, + "p95_power_w": 556.788, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 20.764705882352942, + "clock_cv_pct": 0, + "power_cv_pct": 3.2168734476255754, + "temp_cv_pct": 1.229656039940198, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 923.749016666112, + "weighted_teraops_per_sec": 230.937254166528, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + }, + { + "precision": "fp16", + "status": "OK", + "steady": { + "duration_sec": 899.295761287, + "samples": 101, + "avg_temp_c": 74.02970297029702, + "p95_temp_c": 75, + "avg_power_w": 527.580099009901, + "p95_power_w": 534.68, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 32.87128712871287, + "clock_cv_pct": 0, + "power_cv_pct": 1.3419154991125437, + "temp_cv_pct": 0.9777005153134719, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 486.013459787066, + "weighted_teraops_per_sec": 243.006729893533, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + }, + { + "precision": "fp32", + "status": "OK", + "steady": { + "duration_sec": 1199.663635317, + "samples": 106, + "avg_temp_c": 73.95283018867924, + "p95_temp_c": 75, + "avg_power_w": 518.3751886792452, + "p95_power_w": 532.47, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 31.42452830188679, + "clock_cv_pct": 0, + "power_cv_pct": 1.3201777141699222, + "temp_cv_pct": 0.8588794171201893, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 254.64089346048, + "weighted_teraops_per_sec": 254.64089346048, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + } + ], + "cooldown": { + "duration_sec": 0, + "samples": 0, + "avg_temp_c": 0, + "p95_temp_c": 0, + "avg_power_w": 0, + "p95_power_w": 0, + "avg_graphics_clock_mhz": 0, + "p95_graphics_clock_mhz": 0, + "avg_memory_clock_mhz": 0, + "p95_memory_clock_mhz": 0, + "avg_usage_pct": 0, + "avg_mem_usage_pct": 0, + "clock_cv_pct": 0, + "power_cv_pct": 0, + "temp_cv_pct": 0, + "clock_drift_pct": 0 + }, + "throttle_counters": { + "sw_power_cap_us": 0, + "sw_thermal_slowdown_us": 0, + "sync_boost_us": 0, + "hw_thermal_slowdown_us": 0, + "hw_power_brake_slowdown_us": 0 + }, + "ecc": { + "corrected": 0, + "uncorrected": 0 + }, + "precision_results": [ + { + "name": "fp16_tensor", + "category": "fp16_bf16", + "supported": true, + "lanes": 16, + "m": 11904, + "n": 11904, + "k": 11904, + "iterations": 171872, + "teraops_per_sec": 161.06878408851458, + "weight": 0.5, + "weighted_teraops_per_sec": 80.53439204425729 + }, + { + "name": "fp32_tf32", + "category": "fp32_tf32", + "supported": true, + "lanes": 16, + "m": 8320, + "n": 8320, + "k": 8320, + "iterations": 171872, + "teraops_per_sec": 54.99239122716445, + "weight": 1, + "weighted_teraops_per_sec": 54.99239122716445 + }, + { + "name": "fp64", + "category": "fp64", + "supported": false, + "weight": 2, + "notes": "benchmark_disabled" + }, + { + "name": "fp8_e4m3", + "category": "fp8", + "supported": true, + "lanes": 16, + "m": 13696, + "n": 13696, + "k": 13696, + "iterations": 171872, + "teraops_per_sec": 245.30921775548188, + "weight": 0.25, + "weighted_teraops_per_sec": 61.32730443887047 + }, + { + "name": "fp8_e5m2", + "category": "fp8", + "supported": false, + "weight": 0.25, + "notes": "unsupported" + }, + { + "name": "int8_tensor", + "category": "int8", + "supported": true, + "lanes": 16, + "m": 10624, + "n": 10624, + "k": 10624, + "iterations": 171872, + "teraops_per_sec": 114.4977128906934, + "weight": 0.25, + "weighted_teraops_per_sec": 28.62442822267335 + } + ], + "scores": { + "compute_score": 1037.2919872321836, + "synthetic_score": 969.648432452294, + "mixed_score": 225.47851593296554, + "mixed_efficiency": 0.2325363589385877, + "power_sustain_score": 91.79724132481785, + "thermal_sustain_score": 86.66568889694565, + "stability_score": 100, + "thermal_throttle_pct": 0, + "power_cap_throttle_pct": 0, + "temp_headroom_c": 13, + "interconnect_score": 3.93, + "server_quality_score": 93.53887906652905, + "composite_score": 1037.2919872321836 + } + }, + { + "index": 1, + "uuid": "GPU-a66d6d68-9870-dfe0-1823-b38a141c21ae", + "name": "NVIDIA RTX PRO 6000 Blackwell Server Edition", + "bus_id": "00000000:4C:00.0", + "vbios": "98.02.67.00.0A", + "compute_capability": "12.0", + "backend": "cublasLt", + "status": "OK", + "power_limit_w": 600, + "default_power_limit_w": 600, + "max_graphics_clock_mhz": 2430, + "max_memory_clock_mhz": 12481, + "locked_graphics_clock_mhz": 2430, + "locked_memory_clock_mhz": 12481, + "baseline": { + "duration_sec": 32.806791721, + "samples": 12, + "avg_temp_c": 54.916666666666664, + "p95_temp_c": 59.9, + "avg_power_w": 91.04166666666667, + "p95_power_w": 95.8445, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 0, + "avg_mem_usage_pct": 0, + "clock_cv_pct": 0, + "power_cv_pct": 3.041762596894583, + "temp_cv_pct": 5.683860637428844, + "clock_drift_pct": 0 + }, + "steady": { + "duration_sec": 5022.123737104, + "samples": 1332, + "avg_temp_c": 77.58708708708708, + "p95_temp_c": 79, + "avg_power_w": 530.0371996996989, + "p95_power_w": 543.06, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 97.83333333333333, + "avg_mem_usage_pct": 37.880630630630634, + "clock_cv_pct": 0, + "power_cv_pct": 12.195813371545908, + "temp_cv_pct": 4.304787715567299, + "clock_drift_pct": 0 + }, + "precision_steady": [ + { + "precision": "int8", + "status": "OK", + "steady": { + "duration_sec": 299.955727617, + "samples": 110, + "avg_temp_c": 75.33636363636364, + "p95_temp_c": 77, + "avg_power_w": 551.7380909090908, + "p95_power_w": 556.75, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 38.99090909090909, + "clock_cv_pct": 0, + "power_cv_pct": 4.671882444682097, + "temp_cv_pct": 3.7213044558828408, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 964.2542197270119, + "weighted_teraops_per_sec": 241.06355493175298, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + }, + { + "precision": "fp8", + "status": "OK", + "steady": { + "duration_sec": 595.043677476, + "samples": 102, + "avg_temp_c": 75.48039215686275, + "p95_temp_c": 77, + "avg_power_w": 517.6610784313726, + "p95_power_w": 556.6285, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 20.764705882352942, + "clock_cv_pct": 0, + "power_cv_pct": 4.687675431092306, + "temp_cv_pct": 0.9769194802688033, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 923.749016666112, + "weighted_teraops_per_sec": 230.937254166528, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + }, + { + "precision": "fp16", + "status": "OK", + "steady": { + "duration_sec": 899.295761287, + "samples": 101, + "avg_temp_c": 75.7128712871287, + "p95_temp_c": 76, + "avg_power_w": 527.5094059405941, + "p95_power_w": 529.96, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 31.198019801980198, + "clock_cv_pct": 0, + "power_cv_pct": 0.8673096238797479, + "temp_cv_pct": 0.5975498709975604, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 486.013459787066, + "weighted_teraops_per_sec": 243.006729893533, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + }, + { + "precision": "fp32", + "status": "OK", + "steady": { + "duration_sec": 1199.663635317, + "samples": 106, + "avg_temp_c": 75.37735849056604, + "p95_temp_c": 76, + "avg_power_w": 521.2533962264152, + "p95_power_w": 530.475, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 32.471698113207545, + "clock_cv_pct": 0, + "power_cv_pct": 2.1058044797610775, + "temp_cv_pct": 0.6430654607592049, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 254.64089346048, + "weighted_teraops_per_sec": 254.64089346048, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + } + ], + "cooldown": { + "duration_sec": 0, + "samples": 0, + "avg_temp_c": 0, + "p95_temp_c": 0, + "avg_power_w": 0, + "p95_power_w": 0, + "avg_graphics_clock_mhz": 0, + "p95_graphics_clock_mhz": 0, + "avg_memory_clock_mhz": 0, + "p95_memory_clock_mhz": 0, + "avg_usage_pct": 0, + "avg_mem_usage_pct": 0, + "clock_cv_pct": 0, + "power_cv_pct": 0, + "temp_cv_pct": 0, + "clock_drift_pct": 0 + }, + "throttle_counters": { + "sw_power_cap_us": 0, + "sw_thermal_slowdown_us": 0, + "sync_boost_us": 0, + "hw_thermal_slowdown_us": 0, + "hw_power_brake_slowdown_us": 0 + }, + "ecc": { + "corrected": 0, + "uncorrected": 0 + }, + "precision_results": [ + { + "name": "fp16_tensor", + "category": "fp16_bf16", + "supported": true, + "lanes": 16, + "m": 11904, + "n": 11904, + "k": 11904, + "iterations": 171872, + "teraops_per_sec": 161.06878408851458, + "weight": 0.5, + "weighted_teraops_per_sec": 80.53439204425729 + }, + { + "name": "fp32_tf32", + "category": "fp32_tf32", + "supported": true, + "lanes": 16, + "m": 8320, + "n": 8320, + "k": 8320, + "iterations": 171872, + "teraops_per_sec": 54.99239122716445, + "weight": 1, + "weighted_teraops_per_sec": 54.99239122716445 + }, + { + "name": "fp64", + "category": "fp64", + "supported": false, + "weight": 2, + "notes": "benchmark_disabled" + }, + { + "name": "fp8_e4m3", + "category": "fp8", + "supported": true, + "lanes": 16, + "m": 13696, + "n": 13696, + "k": 13696, + "iterations": 171872, + "teraops_per_sec": 245.30921775548188, + "weight": 0.25, + "weighted_teraops_per_sec": 61.32730443887047 + }, + { + "name": "fp8_e5m2", + "category": "fp8", + "supported": false, + "weight": 0.25, + "notes": "unsupported" + }, + { + "name": "int8_tensor", + "category": "int8", + "supported": true, + "lanes": 16, + "m": 10624, + "n": 10624, + "k": 10624, + "iterations": 171872, + "teraops_per_sec": 114.4977128906934, + "weight": 0.25, + "weighted_teraops_per_sec": 28.62442822267335 + } + ], + "scores": { + "compute_score": 1037.2919872321836, + "synthetic_score": 969.648432452294, + "mixed_score": 225.47851593296554, + "mixed_efficiency": 0.2325363589385877, + "power_sustain_score": 90.75049601543859, + "thermal_sustain_score": 87.0856368532981, + "stability_score": 100, + "thermal_throttle_pct": 0, + "power_cap_throttle_pct": 0, + "temp_headroom_c": 11, + "interconnect_score": 3.93, + "server_quality_score": 93.35083986062101, + "composite_score": 1037.2919872321836 + } + }, + { + "index": 2, + "uuid": "GPU-82b32f5b-5fca-9674-a845-cfd5da365d09", + "name": "NVIDIA RTX PRO 6000 Blackwell Server Edition", + "bus_id": "00000000:4E:00.0", + "vbios": "98.02.67.00.0A", + "compute_capability": "12.0", + "backend": "cublasLt", + "status": "OK", + "power_limit_w": 600, + "default_power_limit_w": 600, + "max_graphics_clock_mhz": 2430, + "max_memory_clock_mhz": 12481, + "locked_graphics_clock_mhz": 2430, + "locked_memory_clock_mhz": 12481, + "baseline": { + "duration_sec": 32.806791721, + "samples": 12, + "avg_temp_c": 54, + "p95_temp_c": 59.45, + "avg_power_w": 94.99666666666667, + "p95_power_w": 100.5915, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 0, + "avg_mem_usage_pct": 0, + "clock_cv_pct": 0, + "power_cv_pct": 3.413139568291253, + "temp_cv_pct": 6.00068583185913, + "clock_drift_pct": 0 + }, + "steady": { + "duration_sec": 5022.123737104, + "samples": 1332, + "avg_temp_c": 77.94444444444444, + "p95_temp_c": 79, + "avg_power_w": 543.9476201201205, + "p95_power_w": 557.4345, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 97.82432432432432, + "avg_mem_usage_pct": 38.81156156156156, + "clock_cv_pct": 0, + "power_cv_pct": 12.102264359957584, + "temp_cv_pct": 4.529681132735949, + "clock_drift_pct": 0 + }, + "precision_steady": [ + { + "precision": "int8", + "status": "OK", + "steady": { + "duration_sec": 299.955727617, + "samples": 110, + "avg_temp_c": 75.26363636363637, + "p95_temp_c": 77, + "avg_power_w": 561.4788181818179, + "p95_power_w": 569.951, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 99.13636363636364, + "avg_mem_usage_pct": 39.67272727272727, + "clock_cv_pct": 0, + "power_cv_pct": 7.286272250350883, + "temp_cv_pct": 4.7659675603039, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 964.2542197270119, + "weighted_teraops_per_sec": 241.06355493175298, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + }, + { + "precision": "fp8", + "status": "OK", + "steady": { + "duration_sec": 595.043677476, + "samples": 102, + "avg_temp_c": 75.69607843137256, + "p95_temp_c": 77, + "avg_power_w": 529.8692156862742, + "p95_power_w": 570.065, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 20.852941176470587, + "clock_cv_pct": 0, + "power_cv_pct": 4.303273134555031, + "temp_cv_pct": 1.0096505024062656, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 923.749016666112, + "weighted_teraops_per_sec": 230.937254166528, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + }, + { + "precision": "fp16", + "status": "OK", + "steady": { + "duration_sec": 899.295761287, + "samples": 101, + "avg_temp_c": 75.75247524752476, + "p95_temp_c": 76, + "avg_power_w": 539.7018811881187, + "p95_power_w": 542.44, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 32.94059405940594, + "clock_cv_pct": 0, + "power_cv_pct": 0.9032224896055815, + "temp_cv_pct": 0.5697162388629818, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 486.013459787066, + "weighted_teraops_per_sec": 243.006729893533, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + }, + { + "precision": "fp32", + "status": "OK", + "steady": { + "duration_sec": 1199.663635317, + "samples": 106, + "avg_temp_c": 76.14150943396227, + "p95_temp_c": 77, + "avg_power_w": 533.7768867924528, + "p95_power_w": 543.01, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 33.37735849056604, + "clock_cv_pct": 0, + "power_cv_pct": 1.7943284980016059, + "temp_cv_pct": 0.45776119940307747, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 254.64089346048, + "weighted_teraops_per_sec": 254.64089346048, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + } + ], + "cooldown": { + "duration_sec": 0, + "samples": 0, + "avg_temp_c": 0, + "p95_temp_c": 0, + "avg_power_w": 0, + "p95_power_w": 0, + "avg_graphics_clock_mhz": 0, + "p95_graphics_clock_mhz": 0, + "avg_memory_clock_mhz": 0, + "p95_memory_clock_mhz": 0, + "avg_usage_pct": 0, + "avg_mem_usage_pct": 0, + "clock_cv_pct": 0, + "power_cv_pct": 0, + "temp_cv_pct": 0, + "clock_drift_pct": 0 + }, + "throttle_counters": { + "sw_power_cap_us": 0, + "sw_thermal_slowdown_us": 0, + "sync_boost_us": 0, + "hw_thermal_slowdown_us": 0, + "hw_power_brake_slowdown_us": 0 + }, + "ecc": { + "corrected": 0, + "uncorrected": 0 + }, + "precision_results": [ + { + "name": "fp16_tensor", + "category": "fp16_bf16", + "supported": true, + "lanes": 16, + "m": 11904, + "n": 11904, + "k": 11904, + "iterations": 171872, + "teraops_per_sec": 161.06878408851458, + "weight": 0.5, + "weighted_teraops_per_sec": 80.53439204425729 + }, + { + "name": "fp32_tf32", + "category": "fp32_tf32", + "supported": true, + "lanes": 16, + "m": 8320, + "n": 8320, + "k": 8320, + "iterations": 171872, + "teraops_per_sec": 54.99239122716445, + "weight": 1, + "weighted_teraops_per_sec": 54.99239122716445 + }, + { + "name": "fp64", + "category": "fp64", + "supported": false, + "weight": 2, + "notes": "benchmark_disabled" + }, + { + "name": "fp8_e4m3", + "category": "fp8", + "supported": true, + "lanes": 16, + "m": 13696, + "n": 13696, + "k": 13696, + "iterations": 171872, + "teraops_per_sec": 245.30921775548188, + "weight": 0.25, + "weighted_teraops_per_sec": 61.32730443887047 + }, + { + "name": "fp8_e5m2", + "category": "fp8", + "supported": false, + "weight": 0.25, + "notes": "unsupported" + }, + { + "name": "int8_tensor", + "category": "int8", + "supported": true, + "lanes": 16, + "m": 10624, + "n": 10624, + "k": 10624, + "iterations": 171872, + "teraops_per_sec": 114.4977128906934, + "weight": 0.25, + "weighted_teraops_per_sec": 28.62442822267335 + } + ], + "scores": { + "compute_score": 1037.2919872321836, + "synthetic_score": 969.648432452294, + "mixed_score": 225.47851593296554, + "mixed_efficiency": 0.2325363589385877, + "power_sustain_score": 89.28467772061518, + "thermal_sustain_score": 86.41095660179215, + "stability_score": 100, + "thermal_throttle_pct": 0, + "power_cap_throttle_pct": 0, + "temp_headroom_c": 11, + "interconnect_score": 3.93, + "server_quality_score": 92.7086902967222, + "composite_score": 1037.2919872321836 + } + }, + { + "index": 3, + "uuid": "GPU-c88562a9-54cd-c3cf-c3fc-ef6c68ce5228", + "name": "NVIDIA RTX PRO 6000 Blackwell Server Edition", + "bus_id": "00000000:4F:00.0", + "vbios": "98.02.67.00.0A", + "compute_capability": "12.0", + "backend": "cublasLt", + "status": "OK", + "power_limit_w": 600, + "default_power_limit_w": 600, + "max_graphics_clock_mhz": 2430, + "max_memory_clock_mhz": 12481, + "locked_graphics_clock_mhz": 2430, + "locked_memory_clock_mhz": 12481, + "baseline": { + "duration_sec": 32.806791721, + "samples": 12, + "avg_temp_c": 55.25, + "p95_temp_c": 60.45, + "avg_power_w": 91.76166666666667, + "p95_power_w": 96.3165, + "avg_graphics_clock_mhz": 2387.6666666666665, + "p95_graphics_clock_mhz": 2425.6, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 0, + "avg_mem_usage_pct": 0, + "clock_cv_pct": 4.871020012266003, + "power_cv_pct": 3.077204239271844, + "temp_cv_pct": 5.486133779629928, + "clock_drift_pct": 0 + }, + "steady": { + "duration_sec": 5022.123737104, + "samples": 1332, + "avg_temp_c": 78.71846846846847, + "p95_temp_c": 80, + "avg_power_w": 537.4380030030027, + "p95_power_w": 550.7945, + "avg_graphics_clock_mhz": 2422.036036036036, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 97.82357357357357, + "avg_mem_usage_pct": 38.192192192192195, + "clock_cv_pct": 0.02211834097932422, + "power_cv_pct": 12.160060866422937, + "temp_cv_pct": 4.315752968273292, + "clock_drift_pct": 0 + }, + "precision_steady": [ + { + "precision": "int8", + "status": "OK", + "steady": { + "duration_sec": 299.955727617, + "samples": 110, + "avg_temp_c": 76.06363636363636, + "p95_temp_c": 78, + "avg_power_w": 555.6232727272728, + "p95_power_w": 563.6, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 99.15454545454546, + "avg_mem_usage_pct": 39.69090909090909, + "clock_cv_pct": 0, + "power_cv_pct": 8.154725476989757, + "temp_cv_pct": 4.2850023864457, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 964.2542197270119, + "weighted_teraops_per_sec": 241.06355493175298, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + }, + { + "precision": "fp8", + "status": "OK", + "steady": { + "duration_sec": 595.043677476, + "samples": 102, + "avg_temp_c": 76.5, + "p95_temp_c": 78, + "avg_power_w": 525.0604901960785, + "p95_power_w": 563.5895, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 22.470588235294116, + "clock_cv_pct": 0, + "power_cv_pct": 3.2666139442571684, + "temp_cv_pct": 0.9983825043476776, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 923.749016666112, + "weighted_teraops_per_sec": 230.937254166528, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + }, + { + "precision": "fp16", + "status": "OK", + "steady": { + "duration_sec": 899.295761287, + "samples": 101, + "avg_temp_c": 76.70297029702971, + "p95_temp_c": 77, + "avg_power_w": 534.1427722772277, + "p95_power_w": 536.93, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 32.306930693069305, + "clock_cv_pct": 0, + "power_cv_pct": 0.9340100200794131, + "temp_cv_pct": 0.595739293105168, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 486.013459787066, + "weighted_teraops_per_sec": 243.006729893533, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + }, + { + "precision": "fp32", + "status": "OK", + "steady": { + "duration_sec": 1199.663635317, + "samples": 106, + "avg_temp_c": 76.73584905660377, + "p95_temp_c": 77, + "avg_power_w": 529.0425471698114, + "p95_power_w": 537.3275000000001, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 32.301886792452834, + "clock_cv_pct": 0, + "power_cv_pct": 1.5543869990509325, + "temp_cv_pct": 0.5745424856428784, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 254.64089346048, + "weighted_teraops_per_sec": 254.64089346048, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + } + ], + "cooldown": { + "duration_sec": 0, + "samples": 0, + "avg_temp_c": 0, + "p95_temp_c": 0, + "avg_power_w": 0, + "p95_power_w": 0, + "avg_graphics_clock_mhz": 0, + "p95_graphics_clock_mhz": 0, + "avg_memory_clock_mhz": 0, + "p95_memory_clock_mhz": 0, + "avg_usage_pct": 0, + "avg_mem_usage_pct": 0, + "clock_cv_pct": 0, + "power_cv_pct": 0, + "temp_cv_pct": 0, + "clock_drift_pct": 0 + }, + "throttle_counters": { + "sw_power_cap_us": 0, + "sw_thermal_slowdown_us": 0, + "sync_boost_us": 0, + "hw_thermal_slowdown_us": 0, + "hw_power_brake_slowdown_us": 0 + }, + "ecc": { + "corrected": 0, + "uncorrected": 0 + }, + "precision_results": [ + { + "name": "fp16_tensor", + "category": "fp16_bf16", + "supported": true, + "lanes": 16, + "m": 11904, + "n": 11904, + "k": 11904, + "iterations": 171872, + "teraops_per_sec": 161.06878408851458, + "weight": 0.5, + "weighted_teraops_per_sec": 80.53439204425729 + }, + { + "name": "fp32_tf32", + "category": "fp32_tf32", + "supported": true, + "lanes": 16, + "m": 8320, + "n": 8320, + "k": 8320, + "iterations": 171872, + "teraops_per_sec": 54.99239122716445, + "weight": 1, + "weighted_teraops_per_sec": 54.99239122716445 + }, + { + "name": "fp64", + "category": "fp64", + "supported": false, + "weight": 2, + "notes": "benchmark_disabled" + }, + { + "name": "fp8_e4m3", + "category": "fp8", + "supported": true, + "lanes": 16, + "m": 13696, + "n": 13696, + "k": 13696, + "iterations": 171872, + "teraops_per_sec": 245.30921775548188, + "weight": 0.25, + "weighted_teraops_per_sec": 61.32730443887047 + }, + { + "name": "fp8_e5m2", + "category": "fp8", + "supported": false, + "weight": 0.25, + "notes": "unsupported" + }, + { + "name": "int8_tensor", + "category": "int8", + "supported": true, + "lanes": 16, + "m": 10624, + "n": 10624, + "k": 10624, + "iterations": 171872, + "teraops_per_sec": 114.4977128906934, + "weight": 0.25, + "weighted_teraops_per_sec": 28.62442822267335 + } + ], + "scores": { + "compute_score": 1037.2919872321836, + "synthetic_score": 969.648432452294, + "mixed_score": 225.47851593296554, + "mixed_efficiency": 0.2325363589385877, + "power_sustain_score": 89.56769766971703, + "thermal_sustain_score": 87.05274109518012, + "stability_score": 100, + "thermal_throttle_pct": 0, + "power_cap_throttle_pct": 0, + "temp_headroom_c": 10, + "interconnect_score": 3.93, + "server_quality_score": 92.98613162946914, + "composite_score": 1037.2919872321836 + } + }, + { + "index": 4, + "uuid": "GPU-19d64ace-f127-d9a8-1999-ffe37453b930", + "name": "NVIDIA RTX PRO 6000 Blackwell Server Edition", + "bus_id": "00000000:CB:00.0", + "vbios": "98.02.67.00.0A", + "compute_capability": "12.0", + "backend": "cublasLt", + "status": "OK", + "power_limit_w": 600, + "default_power_limit_w": 600, + "max_graphics_clock_mhz": 2430, + "max_memory_clock_mhz": 12481, + "locked_graphics_clock_mhz": 2430, + "locked_memory_clock_mhz": 12481, + "baseline": { + "duration_sec": 32.806791721, + "samples": 12, + "avg_temp_c": 49.25, + "p95_temp_c": 54.45, + "avg_power_w": 88.19500000000001, + "p95_power_w": 92.946, + "avg_graphics_clock_mhz": 2251.4166666666665, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 0, + "avg_mem_usage_pct": 0, + "clock_cv_pct": 25.129107398517608, + "power_cv_pct": 3.0752964109834484, + "temp_cv_pct": 6.154495255320884, + "clock_drift_pct": 0 + }, + "steady": { + "duration_sec": 5022.123737104, + "samples": 1332, + "avg_temp_c": 71.59984984984985, + "p95_temp_c": 73, + "avg_power_w": 521.2297372372374, + "p95_power_w": 537.5545, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 97.89789789789789, + "avg_mem_usage_pct": 38.411411411411414, + "clock_cv_pct": 0, + "power_cv_pct": 12.02449172841293, + "temp_cv_pct": 4.411575244241011, + "clock_drift_pct": 0 + }, + "precision_steady": [ + { + "precision": "int8", + "status": "OK", + "steady": { + "duration_sec": 299.955727617, + "samples": 110, + "avg_temp_c": 69.54545454545455, + "p95_temp_c": 71, + "avg_power_w": 539.6916363636363, + "p95_power_w": 547.6285, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 99.0909090909091, + "avg_mem_usage_pct": 38.64545454545455, + "clock_cv_pct": 0, + "power_cv_pct": 8.700105556509445, + "temp_cv_pct": 5.069469131938643, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 964.2542197270119, + "weighted_teraops_per_sec": 241.06355493175298, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + }, + { + "precision": "fp8", + "status": "OK", + "steady": { + "duration_sec": 595.043677476, + "samples": 102, + "avg_temp_c": 69.92156862745098, + "p95_temp_c": 71, + "avg_power_w": 510.46990196078434, + "p95_power_w": 547.6469999999999, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 99.02941176470588, + "avg_mem_usage_pct": 20.57843137254902, + "clock_cv_pct": 0, + "power_cv_pct": 2.8934964760680644, + "temp_cv_pct": 1.2774023526562361, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 923.749016666112, + "weighted_teraops_per_sec": 230.937254166528, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + }, + { + "precision": "fp16", + "status": "OK", + "steady": { + "duration_sec": 899.295761287, + "samples": 101, + "avg_temp_c": 69.7128712871287, + "p95_temp_c": 70, + "avg_power_w": 517.5977227722769, + "p95_power_w": 521.43, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 99.01980198019803, + "avg_mem_usage_pct": 30.871287128712872, + "clock_cv_pct": 0, + "power_cv_pct": 2.713301714890644, + "temp_cv_pct": 1.501577348675426, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 486.013459787066, + "weighted_teraops_per_sec": 243.006729893533, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + }, + { + "precision": "fp32", + "status": "OK", + "steady": { + "duration_sec": 1199.663635317, + "samples": 106, + "avg_temp_c": 70.17924528301887, + "p95_temp_c": 71, + "avg_power_w": 513.6715094339625, + "p95_power_w": 521.95, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 99.82075471698113, + "avg_mem_usage_pct": 32.0377358490566, + "clock_cv_pct": 0, + "power_cv_pct": 2.458517036581479, + "temp_cv_pct": 0.5805302562626481, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 254.64089346048, + "weighted_teraops_per_sec": 254.64089346048, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + } + ], + "cooldown": { + "duration_sec": 0, + "samples": 0, + "avg_temp_c": 0, + "p95_temp_c": 0, + "avg_power_w": 0, + "p95_power_w": 0, + "avg_graphics_clock_mhz": 0, + "p95_graphics_clock_mhz": 0, + "avg_memory_clock_mhz": 0, + "p95_memory_clock_mhz": 0, + "avg_usage_pct": 0, + "avg_mem_usage_pct": 0, + "clock_cv_pct": 0, + "power_cv_pct": 0, + "temp_cv_pct": 0, + "clock_drift_pct": 0 + }, + "throttle_counters": { + "sw_power_cap_us": 0, + "sw_thermal_slowdown_us": 0, + "sync_boost_us": 0, + "hw_thermal_slowdown_us": 0, + "hw_power_brake_slowdown_us": 0 + }, + "ecc": { + "corrected": 0, + "uncorrected": 0 + }, + "precision_results": [ + { + "name": "fp16_tensor", + "category": "fp16_bf16", + "supported": true, + "lanes": 16, + "m": 11904, + "n": 11904, + "k": 11904, + "iterations": 171872, + "teraops_per_sec": 161.06878408851458, + "weight": 0.5, + "weighted_teraops_per_sec": 80.53439204425729 + }, + { + "name": "fp32_tf32", + "category": "fp32_tf32", + "supported": true, + "lanes": 16, + "m": 8320, + "n": 8320, + "k": 8320, + "iterations": 171872, + "teraops_per_sec": 54.99239122716445, + "weight": 1, + "weighted_teraops_per_sec": 54.99239122716445 + }, + { + "name": "fp64", + "category": "fp64", + "supported": false, + "weight": 2, + "notes": "benchmark_disabled" + }, + { + "name": "fp8_e4m3", + "category": "fp8", + "supported": true, + "lanes": 16, + "m": 13696, + "n": 13696, + "k": 13696, + "iterations": 171872, + "teraops_per_sec": 245.30921775548188, + "weight": 0.25, + "weighted_teraops_per_sec": 61.32730443887047 + }, + { + "name": "fp8_e5m2", + "category": "fp8", + "supported": false, + "weight": 0.25, + "notes": "unsupported" + }, + { + "name": "int8_tensor", + "category": "int8", + "supported": true, + "lanes": 16, + "m": 10624, + "n": 10624, + "k": 10624, + "iterations": 171872, + "teraops_per_sec": 114.4977128906934, + "weight": 0.25, + "weighted_teraops_per_sec": 28.62442822267335 + } + ], + "scores": { + "compute_score": 1037.2919872321836, + "synthetic_score": 969.648432452294, + "mixed_score": 225.47851593296554, + "mixed_efficiency": 0.2325363589385877, + "power_sustain_score": 87.42593441196279, + "thermal_sustain_score": 86.76527426727696, + "stability_score": 100, + "thermal_throttle_pct": 0, + "power_cap_throttle_pct": 0, + "temp_headroom_c": 17, + "interconnect_score": 3.93, + "server_quality_score": 92.25736260377192, + "composite_score": 1037.2919872321836 + } + }, + { + "index": 5, + "uuid": "GPU-8d5d3b52-6221-c572-e4dc-3eb34699d5a4", + "name": "NVIDIA RTX PRO 6000 Blackwell Server Edition", + "bus_id": "00000000:CC:00.0", + "vbios": "98.02.67.00.0A", + "compute_capability": "12.0", + "backend": "cublasLt", + "status": "OK", + "power_limit_w": 600, + "default_power_limit_w": 600, + "max_graphics_clock_mhz": 2430, + "max_memory_clock_mhz": 12481, + "locked_graphics_clock_mhz": 2430, + "locked_memory_clock_mhz": 12481, + "baseline": { + "duration_sec": 32.806791721, + "samples": 12, + "avg_temp_c": 51.5, + "p95_temp_c": 56, + "avg_power_w": 87.92083333333333, + "p95_power_w": 93.9665, + "avg_graphics_clock_mhz": 2235.1666666666665, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 0, + "avg_mem_usage_pct": 0, + "clock_cv_pct": 27.7230362388219, + "power_cv_pct": 10.628533224332415, + "temp_cv_pct": 5.405596468767011, + "clock_drift_pct": 0 + }, + "steady": { + "duration_sec": 5022.123737104, + "samples": 1332, + "avg_temp_c": 74.99474474474475, + "p95_temp_c": 77, + "avg_power_w": 532.445728228228, + "p95_power_w": 545.8745, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 97.89789789789789, + "avg_mem_usage_pct": 37.426426426426424, + "clock_cv_pct": 0, + "power_cv_pct": 12.113961662380559, + "temp_cv_pct": 4.385948835435435, + "clock_drift_pct": 0 + }, + "precision_steady": [ + { + "precision": "int8", + "status": "OK", + "steady": { + "duration_sec": 299.955727617, + "samples": 110, + "avg_temp_c": 72.83636363636364, + "p95_temp_c": 74, + "avg_power_w": 550.0222727272728, + "p95_power_w": 558.99, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 99.0909090909091, + "avg_mem_usage_pct": 36.663636363636364, + "clock_cv_pct": 0, + "power_cv_pct": 8.827574018955248, + "temp_cv_pct": 4.931226450270902, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 964.2542197270119, + "weighted_teraops_per_sec": 241.06355493175298, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + }, + { + "precision": "fp8", + "status": "OK", + "steady": { + "duration_sec": 595.043677476, + "samples": 102, + "avg_temp_c": 72.63725490196079, + "p95_temp_c": 74, + "avg_power_w": 520.3696078431373, + "p95_power_w": 559.09, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 99.01960784313725, + "avg_mem_usage_pct": 20.245098039215687, + "clock_cv_pct": 0, + "power_cv_pct": 3.096302725917197, + "temp_cv_pct": 1.4527417716932058, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 923.749016666112, + "weighted_teraops_per_sec": 230.937254166528, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + }, + { + "precision": "fp16", + "status": "OK", + "steady": { + "duration_sec": 899.295761287, + "samples": 101, + "avg_temp_c": 72.61386138613861, + "p95_temp_c": 73, + "avg_power_w": 523.2740594059408, + "p95_power_w": 527.09, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 99.05940594059406, + "avg_mem_usage_pct": 29.168316831683168, + "clock_cv_pct": 0, + "power_cv_pct": 3.942122660305547, + "temp_cv_pct": 0.9083490019059991, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 486.013459787066, + "weighted_teraops_per_sec": 243.006729893533, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + }, + { + "precision": "fp32", + "status": "OK", + "steady": { + "duration_sec": 1199.663635317, + "samples": 106, + "avg_temp_c": 72.40566037735849, + "p95_temp_c": 73.75, + "avg_power_w": 519.8893396226415, + "p95_power_w": 532.225, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 30.264150943396228, + "clock_cv_pct": 0, + "power_cv_pct": 2.394313842638043, + "temp_cv_pct": 0.8220868562526311, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 254.64089346048, + "weighted_teraops_per_sec": 254.64089346048, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + } + ], + "cooldown": { + "duration_sec": 0, + "samples": 0, + "avg_temp_c": 0, + "p95_temp_c": 0, + "avg_power_w": 0, + "p95_power_w": 0, + "avg_graphics_clock_mhz": 0, + "p95_graphics_clock_mhz": 0, + "avg_memory_clock_mhz": 0, + "p95_memory_clock_mhz": 0, + "avg_usage_pct": 0, + "avg_mem_usage_pct": 0, + "clock_cv_pct": 0, + "power_cv_pct": 0, + "temp_cv_pct": 0, + "clock_drift_pct": 0 + }, + "throttle_counters": { + "sw_power_cap_us": 0, + "sw_thermal_slowdown_us": 0, + "sync_boost_us": 0, + "hw_thermal_slowdown_us": 0, + "hw_power_brake_slowdown_us": 0 + }, + "ecc": { + "corrected": 0, + "uncorrected": 0 + }, + "precision_results": [ + { + "name": "fp16_tensor", + "category": "fp16_bf16", + "supported": true, + "lanes": 16, + "m": 11904, + "n": 11904, + "k": 11904, + "iterations": 171872, + "teraops_per_sec": 161.06878408851458, + "weight": 0.5, + "weighted_teraops_per_sec": 80.53439204425729 + }, + { + "name": "fp32_tf32", + "category": "fp32_tf32", + "supported": true, + "lanes": 16, + "m": 8320, + "n": 8320, + "k": 8320, + "iterations": 171872, + "teraops_per_sec": 54.99239122716445, + "weight": 1, + "weighted_teraops_per_sec": 54.99239122716445 + }, + { + "name": "fp64", + "category": "fp64", + "supported": false, + "weight": 2, + "notes": "benchmark_disabled" + }, + { + "name": "fp8_e4m3", + "category": "fp8", + "supported": true, + "lanes": 16, + "m": 13696, + "n": 13696, + "k": 13696, + "iterations": 171872, + "teraops_per_sec": 245.30921775548188, + "weight": 0.25, + "weighted_teraops_per_sec": 61.32730443887047 + }, + { + "name": "fp8_e5m2", + "category": "fp8", + "supported": false, + "weight": 0.25, + "notes": "unsupported" + }, + { + "name": "int8_tensor", + "category": "int8", + "supported": true, + "lanes": 16, + "m": 10624, + "n": 10624, + "k": 10624, + "iterations": 171872, + "teraops_per_sec": 114.4977128906934, + "weight": 0.25, + "weighted_teraops_per_sec": 28.62442822267335 + } + ], + "scores": { + "compute_score": 1037.2919872321836, + "synthetic_score": 969.648432452294, + "mixed_score": 225.47851593296554, + "mixed_efficiency": 0.2325363589385877, + "power_sustain_score": 86.30476506413797, + "thermal_sustain_score": 86.8421534936937, + "stability_score": 100, + "thermal_throttle_pct": 0, + "power_cap_throttle_pct": 0, + "temp_headroom_c": 13, + "interconnect_score": 3.93, + "server_quality_score": 91.94407556734949, + "composite_score": 1037.2919872321836 + } + }, + { + "index": 6, + "uuid": "GPU-a23c67ec-a8e2-7ebf-2593-79d73ec889a6", + "name": "NVIDIA RTX PRO 6000 Blackwell Server Edition", + "bus_id": "00000000:CE:00.0", + "vbios": "98.02.67.00.0A", + "compute_capability": "12.0", + "backend": "cublasLt", + "status": "OK", + "power_limit_w": 600, + "default_power_limit_w": 600, + "max_graphics_clock_mhz": 2430, + "max_memory_clock_mhz": 12481, + "locked_graphics_clock_mhz": 2430, + "locked_memory_clock_mhz": 12481, + "baseline": { + "duration_sec": 32.806791721, + "samples": 12, + "avg_temp_c": 50.166666666666664, + "p95_temp_c": 55, + "avg_power_w": 87.04916666666666, + "p95_power_w": 92.6705, + "avg_graphics_clock_mhz": 2235.1666666666665, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 0, + "avg_mem_usage_pct": 0, + "clock_cv_pct": 27.7230362388219, + "power_cv_pct": 10.974022263135334, + "temp_cv_pct": 5.744723078335742, + "clock_drift_pct": 0 + }, + "steady": { + "duration_sec": 5022.123737104, + "samples": 1332, + "avg_temp_c": 73.87912912912913, + "p95_temp_c": 75, + "avg_power_w": 524.4442042042043, + "p95_power_w": 537.1345, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 97.89789789789789, + "avg_mem_usage_pct": 37.33483483483484, + "clock_cv_pct": 0, + "power_cv_pct": 11.997793150952644, + "temp_cv_pct": 4.4144168481136665, + "clock_drift_pct": 0 + }, + "precision_steady": [ + { + "precision": "int8", + "status": "OK", + "steady": { + "duration_sec": 299.955727617, + "samples": 110, + "avg_temp_c": 71.4, + "p95_temp_c": 73, + "avg_power_w": 540.5936363636365, + "p95_power_w": 550.4209999999999, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 99.0909090909091, + "avg_mem_usage_pct": 37.654545454545456, + "clock_cv_pct": 0, + "power_cv_pct": 9.893728063691723, + "temp_cv_pct": 5.196677264199914, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 964.2542197270119, + "weighted_teraops_per_sec": 241.06355493175298, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + }, + { + "precision": "fp8", + "status": "OK", + "steady": { + "duration_sec": 595.043677476, + "samples": 102, + "avg_temp_c": 71.65686274509804, + "p95_temp_c": 73, + "avg_power_w": 512.805294117647, + "p95_power_w": 550.3190000000001, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 99.13725490196079, + "avg_mem_usage_pct": 19.627450980392158, + "clock_cv_pct": 0, + "power_cv_pct": 2.6387072677899797, + "temp_cv_pct": 1.1477196405131047, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 923.749016666112, + "weighted_teraops_per_sec": 230.937254166528, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + }, + { + "precision": "fp16", + "status": "OK", + "steady": { + "duration_sec": 899.295761287, + "samples": 101, + "avg_temp_c": 71.68316831683168, + "p95_temp_c": 72, + "avg_power_w": 519.6885148514851, + "p95_power_w": 523.86, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 99.01980198019803, + "avg_mem_usage_pct": 31.257425742574256, + "clock_cv_pct": 0, + "power_cv_pct": 3.3986039822332033, + "temp_cv_pct": 1.4941406474052255, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 486.013459787066, + "weighted_teraops_per_sec": 243.006729893533, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + }, + { + "precision": "fp32", + "status": "OK", + "steady": { + "duration_sec": 1199.663635317, + "samples": 106, + "avg_temp_c": 72.18867924528301, + "p95_temp_c": 73, + "avg_power_w": 515.4096226415096, + "p95_power_w": 524.22, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 32.31132075471698, + "clock_cv_pct": 0, + "power_cv_pct": 2.3956437128552244, + "temp_cv_pct": 0.5419874896321945, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 254.64089346048, + "weighted_teraops_per_sec": 254.64089346048, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + } + ], + "cooldown": { + "duration_sec": 0, + "samples": 0, + "avg_temp_c": 0, + "p95_temp_c": 0, + "avg_power_w": 0, + "p95_power_w": 0, + "avg_graphics_clock_mhz": 0, + "p95_graphics_clock_mhz": 0, + "avg_memory_clock_mhz": 0, + "p95_memory_clock_mhz": 0, + "avg_usage_pct": 0, + "avg_mem_usage_pct": 0, + "clock_cv_pct": 0, + "power_cv_pct": 0, + "temp_cv_pct": 0, + "clock_drift_pct": 0 + }, + "throttle_counters": { + "sw_power_cap_us": 0, + "sw_thermal_slowdown_us": 0, + "sync_boost_us": 0, + "hw_thermal_slowdown_us": 0, + "hw_power_brake_slowdown_us": 0 + }, + "ecc": { + "corrected": 0, + "uncorrected": 0 + }, + "precision_results": [ + { + "name": "fp16_tensor", + "category": "fp16_bf16", + "supported": true, + "lanes": 16, + "m": 11904, + "n": 11904, + "k": 11904, + "iterations": 171872, + "teraops_per_sec": 161.06878408851458, + "weight": 0.5, + "weighted_teraops_per_sec": 80.53439204425729 + }, + { + "name": "fp32_tf32", + "category": "fp32_tf32", + "supported": true, + "lanes": 16, + "m": 8320, + "n": 8320, + "k": 8320, + "iterations": 171872, + "teraops_per_sec": 54.99239122716445, + "weight": 1, + "weighted_teraops_per_sec": 54.99239122716445 + }, + { + "name": "fp64", + "category": "fp64", + "supported": false, + "weight": 2, + "notes": "benchmark_disabled" + }, + { + "name": "fp8_e4m3", + "category": "fp8", + "supported": true, + "lanes": 16, + "m": 13696, + "n": 13696, + "k": 13696, + "iterations": 171872, + "teraops_per_sec": 245.30921775548188, + "weight": 0.25, + "weighted_teraops_per_sec": 61.32730443887047 + }, + { + "name": "fp8_e5m2", + "category": "fp8", + "supported": false, + "weight": 0.25, + "notes": "unsupported" + }, + { + "name": "int8_tensor", + "category": "int8", + "supported": true, + "lanes": 16, + "m": 10624, + "n": 10624, + "k": 10624, + "iterations": 171872, + "teraops_per_sec": 114.4977128906934, + "weight": 0.25, + "weighted_teraops_per_sec": 28.62442822267335 + } + ], + "scores": { + "compute_score": 1037.2919872321836, + "synthetic_score": 969.648432452294, + "mixed_score": 225.47851593296554, + "mixed_efficiency": 0.2325363589385877, + "power_sustain_score": 86.2549877300724, + "thermal_sustain_score": 86.756749455659, + "stability_score": 100, + "thermal_throttle_pct": 0, + "power_cap_throttle_pct": 0, + "temp_headroom_c": 15, + "interconnect_score": 3.93, + "server_quality_score": 91.90352115571943, + "composite_score": 1037.2919872321836 + } + }, + { + "index": 7, + "uuid": "GPU-f9d537b7-86a1-407c-c137-3bc30fb8c2e8", + "name": "NVIDIA RTX PRO 6000 Blackwell Server Edition", + "bus_id": "00000000:CF:00.0", + "vbios": "98.02.67.00.0A", + "compute_capability": "12.0", + "backend": "cublasLt", + "status": "OK", + "power_limit_w": 600, + "default_power_limit_w": 600, + "max_graphics_clock_mhz": 2430, + "max_memory_clock_mhz": 12481, + "locked_graphics_clock_mhz": 2430, + "locked_memory_clock_mhz": 12481, + "baseline": { + "duration_sec": 32.806791721, + "samples": 12, + "avg_temp_c": 52.75, + "p95_temp_c": 57.45, + "avg_power_w": 85.78916666666669, + "p95_power_w": 91.6235, + "avg_graphics_clock_mhz": 2235.1666666666665, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 0, + "avg_mem_usage_pct": 0, + "clock_cv_pct": 27.7230362388219, + "power_cv_pct": 11.012861736062202, + "temp_cv_pct": 5.798025056398915, + "clock_drift_pct": 0 + }, + "steady": { + "duration_sec": 5022.123737104, + "samples": 1332, + "avg_temp_c": 75.240990990991, + "p95_temp_c": 77, + "avg_power_w": 523.2648123123122, + "p95_power_w": 535.837, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 97.89864864864865, + "avg_mem_usage_pct": 37.78903903903904, + "clock_cv_pct": 0, + "power_cv_pct": 11.96592275643285, + "temp_cv_pct": 4.2445676715616525, + "clock_drift_pct": 0 + }, + "precision_steady": [ + { + "precision": "int8", + "status": "OK", + "steady": { + "duration_sec": 299.955727617, + "samples": 110, + "avg_temp_c": 72.89090909090909, + "p95_temp_c": 74, + "avg_power_w": 541.5777272727274, + "p95_power_w": 550.811, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 99.0909090909091, + "avg_mem_usage_pct": 38.64545454545455, + "clock_cv_pct": 0, + "power_cv_pct": 9.663326516087173, + "temp_cv_pct": 4.825141260946495, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 964.2542197270119, + "weighted_teraops_per_sec": 241.06355493175298, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + }, + { + "precision": "fp8", + "status": "OK", + "steady": { + "duration_sec": 595.043677476, + "samples": 102, + "avg_temp_c": 73.19607843137256, + "p95_temp_c": 74, + "avg_power_w": 513.094019607843, + "p95_power_w": 550.6795, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 20.96078431372549, + "clock_cv_pct": 0, + "power_cv_pct": 2.2994098585183447, + "temp_cv_pct": 1.0309071205407918, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 923.749016666112, + "weighted_teraops_per_sec": 230.937254166528, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + }, + { + "precision": "fp16", + "status": "OK", + "steady": { + "duration_sec": 899.295761287, + "samples": 101, + "avg_temp_c": 73.14851485148515, + "p95_temp_c": 74, + "avg_power_w": 518.9522772277228, + "p95_power_w": 523.14, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 99.00990099009901, + "avg_mem_usage_pct": 30.871287128712872, + "clock_cv_pct": 0, + "power_cv_pct": 3.3452561869951416, + "temp_cv_pct": 1.5791889026567636, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 486.013459787066, + "weighted_teraops_per_sec": 243.006729893533, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + }, + { + "precision": "fp32", + "status": "OK", + "steady": { + "duration_sec": 1199.663635317, + "samples": 106, + "avg_temp_c": 73.18867924528301, + "p95_temp_c": 74, + "avg_power_w": 515.0624528301889, + "p95_power_w": 523.3875, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 99.62264150943396, + "avg_mem_usage_pct": 31.82075471698113, + "clock_cv_pct": 0, + "power_cv_pct": 2.2402126796462625, + "temp_cv_pct": 0.5345821436794989, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 254.64089346048, + "weighted_teraops_per_sec": 254.64089346048, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + } + ], + "cooldown": { + "duration_sec": 0, + "samples": 0, + "avg_temp_c": 0, + "p95_temp_c": 0, + "avg_power_w": 0, + "p95_power_w": 0, + "avg_graphics_clock_mhz": 0, + "p95_graphics_clock_mhz": 0, + "avg_memory_clock_mhz": 0, + "p95_memory_clock_mhz": 0, + "avg_usage_pct": 0, + "avg_mem_usage_pct": 0, + "clock_cv_pct": 0, + "power_cv_pct": 0, + "temp_cv_pct": 0, + "clock_drift_pct": 0 + }, + "throttle_counters": { + "sw_power_cap_us": 0, + "sw_thermal_slowdown_us": 0, + "sync_boost_us": 0, + "hw_thermal_slowdown_us": 0, + "hw_power_brake_slowdown_us": 0 + }, + "ecc": { + "corrected": 0, + "uncorrected": 0 + }, + "precision_results": [ + { + "name": "fp16_tensor", + "category": "fp16_bf16", + "supported": true, + "lanes": 16, + "m": 11904, + "n": 11904, + "k": 11904, + "iterations": 171872, + "teraops_per_sec": 161.06878408851458, + "weight": 0.5, + "weighted_teraops_per_sec": 80.53439204425729 + }, + { + "name": "fp32_tf32", + "category": "fp32_tf32", + "supported": true, + "lanes": 16, + "m": 8320, + "n": 8320, + "k": 8320, + "iterations": 171872, + "teraops_per_sec": 54.99239122716445, + "weight": 1, + "weighted_teraops_per_sec": 54.99239122716445 + }, + { + "name": "fp64", + "category": "fp64", + "supported": false, + "weight": 2, + "notes": "benchmark_disabled" + }, + { + "name": "fp8_e4m3", + "category": "fp8", + "supported": true, + "lanes": 16, + "m": 13696, + "n": 13696, + "k": 13696, + "iterations": 171872, + "teraops_per_sec": 245.30921775548188, + "weight": 0.25, + "weighted_teraops_per_sec": 61.32730443887047 + }, + { + "name": "fp8_e5m2", + "category": "fp8", + "supported": false, + "weight": 0.25, + "notes": "unsupported" + }, + { + "name": "int8_tensor", + "category": "int8", + "supported": true, + "lanes": 16, + "m": 10624, + "n": 10624, + "k": 10624, + "iterations": 171872, + "teraops_per_sec": 114.4977128906934, + "weight": 0.25, + "weighted_teraops_per_sec": 28.62442822267335 + } + ], + "scores": { + "compute_score": 1037.2919872321836, + "synthetic_score": 969.648432452294, + "mixed_score": 225.47851593296554, + "mixed_efficiency": 0.2325363589385877, + "power_sustain_score": 86.83884606906481, + "thermal_sustain_score": 87.26629698531504, + "stability_score": 100, + "thermal_throttle_pct": 0, + "power_cap_throttle_pct": 0, + "temp_headroom_c": 13, + "interconnect_score": 3.93, + "server_quality_score": 92.23154291631396, + "composite_score": 1037.2919872321836 + } + } + ], + "interconnect": { + "status": "OK", + "attempted": true, + "supported": true, + "selected_gpu_indices": [ + 0, + 1, + 2, + 3, + 4, + 5, + 6, + 7 + ], + "avg_algbw_gbps": 2.2075, + "max_algbw_gbps": 2.24, + "avg_busbw_gbps": 3.8674999999999997, + "max_busbw_gbps": 3.93 + }, + "server_power": { + "available": false, + "notes": [ + "IPMI power reading unavailable; server-side power characterization skipped" + ] + } +} \ No newline at end of file diff --git a/perf/perf-20260417-050338/result.json b/perf/perf-20260417-050338/result.json new file mode 100644 index 0000000..79abd58 --- /dev/null +++ b/perf/perf-20260417-050338/result.json @@ -0,0 +1,2376 @@ +{ + "benchmark_version": "2", + "generated_at": "2026-04-17T05:03:38.379616546Z", + "hostname": "debian", + "server_model": "G5500 V7", + "benchmark_profile": "standard", + "parallel_gpus": true, + "overall_status": "OK", + "selected_gpu_indices": [ + 0, + 1, + 2, + 3, + 4, + 5, + 6, + 7 + ], + "findings": [ + "All 8 GPU(s) passed the benchmark.", + "GPU 0 held clocks without observable throttle counters during steady state.", + "GPU 1 held clocks without observable throttle counters during steady state.", + "GPU 2 held clocks without observable throttle counters during steady state.", + "GPU 3 held clocks without observable throttle counters during steady state.", + "GPU 4 held clocks without observable throttle counters during steady state.", + "GPU 5 held clocks without observable throttle counters during steady state.", + "GPU 6 held clocks without observable throttle counters during steady state.", + "GPU 7 held clocks without observable throttle counters during steady state.", + "Multi-GPU all_reduce max bus bandwidth: 3.9 GB/s." + ], + "normalization": { + "status": "full", + "gpus": [ + { + "index": 0, + "persistence_mode": "applied", + "gpu_clock_lock_mhz": 2430, + "gpu_clock_lock_status": "applied", + "memory_clock_lock_mhz": 12481, + "memory_clock_lock_status": "applied" + }, + { + "index": 1, + "persistence_mode": "applied", + "gpu_clock_lock_mhz": 2430, + "gpu_clock_lock_status": "applied", + "memory_clock_lock_mhz": 12481, + "memory_clock_lock_status": "applied" + }, + { + "index": 2, + "persistence_mode": "applied", + "gpu_clock_lock_mhz": 2430, + "gpu_clock_lock_status": "applied", + "memory_clock_lock_mhz": 12481, + "memory_clock_lock_status": "applied" + }, + { + "index": 3, + "persistence_mode": "applied", + "gpu_clock_lock_mhz": 2430, + "gpu_clock_lock_status": "applied", + "memory_clock_lock_mhz": 12481, + "memory_clock_lock_status": "applied" + }, + { + "index": 4, + "persistence_mode": "applied", + "gpu_clock_lock_mhz": 2430, + "gpu_clock_lock_status": "applied", + "memory_clock_lock_mhz": 12481, + "memory_clock_lock_status": "applied" + }, + { + "index": 5, + "persistence_mode": "applied", + "gpu_clock_lock_mhz": 2430, + "gpu_clock_lock_status": "applied", + "memory_clock_lock_mhz": 12481, + "memory_clock_lock_status": "applied" + }, + { + "index": 6, + "persistence_mode": "applied", + "gpu_clock_lock_mhz": 2430, + "gpu_clock_lock_status": "applied", + "memory_clock_lock_mhz": 12481, + "memory_clock_lock_status": "applied" + }, + { + "index": 7, + "persistence_mode": "applied", + "gpu_clock_lock_mhz": 2430, + "gpu_clock_lock_status": "applied", + "memory_clock_lock_mhz": 12481, + "memory_clock_lock_status": "applied" + } + ] + }, + "host_config": { + "cpu_model": "INTEL(R) XEON(R) GOLD 6530", + "cpu_sockets": 2, + "cpu_cores": 64, + "cpu_threads": 128, + "mem_total_gib": 125.36545181274414 + }, + "cpu_load": { + "avg_pct": 5, + "max_pct": 8.5, + "p95_pct": 7.1, + "samples": 103, + "status": "ok" + }, + "cooling": { + "available": true, + "avg_fan_rpm": 14379.873670212766, + "fan_duty_cycle_available": true, + "fan_duty_cycle_estimated": true, + "avg_fan_duty_cycle_pct": 84.58749217772139, + "p95_fan_duty_cycle_pct": 97.71507352941177, + "notes": [ + "fan duty cycle is estimated from the highest fan RPM observed since boot; treat it as an approximation, not a direct PWM reading" + ] + }, + "gpus": [ + { + "index": 0, + "uuid": "GPU-8281bc14-c076-e306-75b1-e91596be45e7", + "name": "NVIDIA RTX PRO 6000 Blackwell Server Edition", + "bus_id": "00000000:4B:00.0", + "vbios": "98.02.67.00.0A", + "compute_capability": "12.0", + "backend": "cublasLt", + "status": "OK", + "power_limit_w": 600, + "default_power_limit_w": 600, + "max_graphics_clock_mhz": 2430, + "max_memory_clock_mhz": 12481, + "locked_graphics_clock_mhz": 2430, + "locked_memory_clock_mhz": 12481, + "baseline": { + "duration_sec": 16.34797981, + "samples": 4, + "avg_temp_c": 34.5, + "p95_temp_c": 35, + "avg_power_w": 88.75500000000001, + "p95_power_w": 89.2675, + "avg_graphics_clock_mhz": 2347, + "p95_graphics_clock_mhz": 2347, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 0, + "avg_mem_usage_pct": 0, + "clock_cv_pct": 0, + "power_cv_pct": 0.4334856313043878, + "temp_cv_pct": 1.4492753623188406, + "clock_drift_pct": 0 + }, + "steady": { + "duration_sec": 724.937860289, + "samples": 157, + "avg_temp_c": 66.94267515923566, + "p95_temp_c": 71, + "avg_power_w": 454.7870700636941, + "p95_power_w": 518.786, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 86.62420382165605, + "avg_mem_usage_pct": 31.668789808917197, + "clock_cv_pct": 0, + "power_cv_pct": 31.4196720381678, + "temp_cv_pct": 10.917848750074887, + "clock_drift_pct": 0 + }, + "precision_steady": [ + { + "precision": "int8", + "status": "OK", + "steady": { + "duration_sec": 58.761884737, + "samples": 22, + "avg_temp_c": 71.68181818181819, + "p95_temp_c": 75, + "avg_power_w": 530.340909090909, + "p95_power_w": 554.6435, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 40, + "clock_cv_pct": 0, + "power_cv_pct": 12.222106395916258, + "temp_cv_pct": 6.115516311289504, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 1309.9208810692608, + "weighted_teraops_per_sec": 327.4802202673152, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + }, + { + "precision": "fp8", + "status": "OK", + "steady": { + "duration_sec": 118.249988467, + "samples": 18, + "avg_temp_c": 73.27777777777777, + "p95_temp_c": 74.15, + "avg_power_w": 520.6655555555556, + "p95_power_w": 553.3199999999999, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 28.5, + "clock_cv_pct": 0, + "power_cv_pct": 10.91558637787749, + "temp_cv_pct": 1.0960449048370706, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 923.749016666112, + "weighted_teraops_per_sec": 230.937254166528, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + }, + { + "precision": "fp16", + "status": "OK", + "steady": { + "duration_sec": 178.550102114, + "samples": 20, + "avg_temp_c": 70.65, + "p95_temp_c": 71.05, + "avg_power_w": 502.6, + "p95_power_w": 510.741, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 24.2, + "clock_cv_pct": 0, + "power_cv_pct": 1.7131526966475623, + "temp_cv_pct": 0.8100157920919742, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 607.5168247338326, + "weighted_teraops_per_sec": 303.7584123669163, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + }, + { + "precision": "fp32", + "status": "OK", + "steady": { + "duration_sec": 231.450409797, + "samples": 18, + "avg_temp_c": 70, + "p95_temp_c": 70, + "avg_power_w": 510.66333333333324, + "p95_power_w": 511.046, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 35, + "clock_cv_pct": 0, + "power_cv_pct": 0.04249871294370823, + "temp_cv_pct": 0, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 424.4014891008, + "weighted_teraops_per_sec": 424.4014891008, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + } + ], + "cooldown": { + "duration_sec": 0, + "samples": 0, + "avg_temp_c": 0, + "p95_temp_c": 0, + "avg_power_w": 0, + "p95_power_w": 0, + "avg_graphics_clock_mhz": 0, + "p95_graphics_clock_mhz": 0, + "avg_memory_clock_mhz": 0, + "p95_memory_clock_mhz": 0, + "avg_usage_pct": 0, + "avg_mem_usage_pct": 0, + "clock_cv_pct": 0, + "power_cv_pct": 0, + "temp_cv_pct": 0, + "clock_drift_pct": 0 + }, + "throttle_counters": { + "sw_power_cap_us": 0, + "sw_thermal_slowdown_us": 0, + "sync_boost_us": 0, + "hw_thermal_slowdown_us": 0, + "hw_power_brake_slowdown_us": 0 + }, + "ecc": { + "corrected": 0, + "uncorrected": 0 + }, + "precision_results": [ + { + "name": "fp16_tensor", + "category": "fp16_bf16", + "supported": true, + "lanes": 16, + "m": 11904, + "n": 11904, + "k": 11904, + "iterations": 14672, + "teraops_per_sec": 164.99729101750273, + "weight": 0.5, + "weighted_teraops_per_sec": 82.49864550875137 + }, + { + "name": "fp32_tf32", + "category": "fp32_tf32", + "supported": true, + "lanes": 16, + "m": 8320, + "n": 8320, + "k": 8320, + "iterations": 14672, + "teraops_per_sec": 56.33366906197334, + "weight": 1, + "weighted_teraops_per_sec": 56.33366906197334 + }, + { + "name": "fp64", + "category": "fp64", + "supported": false, + "weight": 2, + "notes": "benchmark_disabled" + }, + { + "name": "fp8_e4m3", + "category": "fp8", + "supported": true, + "lanes": 16, + "m": 13696, + "n": 13696, + "k": 13696, + "iterations": 14672, + "teraops_per_sec": 251.2923694080546, + "weight": 0.25, + "weighted_teraops_per_sec": 62.82309235201365 + }, + { + "name": "fp8_e5m2", + "category": "fp8", + "supported": false, + "weight": 0.25, + "notes": "unsupported" + }, + { + "name": "int8_tensor", + "category": "int8", + "supported": true, + "lanes": 16, + "m": 10624, + "n": 10624, + "k": 10624, + "iterations": 14672, + "teraops_per_sec": 117.29034003436885, + "weight": 0.25, + "weighted_teraops_per_sec": 29.322585008592213 + } + ], + "scores": { + "compute_score": 1355.8707734809586, + "synthetic_score": 1286.5773759015594, + "mixed_score": 230.97799193133056, + "mixed_efficiency": 0.17952903281038537, + "power_sustain_score": 81.32999186246123, + "thermal_sustain_score": 67.24645374977534, + "stability_score": 100, + "thermal_throttle_pct": 0, + "power_cap_throttle_pct": 0, + "temp_headroom_c": 19, + "interconnect_score": 3.91, + "server_quality_score": 84.57293368367097, + "composite_score": 1355.8707734809586 + } + }, + { + "index": 1, + "uuid": "GPU-a66d6d68-9870-dfe0-1823-b38a141c21ae", + "name": "NVIDIA RTX PRO 6000 Blackwell Server Edition", + "bus_id": "00000000:4C:00.0", + "vbios": "98.02.67.00.0A", + "compute_capability": "12.0", + "backend": "cublasLt", + "status": "OK", + "power_limit_w": 600, + "default_power_limit_w": 600, + "max_graphics_clock_mhz": 2430, + "max_memory_clock_mhz": 12481, + "locked_graphics_clock_mhz": 2430, + "locked_memory_clock_mhz": 12481, + "baseline": { + "duration_sec": 16.34797981, + "samples": 4, + "avg_temp_c": 36.5, + "p95_temp_c": 37, + "avg_power_w": 87.58749999999999, + "p95_power_w": 87.871, + "avg_graphics_clock_mhz": 2345.25, + "p95_graphics_clock_mhz": 2347, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 0, + "avg_mem_usage_pct": 0, + "clock_cv_pct": 0.1292437443021228, + "power_cv_pct": 0.359900775821056, + "temp_cv_pct": 1.36986301369863, + "clock_drift_pct": 0 + }, + "steady": { + "duration_sec": 724.937860289, + "samples": 157, + "avg_temp_c": 69.5859872611465, + "p95_temp_c": 73, + "avg_power_w": 463.9425477707005, + "p95_power_w": 530.768, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 86.62420382165605, + "avg_mem_usage_pct": 32.554140127388536, + "clock_cv_pct": 0, + "power_cv_pct": 31.941052135085286, + "temp_cv_pct": 10.728391664011546, + "clock_drift_pct": 0 + }, + "precision_steady": [ + { + "precision": "int8", + "status": "OK", + "steady": { + "duration_sec": 58.761884737, + "samples": 22, + "avg_temp_c": 73.54545454545455, + "p95_temp_c": 77, + "avg_power_w": 535.6372727272727, + "p95_power_w": 555.85, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 38, + "clock_cv_pct": 0, + "power_cv_pct": 11.864664390629041, + "temp_cv_pct": 5.7355291758319815, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 1309.9208810692608, + "weighted_teraops_per_sec": 327.4802202673152, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + }, + { + "precision": "fp8", + "status": "OK", + "steady": { + "duration_sec": 118.249988467, + "samples": 18, + "avg_temp_c": 74.88888888888889, + "p95_temp_c": 76, + "avg_power_w": 523.5305555555556, + "p95_power_w": 554.4409999999999, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 98.72222222222223, + "avg_mem_usage_pct": 27.333333333333332, + "clock_cv_pct": 0, + "power_cv_pct": 9.669860002564418, + "temp_cv_pct": 0.9841616588591694, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 923.749016666112, + "weighted_teraops_per_sec": 230.937254166528, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + }, + { + "precision": "fp16", + "status": "OK", + "steady": { + "duration_sec": 178.550102114, + "samples": 20, + "avg_temp_c": 72.65, + "p95_temp_c": 73.05, + "avg_power_w": 513.4245, + "p95_power_w": 521.882, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 23.4, + "clock_cv_pct": 0, + "power_cv_pct": 1.794579339676941, + "temp_cv_pct": 0.7877166649868959, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 607.5168247338326, + "weighted_teraops_per_sec": 303.7584123669163, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + }, + { + "precision": "fp32", + "status": "OK", + "steady": { + "duration_sec": 231.450409797, + "samples": 18, + "avg_temp_c": 72, + "p95_temp_c": 72, + "avg_power_w": 521.9950000000001, + "p95_power_w": 522.1235, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 33, + "clock_cv_pct": 0, + "power_cv_pct": 0.01945561130736415, + "temp_cv_pct": 0, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 424.4014891008, + "weighted_teraops_per_sec": 424.4014891008, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + } + ], + "cooldown": { + "duration_sec": 0, + "samples": 0, + "avg_temp_c": 0, + "p95_temp_c": 0, + "avg_power_w": 0, + "p95_power_w": 0, + "avg_graphics_clock_mhz": 0, + "p95_graphics_clock_mhz": 0, + "avg_memory_clock_mhz": 0, + "p95_memory_clock_mhz": 0, + "avg_usage_pct": 0, + "avg_mem_usage_pct": 0, + "clock_cv_pct": 0, + "power_cv_pct": 0, + "temp_cv_pct": 0, + "clock_drift_pct": 0 + }, + "throttle_counters": { + "sw_power_cap_us": 0, + "sw_thermal_slowdown_us": 0, + "sync_boost_us": 0, + "hw_thermal_slowdown_us": 0, + "hw_power_brake_slowdown_us": 0 + }, + "ecc": { + "corrected": 0, + "uncorrected": 0 + }, + "precision_results": [ + { + "name": "fp16_tensor", + "category": "fp16_bf16", + "supported": true, + "lanes": 16, + "m": 11904, + "n": 11904, + "k": 11904, + "iterations": 14672, + "teraops_per_sec": 164.99729101750273, + "weight": 0.5, + "weighted_teraops_per_sec": 82.49864550875137 + }, + { + "name": "fp32_tf32", + "category": "fp32_tf32", + "supported": true, + "lanes": 16, + "m": 8320, + "n": 8320, + "k": 8320, + "iterations": 14672, + "teraops_per_sec": 56.33366906197334, + "weight": 1, + "weighted_teraops_per_sec": 56.33366906197334 + }, + { + "name": "fp64", + "category": "fp64", + "supported": false, + "weight": 2, + "notes": "benchmark_disabled" + }, + { + "name": "fp8_e4m3", + "category": "fp8", + "supported": true, + "lanes": 16, + "m": 13696, + "n": 13696, + "k": 13696, + "iterations": 14672, + "teraops_per_sec": 251.2923694080546, + "weight": 0.25, + "weighted_teraops_per_sec": 62.82309235201365 + }, + { + "name": "fp8_e5m2", + "category": "fp8", + "supported": false, + "weight": 0.25, + "notes": "unsupported" + }, + { + "name": "int8_tensor", + "category": "int8", + "supported": true, + "lanes": 16, + "m": 10624, + "n": 10624, + "k": 10624, + "iterations": 14672, + "teraops_per_sec": 117.29034003436885, + "weight": 0.25, + "weighted_teraops_per_sec": 29.322585008592213 + } + ], + "scores": { + "compute_score": 1355.8707734809586, + "synthetic_score": 1286.5773759015594, + "mixed_score": 230.97799193133056, + "mixed_efficiency": 0.17952903281038537, + "power_sustain_score": 82.48858049186668, + "thermal_sustain_score": 67.81482500796537, + "stability_score": 100, + "thermal_throttle_pct": 0, + "power_cap_throttle_pct": 0, + "temp_headroom_c": 17, + "interconnect_score": 3.91, + "server_quality_score": 85.09102164994961, + "composite_score": 1355.8707734809586 + } + }, + { + "index": 2, + "uuid": "GPU-82b32f5b-5fca-9674-a845-cfd5da365d09", + "name": "NVIDIA RTX PRO 6000 Blackwell Server Edition", + "bus_id": "00000000:4E:00.0", + "vbios": "98.02.67.00.0A", + "compute_capability": "12.0", + "backend": "cublasLt", + "status": "OK", + "power_limit_w": 600, + "default_power_limit_w": 600, + "max_graphics_clock_mhz": 2430, + "max_memory_clock_mhz": 12481, + "locked_graphics_clock_mhz": 2430, + "locked_memory_clock_mhz": 12481, + "baseline": { + "duration_sec": 16.34797981, + "samples": 4, + "avg_temp_c": 32.5, + "p95_temp_c": 33, + "avg_power_w": 88.1, + "p95_power_w": 88.352, + "avg_graphics_clock_mhz": 2334, + "p95_graphics_clock_mhz": 2338.8, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 0, + "avg_mem_usage_pct": 0, + "clock_cv_pct": 0.1484190923366647, + "power_cv_pct": 0.2615600141158463, + "temp_cv_pct": 1.5384615384615385, + "clock_drift_pct": 0 + }, + "steady": { + "duration_sec": 724.937860289, + "samples": 157, + "avg_temp_c": 68.78980891719745, + "p95_temp_c": 73, + "avg_power_w": 469.2394904458597, + "p95_power_w": 536.484, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 86.62420382165605, + "avg_mem_usage_pct": 31.43949044585987, + "clock_cv_pct": 0, + "power_cv_pct": 31.66292861432794, + "temp_cv_pct": 11.039460335510705, + "clock_drift_pct": 0 + }, + "precision_steady": [ + { + "precision": "int8", + "status": "OK", + "steady": { + "duration_sec": 58.761884737, + "samples": 22, + "avg_temp_c": 71.5909090909091, + "p95_temp_c": 75, + "avg_power_w": 539.5713636363636, + "p95_power_w": 563.7595, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 37, + "clock_cv_pct": 0, + "power_cv_pct": 13.262409696722704, + "temp_cv_pct": 6.241951229578086, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 1309.9208810692608, + "weighted_teraops_per_sec": 327.4802202673152, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + }, + { + "precision": "fp8", + "status": "OK", + "steady": { + "duration_sec": 118.249988467, + "samples": 18, + "avg_temp_c": 73.83333333333333, + "p95_temp_c": 74.15, + "avg_power_w": 530.9988888888889, + "p95_power_w": 562.8225, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 28.055555555555557, + "clock_cv_pct": 0, + "power_cv_pct": 10.415526227455187, + "temp_cv_pct": 0.6772009029345374, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 923.749016666112, + "weighted_teraops_per_sec": 230.937254166528, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + }, + { + "precision": "fp16", + "status": "OK", + "steady": { + "duration_sec": 178.550102114, + "samples": 20, + "avg_temp_c": 72.25, + "p95_temp_c": 73, + "avg_power_w": 517.3484999999998, + "p95_power_w": 526.722, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 24.25, + "clock_cv_pct": 0, + "power_cv_pct": 4.575214095271455, + "temp_cv_pct": 0.7421318543089003, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 607.5168247338326, + "weighted_teraops_per_sec": 303.7584123669163, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + }, + { + "precision": "fp32", + "status": "OK", + "steady": { + "duration_sec": 231.450409797, + "samples": 18, + "avg_temp_c": 72, + "p95_temp_c": 72, + "avg_power_w": 526.7316666666668, + "p95_power_w": 527.029, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 32, + "clock_cv_pct": 0, + "power_cv_pct": 0.03465159564411575, + "temp_cv_pct": 0, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 424.4014891008, + "weighted_teraops_per_sec": 424.4014891008, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + } + ], + "cooldown": { + "duration_sec": 0, + "samples": 0, + "avg_temp_c": 0, + "p95_temp_c": 0, + "avg_power_w": 0, + "p95_power_w": 0, + "avg_graphics_clock_mhz": 0, + "p95_graphics_clock_mhz": 0, + "avg_memory_clock_mhz": 0, + "p95_memory_clock_mhz": 0, + "avg_usage_pct": 0, + "avg_mem_usage_pct": 0, + "clock_cv_pct": 0, + "power_cv_pct": 0, + "temp_cv_pct": 0, + "clock_drift_pct": 0 + }, + "throttle_counters": { + "sw_power_cap_us": 0, + "sw_thermal_slowdown_us": 0, + "sync_boost_us": 0, + "hw_thermal_slowdown_us": 0, + "hw_power_brake_slowdown_us": 0 + }, + "ecc": { + "corrected": 0, + "uncorrected": 0 + }, + "precision_results": [ + { + "name": "fp16_tensor", + "category": "fp16_bf16", + "supported": true, + "lanes": 16, + "m": 11904, + "n": 11904, + "k": 11904, + "iterations": 14672, + "teraops_per_sec": 164.99729101750273, + "weight": 0.5, + "weighted_teraops_per_sec": 82.49864550875137 + }, + { + "name": "fp32_tf32", + "category": "fp32_tf32", + "supported": true, + "lanes": 16, + "m": 8320, + "n": 8320, + "k": 8320, + "iterations": 14672, + "teraops_per_sec": 56.33366906197334, + "weight": 1, + "weighted_teraops_per_sec": 56.33366906197334 + }, + { + "name": "fp64", + "category": "fp64", + "supported": false, + "weight": 2, + "notes": "benchmark_disabled" + }, + { + "name": "fp8_e4m3", + "category": "fp8", + "supported": true, + "lanes": 16, + "m": 13696, + "n": 13696, + "k": 13696, + "iterations": 14672, + "teraops_per_sec": 251.2923694080546, + "weight": 0.25, + "weighted_teraops_per_sec": 62.82309235201365 + }, + { + "name": "fp8_e5m2", + "category": "fp8", + "supported": false, + "weight": 0.25, + "notes": "unsupported" + }, + { + "name": "int8_tensor", + "category": "int8", + "supported": true, + "lanes": 16, + "m": 10624, + "n": 10624, + "k": 10624, + "iterations": 14672, + "teraops_per_sec": 117.29034003436885, + "weight": 0.25, + "weighted_teraops_per_sec": 29.322585008592213 + } + ], + "scores": { + "compute_score": 1355.8707734809586, + "synthetic_score": 1286.5773759015594, + "mixed_score": 230.97799193133056, + "mixed_efficiency": 0.17952903281038537, + "power_sustain_score": 78.7841487886799, + "thermal_sustain_score": 66.88161899346788, + "stability_score": 100, + "thermal_throttle_pct": 0, + "power_cap_throttle_pct": 0, + "temp_headroom_c": 17, + "interconnect_score": 3.91, + "server_quality_score": 83.69973033464434, + "composite_score": 1355.8707734809586 + } + }, + { + "index": 3, + "uuid": "GPU-c88562a9-54cd-c3cf-c3fc-ef6c68ce5228", + "name": "NVIDIA RTX PRO 6000 Blackwell Server Edition", + "bus_id": "00000000:4F:00.0", + "vbios": "98.02.67.00.0A", + "compute_capability": "12.0", + "backend": "cublasLt", + "status": "OK", + "power_limit_w": 600, + "default_power_limit_w": 600, + "max_graphics_clock_mhz": 2430, + "max_memory_clock_mhz": 12481, + "locked_graphics_clock_mhz": 2430, + "locked_memory_clock_mhz": 12481, + "baseline": { + "duration_sec": 16.34797981, + "samples": 4, + "avg_temp_c": 35, + "p95_temp_c": 35.85, + "avg_power_w": 86.56500000000001, + "p95_power_w": 86.99350000000001, + "avg_graphics_clock_mhz": 1813, + "p95_graphics_clock_mhz": 2360.95, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 0, + "avg_mem_usage_pct": 0, + "clock_cv_pct": 52.00316164300109, + "power_cv_pct": 0.43901449005163734, + "temp_cv_pct": 2.0203050891044216, + "clock_drift_pct": 0 + }, + "steady": { + "duration_sec": 724.937860289, + "samples": 157, + "avg_temp_c": 70.03821656050955, + "p95_temp_c": 74, + "avg_power_w": 468.4479617834392, + "p95_power_w": 537.146, + "avg_graphics_clock_mhz": 2422.1528662420383, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 86, + "avg_mem_usage_pct": 32.18471337579618, + "clock_cv_pct": 0.04521783592046804, + "power_cv_pct": 31.741409651015406, + "temp_cv_pct": 10.54748733348162, + "clock_drift_pct": 0 + }, + "precision_steady": [ + { + "precision": "int8", + "status": "OK", + "steady": { + "duration_sec": 58.761884737, + "samples": 22, + "avg_temp_c": 72.95454545454545, + "p95_temp_c": 77, + "avg_power_w": 532.5427272727273, + "p95_power_w": 561.8395, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 95.45454545454545, + "avg_mem_usage_pct": 36.27272727272727, + "clock_cv_pct": 0, + "power_cv_pct": 18.061098204102745, + "temp_cv_pct": 7.868495345992694, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 1309.5066113409025, + "weighted_teraops_per_sec": 327.3766528352256, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + }, + { + "precision": "fp8", + "status": "OK", + "steady": { + "duration_sec": 118.249988467, + "samples": 18, + "avg_temp_c": 74.66666666666667, + "p95_temp_c": 76, + "avg_power_w": 530.8477777777778, + "p95_power_w": 559.989, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 94.77777777777777, + "avg_mem_usage_pct": 27.22222222222222, + "clock_cv_pct": 0, + "power_cv_pct": 7.065475539013241, + "temp_cv_pct": 2.893187811789224, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 923.749016666112, + "weighted_teraops_per_sec": 230.937254166528, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + }, + { + "precision": "fp16", + "status": "OK", + "steady": { + "duration_sec": 178.550102114, + "samples": 20, + "avg_temp_c": 73.3, + "p95_temp_c": 74, + "avg_power_w": 515.2235000000002, + "p95_power_w": 523.9745, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 24, + "clock_cv_pct": 0, + "power_cv_pct": 3.7323488639278786, + "temp_cv_pct": 0.7595858612319264, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 607.5168247338326, + "weighted_teraops_per_sec": 303.7584123669163, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + }, + { + "precision": "fp32", + "status": "OK", + "steady": { + "duration_sec": 231.450409797, + "samples": 18, + "avg_temp_c": 73, + "p95_temp_c": 73, + "avg_power_w": 523.8044444444445, + "p95_power_w": 523.965, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 33, + "clock_cv_pct": 0, + "power_cv_pct": 0.019220287961704326, + "temp_cv_pct": 0, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 424.4014891008, + "weighted_teraops_per_sec": 424.4014891008, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + } + ], + "cooldown": { + "duration_sec": 0, + "samples": 0, + "avg_temp_c": 0, + "p95_temp_c": 0, + "avg_power_w": 0, + "p95_power_w": 0, + "avg_graphics_clock_mhz": 0, + "p95_graphics_clock_mhz": 0, + "avg_memory_clock_mhz": 0, + "p95_memory_clock_mhz": 0, + "avg_usage_pct": 0, + "avg_mem_usage_pct": 0, + "clock_cv_pct": 0, + "power_cv_pct": 0, + "temp_cv_pct": 0, + "clock_drift_pct": 0 + }, + "throttle_counters": { + "sw_power_cap_us": 0, + "sw_thermal_slowdown_us": 0, + "sync_boost_us": 0, + "hw_thermal_slowdown_us": 0, + "hw_power_brake_slowdown_us": 0 + }, + "ecc": { + "corrected": 0, + "uncorrected": 0 + }, + "precision_results": [ + { + "name": "fp16_tensor", + "category": "fp16_bf16", + "supported": true, + "lanes": 16, + "m": 11904, + "n": 11904, + "k": 11904, + "iterations": 14672, + "teraops_per_sec": 164.99729101750273, + "weight": 0.5, + "weighted_teraops_per_sec": 82.49864550875137 + }, + { + "name": "fp32_tf32", + "category": "fp32_tf32", + "supported": true, + "lanes": 16, + "m": 8320, + "n": 8320, + "k": 8320, + "iterations": 14672, + "teraops_per_sec": 56.33366906197334, + "weight": 1, + "weighted_teraops_per_sec": 56.33366906197334 + }, + { + "name": "fp64", + "category": "fp64", + "supported": false, + "weight": 2, + "notes": "benchmark_disabled" + }, + { + "name": "fp8_e4m3", + "category": "fp8", + "supported": true, + "lanes": 16, + "m": 13696, + "n": 13696, + "k": 13696, + "iterations": 14672, + "teraops_per_sec": 251.2923694080546, + "weight": 0.25, + "weighted_teraops_per_sec": 62.82309235201365 + }, + { + "name": "fp8_e5m2", + "category": "fp8", + "supported": false, + "weight": 0.25, + "notes": "unsupported" + }, + { + "name": "int8_tensor", + "category": "int8", + "supported": true, + "lanes": 16, + "m": 10624, + "n": 10624, + "k": 10624, + "iterations": 14672, + "teraops_per_sec": 117.29034003436885, + "weight": 0.25, + "weighted_teraops_per_sec": 29.322585008592213 + } + ], + "scores": { + "compute_score": 1355.767206048869, + "synthetic_score": 1286.47380846947, + "mixed_score": 230.97799193133056, + "mixed_efficiency": 0.17954348577537482, + "power_sustain_score": 78.34139282874582, + "thermal_sustain_score": 68.35753799955515, + "stability_score": 100, + "thermal_throttle_pct": 0, + "power_cap_throttle_pct": 0, + "temp_headroom_c": 16, + "interconnect_score": 3.91, + "server_quality_score": 84.0096792484903, + "composite_score": 1355.767206048869 + } + }, + { + "index": 4, + "uuid": "GPU-19d64ace-f127-d9a8-1999-ffe37453b930", + "name": "NVIDIA RTX PRO 6000 Blackwell Server Edition", + "bus_id": "00000000:CB:00.0", + "vbios": "98.02.67.00.0A", + "compute_capability": "12.0", + "backend": "cublasLt", + "status": "OK", + "power_limit_w": 600, + "default_power_limit_w": 600, + "max_graphics_clock_mhz": 2430, + "max_memory_clock_mhz": 12481, + "locked_graphics_clock_mhz": 2430, + "locked_memory_clock_mhz": 12481, + "baseline": { + "duration_sec": 16.34797981, + "samples": 4, + "avg_temp_c": 32.25, + "p95_temp_c": 33, + "avg_power_w": 72.1925, + "p95_power_w": 85.2065, + "avg_graphics_clock_mhz": 1800, + "p95_graphics_clock_mhz": 2340, + "avg_memory_clock_mhz": 9462, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 0, + "avg_mem_usage_pct": 0, + "clock_cv_pct": 51.96152422706633, + "power_cv_pct": 30.156655216791332, + "temp_cv_pct": 2.5710269692677516, + "clock_drift_pct": 0 + }, + "steady": { + "duration_sec": 724.937860289, + "samples": 157, + "avg_temp_c": 64.73248407643312, + "p95_temp_c": 68, + "avg_power_w": 460.5487261146498, + "p95_power_w": 524.8340000000001, + "avg_graphics_clock_mhz": 2419.9108280254777, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 86.35031847133757, + "avg_mem_usage_pct": 31.694267515923567, + "clock_cv_pct": 0.5339376530703055, + "power_cv_pct": 31.762270451577855, + "temp_cv_pct": 11.247647554456904, + "clock_drift_pct": 0.3472442778801136 + }, + "precision_steady": [ + { + "precision": "int8", + "status": "OK", + "steady": { + "duration_sec": 58.761884737, + "samples": 22, + "avg_temp_c": 67.81818181818181, + "p95_temp_c": 71.95, + "avg_power_w": 522.4672727272729, + "p95_power_w": 548.589, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 95.45454545454545, + "avg_mem_usage_pct": 38.18181818181818, + "clock_cv_pct": 0, + "power_cv_pct": 18.161439941591066, + "temp_cv_pct": 8.047362477106503, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 1309.5066113409025, + "weighted_teraops_per_sec": 327.3766528352256, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + }, + { + "precision": "fp8", + "status": "OK", + "steady": { + "duration_sec": 118.249988467, + "samples": 18, + "avg_temp_c": 69.27777777777777, + "p95_temp_c": 71, + "avg_power_w": 517.7511111111112, + "p95_power_w": 547.6415, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 98.05555555555556, + "avg_mem_usage_pct": 28.944444444444443, + "clock_cv_pct": 0, + "power_cv_pct": 7.7114632118778434, + "temp_cv_pct": 2.755868528859595, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 923.749016666112, + "weighted_teraops_per_sec": 230.937254166528, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + }, + { + "precision": "fp16", + "status": "OK", + "steady": { + "duration_sec": 178.550102114, + "samples": 20, + "avg_temp_c": 67.6, + "p95_temp_c": 68.05, + "avg_power_w": 502.913, + "p95_power_w": 516.2669999999999, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 95.15, + "avg_mem_usage_pct": 22.5, + "clock_cv_pct": 0, + "power_cv_pct": 5.810409162999742, + "temp_cv_pct": 1.4342248098864878, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 607.5168247338326, + "weighted_teraops_per_sec": 303.7584123669163, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + }, + { + "precision": "fp32", + "status": "OK", + "steady": { + "duration_sec": 231.450409797, + "samples": 18, + "avg_temp_c": 68, + "p95_temp_c": 68, + "avg_power_w": 516.5416666666666, + "p95_power_w": 516.783, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 35, + "clock_cv_pct": 0, + "power_cv_pct": 0.04028584882159023, + "temp_cv_pct": 0, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 424.4014891008, + "weighted_teraops_per_sec": 424.4014891008, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + } + ], + "cooldown": { + "duration_sec": 0, + "samples": 0, + "avg_temp_c": 0, + "p95_temp_c": 0, + "avg_power_w": 0, + "p95_power_w": 0, + "avg_graphics_clock_mhz": 0, + "p95_graphics_clock_mhz": 0, + "avg_memory_clock_mhz": 0, + "p95_memory_clock_mhz": 0, + "avg_usage_pct": 0, + "avg_mem_usage_pct": 0, + "clock_cv_pct": 0, + "power_cv_pct": 0, + "temp_cv_pct": 0, + "clock_drift_pct": 0 + }, + "throttle_counters": { + "sw_power_cap_us": 0, + "sw_thermal_slowdown_us": 0, + "sync_boost_us": 0, + "hw_thermal_slowdown_us": 0, + "hw_power_brake_slowdown_us": 0 + }, + "ecc": { + "corrected": 0, + "uncorrected": 0 + }, + "precision_results": [ + { + "name": "fp16_tensor", + "category": "fp16_bf16", + "supported": true, + "lanes": 16, + "m": 11904, + "n": 11904, + "k": 11904, + "iterations": 14672, + "teraops_per_sec": 164.99729101750273, + "weight": 0.5, + "weighted_teraops_per_sec": 82.49864550875137 + }, + { + "name": "fp32_tf32", + "category": "fp32_tf32", + "supported": true, + "lanes": 16, + "m": 8320, + "n": 8320, + "k": 8320, + "iterations": 14672, + "teraops_per_sec": 56.33366906197334, + "weight": 1, + "weighted_teraops_per_sec": 56.33366906197334 + }, + { + "name": "fp64", + "category": "fp64", + "supported": false, + "weight": 2, + "notes": "benchmark_disabled" + }, + { + "name": "fp8_e4m3", + "category": "fp8", + "supported": true, + "lanes": 16, + "m": 13696, + "n": 13696, + "k": 13696, + "iterations": 14672, + "teraops_per_sec": 251.2923694080546, + "weight": 0.25, + "weighted_teraops_per_sec": 62.82309235201365 + }, + { + "name": "fp8_e5m2", + "category": "fp8", + "supported": false, + "weight": 0.25, + "notes": "unsupported" + }, + { + "name": "int8_tensor", + "category": "int8", + "supported": true, + "lanes": 16, + "m": 10624, + "n": 10624, + "k": 10624, + "iterations": 14672, + "teraops_per_sec": 117.29034003436885, + "weight": 0.25, + "weighted_teraops_per_sec": 29.322585008592213 + } + ], + "scores": { + "compute_score": 1355.767206048869, + "synthetic_score": 1286.47380846947, + "mixed_score": 230.97799193133056, + "mixed_efficiency": 0.17954348577537482, + "power_sustain_score": 76.20730137603232, + "thermal_sustain_score": 66.25705733662929, + "stability_score": 100, + "thermal_throttle_pct": 0, + "power_cap_throttle_pct": 0, + "temp_headroom_c": 22, + "interconnect_score": 3.91, + "server_quality_score": 82.73930761379849, + "composite_score": 1355.767206048869 + } + }, + { + "index": 5, + "uuid": "GPU-8d5d3b52-6221-c572-e4dc-3eb34699d5a4", + "name": "NVIDIA RTX PRO 6000 Blackwell Server Edition", + "bus_id": "00000000:CC:00.0", + "vbios": "98.02.67.00.0A", + "compute_capability": "12.0", + "backend": "cublasLt", + "status": "OK", + "power_limit_w": 600, + "default_power_limit_w": 600, + "max_graphics_clock_mhz": 2430, + "max_memory_clock_mhz": 12481, + "locked_graphics_clock_mhz": 2430, + "locked_memory_clock_mhz": 12481, + "baseline": { + "duration_sec": 16.34797981, + "samples": 4, + "avg_temp_c": 34.25, + "p95_temp_c": 35, + "avg_power_w": 73.3375, + "p95_power_w": 85.8015, + "avg_graphics_clock_mhz": 1782.75, + "p95_graphics_clock_mhz": 2317, + "avg_memory_clock_mhz": 9462, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 0, + "avg_mem_usage_pct": 0, + "clock_cv_pct": 51.905659455541866, + "power_cv_pct": 28.961813248702985, + "temp_cv_pct": 2.4208940075586862, + "clock_drift_pct": 0 + }, + "steady": { + "duration_sec": 724.937860289, + "samples": 157, + "avg_temp_c": 67.00636942675159, + "p95_temp_c": 71, + "avg_power_w": 464.2968152866239, + "p95_power_w": 528.3159999999999, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 86.73248407643312, + "avg_mem_usage_pct": 32.89171974522293, + "clock_cv_pct": 0, + "power_cv_pct": 31.71456153190515, + "temp_cv_pct": 10.633844797527264, + "clock_drift_pct": 0 + }, + "precision_steady": [ + { + "precision": "int8", + "status": "OK", + "steady": { + "duration_sec": 58.761884737, + "samples": 22, + "avg_temp_c": 71.0909090909091, + "p95_temp_c": 75, + "avg_power_w": 530.6718181818183, + "p95_power_w": 560.248, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 95.45454545454545, + "avg_mem_usage_pct": 37.13636363636363, + "clock_cv_pct": 0, + "power_cv_pct": 18.15550586767587, + "temp_cv_pct": 8.07957493551474, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 1309.9208810692608, + "weighted_teraops_per_sec": 327.4802202673152, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + }, + { + "precision": "fp8", + "status": "OK", + "steady": { + "duration_sec": 118.249988467, + "samples": 18, + "avg_temp_c": 72.94444444444444, + "p95_temp_c": 74, + "avg_power_w": 526.0333333333333, + "p95_power_w": 558.8825, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 30.555555555555557, + "clock_cv_pct": 0, + "power_cv_pct": 11.312392089568855, + "temp_cv_pct": 1.0689770637942269, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 923.749016666112, + "weighted_teraops_per_sec": 230.937254166528, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + }, + { + "precision": "fp16", + "status": "OK", + "steady": { + "duration_sec": 178.550102114, + "samples": 20, + "avg_temp_c": 70.2, + "p95_temp_c": 71, + "avg_power_w": 511.89399999999995, + "p95_power_w": 520.6764999999999, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 95.5, + "avg_mem_usage_pct": 23.55, + "clock_cv_pct": 0, + "power_cv_pct": 2.1604346444422604, + "temp_cv_pct": 2.76221074496657, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 607.5168247338326, + "weighted_teraops_per_sec": 303.7584123669163, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + }, + { + "precision": "fp32", + "status": "OK", + "steady": { + "duration_sec": 231.450409797, + "samples": 18, + "avg_temp_c": 70, + "p95_temp_c": 70, + "avg_power_w": 520.6077777777778, + "p95_power_w": 520.8315, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 32.388888888888886, + "clock_cv_pct": 0, + "power_cv_pct": 0.03169570159890303, + "temp_cv_pct": 0, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 424.4014891008, + "weighted_teraops_per_sec": 424.4014891008, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + } + ], + "cooldown": { + "duration_sec": 0, + "samples": 0, + "avg_temp_c": 0, + "p95_temp_c": 0, + "avg_power_w": 0, + "p95_power_w": 0, + "avg_graphics_clock_mhz": 0, + "p95_graphics_clock_mhz": 0, + "avg_memory_clock_mhz": 0, + "p95_memory_clock_mhz": 0, + "avg_usage_pct": 0, + "avg_mem_usage_pct": 0, + "clock_cv_pct": 0, + "power_cv_pct": 0, + "temp_cv_pct": 0, + "clock_drift_pct": 0 + }, + "throttle_counters": { + "sw_power_cap_us": 0, + "sw_thermal_slowdown_us": 0, + "sync_boost_us": 0, + "hw_thermal_slowdown_us": 0, + "hw_power_brake_slowdown_us": 0 + }, + "ecc": { + "corrected": 0, + "uncorrected": 0 + }, + "precision_results": [ + { + "name": "fp16_tensor", + "category": "fp16_bf16", + "supported": true, + "lanes": 16, + "m": 11904, + "n": 11904, + "k": 11904, + "iterations": 14672, + "teraops_per_sec": 164.99729101750273, + "weight": 0.5, + "weighted_teraops_per_sec": 82.49864550875137 + }, + { + "name": "fp32_tf32", + "category": "fp32_tf32", + "supported": true, + "lanes": 16, + "m": 8320, + "n": 8320, + "k": 8320, + "iterations": 14672, + "teraops_per_sec": 56.33366906197334, + "weight": 1, + "weighted_teraops_per_sec": 56.33366906197334 + }, + { + "name": "fp64", + "category": "fp64", + "supported": false, + "weight": 2, + "notes": "benchmark_disabled" + }, + { + "name": "fp8_e4m3", + "category": "fp8", + "supported": true, + "lanes": 16, + "m": 13696, + "n": 13696, + "k": 13696, + "iterations": 14672, + "teraops_per_sec": 251.2923694080546, + "weight": 0.25, + "weighted_teraops_per_sec": 62.82309235201365 + }, + { + "name": "fp8_e5m2", + "category": "fp8", + "supported": false, + "weight": 0.25, + "notes": "unsupported" + }, + { + "name": "int8_tensor", + "category": "int8", + "supported": true, + "lanes": 16, + "m": 10624, + "n": 10624, + "k": 10624, + "iterations": 14672, + "teraops_per_sec": 117.29034003436885, + "weight": 0.25, + "weighted_teraops_per_sec": 29.322585008592213 + } + ], + "scores": { + "compute_score": 1355.8707734809586, + "synthetic_score": 1286.5773759015594, + "mixed_score": 230.97799193133056, + "mixed_efficiency": 0.17952903281038537, + "power_sustain_score": 76.2549787725356, + "thermal_sustain_score": 68.0984656074182, + "stability_score": 100, + "thermal_throttle_pct": 0, + "power_cap_throttle_pct": 0, + "temp_headroom_c": 19, + "interconnect_score": 3.91, + "server_quality_score": 83.30603331398613, + "composite_score": 1355.8707734809586 + } + }, + { + "index": 6, + "uuid": "GPU-a23c67ec-a8e2-7ebf-2593-79d73ec889a6", + "name": "NVIDIA RTX PRO 6000 Blackwell Server Edition", + "bus_id": "00000000:CE:00.0", + "vbios": "98.02.67.00.0A", + "compute_capability": "12.0", + "backend": "cublasLt", + "status": "OK", + "power_limit_w": 600, + "default_power_limit_w": 600, + "max_graphics_clock_mhz": 2430, + "max_memory_clock_mhz": 12481, + "locked_graphics_clock_mhz": 2430, + "locked_memory_clock_mhz": 12481, + "baseline": { + "duration_sec": 16.34797981, + "samples": 4, + "avg_temp_c": 31.25, + "p95_temp_c": 32, + "avg_power_w": 73.7075, + "p95_power_w": 86.74, + "avg_graphics_clock_mhz": 1788.75, + "p95_graphics_clock_mhz": 2325, + "avg_memory_clock_mhz": 9462, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 0, + "avg_mem_usage_pct": 0, + "clock_cv_pct": 51.925212889381434, + "power_cv_pct": 29.862341393273855, + "temp_cv_pct": 2.6532998322843198, + "clock_drift_pct": 0 + }, + "steady": { + "duration_sec": 724.937860289, + "samples": 157, + "avg_temp_c": 66.35031847133757, + "p95_temp_c": 70, + "avg_power_w": 462.46401273885334, + "p95_power_w": 526.5980000000001, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 86.73885350318471, + "avg_mem_usage_pct": 34.089171974522294, + "clock_cv_pct": 0, + "power_cv_pct": 31.7070851427136, + "temp_cv_pct": 11.184280711394349, + "clock_drift_pct": 0 + }, + "precision_steady": [ + { + "precision": "int8", + "status": "OK", + "steady": { + "duration_sec": 58.761884737, + "samples": 22, + "avg_temp_c": 68.5909090909091, + "p95_temp_c": 72, + "avg_power_w": 522.0795454545455, + "p95_power_w": 548.627, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 95.45454545454545, + "avg_mem_usage_pct": 38.18181818181818, + "clock_cv_pct": 0, + "power_cv_pct": 18.081421548128024, + "temp_cv_pct": 8.017459903596952, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 1309.9208810692608, + "weighted_teraops_per_sec": 327.4802202673152, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + }, + { + "precision": "fp8", + "status": "OK", + "steady": { + "duration_sec": 118.249988467, + "samples": 18, + "avg_temp_c": 71.16666666666667, + "p95_temp_c": 72, + "avg_power_w": 519.4477777777778, + "p95_power_w": 548.031, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 31.38888888888889, + "clock_cv_pct": 0, + "power_cv_pct": 10.07170232052322, + "temp_cv_pct": 0.7025761124121781, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 923.749016666112, + "weighted_teraops_per_sec": 230.937254166528, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + }, + { + "precision": "fp16", + "status": "OK", + "steady": { + "duration_sec": 178.550102114, + "samples": 20, + "avg_temp_c": 69.2, + "p95_temp_c": 70, + "avg_power_w": 505.19000000000005, + "p95_power_w": 517.1045, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 95.05, + "avg_mem_usage_pct": 24.35, + "clock_cv_pct": 0, + "power_cv_pct": 4.481655194856258, + "temp_cv_pct": 2.8021270852117515, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 607.5168247338326, + "weighted_teraops_per_sec": 303.7584123669163, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + }, + { + "precision": "fp32", + "status": "OK", + "steady": { + "duration_sec": 231.450409797, + "samples": 18, + "avg_temp_c": 69, + "p95_temp_c": 69, + "avg_power_w": 517.5283333333333, + "p95_power_w": 517.769, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 34, + "clock_cv_pct": 0, + "power_cv_pct": 0.04081322462035067, + "temp_cv_pct": 0, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 424.4014891008, + "weighted_teraops_per_sec": 424.4014891008, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + } + ], + "cooldown": { + "duration_sec": 0, + "samples": 0, + "avg_temp_c": 0, + "p95_temp_c": 0, + "avg_power_w": 0, + "p95_power_w": 0, + "avg_graphics_clock_mhz": 0, + "p95_graphics_clock_mhz": 0, + "avg_memory_clock_mhz": 0, + "p95_memory_clock_mhz": 0, + "avg_usage_pct": 0, + "avg_mem_usage_pct": 0, + "clock_cv_pct": 0, + "power_cv_pct": 0, + "temp_cv_pct": 0, + "clock_drift_pct": 0 + }, + "throttle_counters": { + "sw_power_cap_us": 0, + "sw_thermal_slowdown_us": 0, + "sync_boost_us": 0, + "hw_thermal_slowdown_us": 0, + "hw_power_brake_slowdown_us": 0 + }, + "ecc": { + "corrected": 0, + "uncorrected": 0 + }, + "precision_results": [ + { + "name": "fp16_tensor", + "category": "fp16_bf16", + "supported": true, + "lanes": 16, + "m": 11904, + "n": 11904, + "k": 11904, + "iterations": 14672, + "teraops_per_sec": 164.99729101750273, + "weight": 0.5, + "weighted_teraops_per_sec": 82.49864550875137 + }, + { + "name": "fp32_tf32", + "category": "fp32_tf32", + "supported": true, + "lanes": 16, + "m": 8320, + "n": 8320, + "k": 8320, + "iterations": 14672, + "teraops_per_sec": 56.33366906197334, + "weight": 1, + "weighted_teraops_per_sec": 56.33366906197334 + }, + { + "name": "fp64", + "category": "fp64", + "supported": false, + "weight": 2, + "notes": "benchmark_disabled" + }, + { + "name": "fp8_e4m3", + "category": "fp8", + "supported": true, + "lanes": 16, + "m": 13696, + "n": 13696, + "k": 13696, + "iterations": 14672, + "teraops_per_sec": 251.2923694080546, + "weight": 0.25, + "weighted_teraops_per_sec": 62.82309235201365 + }, + { + "name": "fp8_e5m2", + "category": "fp8", + "supported": false, + "weight": 0.25, + "notes": "unsupported" + }, + { + "name": "int8_tensor", + "category": "int8", + "supported": true, + "lanes": 16, + "m": 10624, + "n": 10624, + "k": 10624, + "iterations": 14672, + "teraops_per_sec": 117.29034003436885, + "weight": 0.25, + "weighted_teraops_per_sec": 29.322585008592213 + } + ], + "scores": { + "compute_score": 1355.8707734809586, + "synthetic_score": 1286.5773759015594, + "mixed_score": 230.97799193133056, + "mixed_efficiency": 0.17952903281038537, + "power_sustain_score": 75.4933057839041, + "thermal_sustain_score": 66.44715786581696, + "stability_score": 100, + "thermal_throttle_pct": 0, + "power_cap_throttle_pct": 0, + "temp_headroom_c": 20, + "interconnect_score": 3.91, + "server_quality_score": 82.58213909491633, + "composite_score": 1355.8707734809586 + } + }, + { + "index": 7, + "uuid": "GPU-f9d537b7-86a1-407c-c137-3bc30fb8c2e8", + "name": "NVIDIA RTX PRO 6000 Blackwell Server Edition", + "bus_id": "00000000:CF:00.0", + "vbios": "98.02.67.00.0A", + "compute_capability": "12.0", + "backend": "cublasLt", + "status": "OK", + "power_limit_w": 600, + "default_power_limit_w": 600, + "max_graphics_clock_mhz": 2430, + "max_memory_clock_mhz": 12481, + "locked_graphics_clock_mhz": 2430, + "locked_memory_clock_mhz": 12481, + "baseline": { + "duration_sec": 16.34797981, + "samples": 4, + "avg_temp_c": 33.75, + "p95_temp_c": 34.85, + "avg_power_w": 72.055, + "p95_power_w": 84.75250000000001, + "avg_graphics_clock_mhz": 1794, + "p95_graphics_clock_mhz": 2332, + "avg_memory_clock_mhz": 9462, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 0, + "avg_mem_usage_pct": 0, + "clock_cv_pct": 51.94221485351483, + "power_cv_pct": 29.630924486789787, + "temp_cv_pct": 3.228814032252351, + "clock_drift_pct": 0 + }, + "steady": { + "duration_sec": 724.937860289, + "samples": 157, + "avg_temp_c": 67.80891719745223, + "p95_temp_c": 71, + "avg_power_w": 461.598789808917, + "p95_power_w": 525.4, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 86.7452229299363, + "avg_mem_usage_pct": 33.76433121019108, + "clock_cv_pct": 0, + "power_cv_pct": 31.791537742385028, + "temp_cv_pct": 10.65023953983696, + "clock_drift_pct": 0 + }, + "precision_steady": [ + { + "precision": "int8", + "status": "OK", + "steady": { + "duration_sec": 58.761884737, + "samples": 22, + "avg_temp_c": 71.0909090909091, + "p95_temp_c": 75, + "avg_power_w": 523.3618181818182, + "p95_power_w": 549.8835, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 95.45454545454545, + "avg_mem_usage_pct": 37.22727272727273, + "clock_cv_pct": 0, + "power_cv_pct": 18.115883867382486, + "temp_cv_pct": 8.02372349977033, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 1309.9208810692608, + "weighted_teraops_per_sec": 327.4802202673152, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + }, + { + "precision": "fp8", + "status": "OK", + "steady": { + "duration_sec": 118.249988467, + "samples": 18, + "avg_temp_c": 73.22222222222223, + "p95_temp_c": 74, + "avg_power_w": 519.643888888889, + "p95_power_w": 549.0155, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 31, + "clock_cv_pct": 0, + "power_cv_pct": 10.41261444655753, + "temp_cv_pct": 0.7277437819897906, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 923.749016666112, + "weighted_teraops_per_sec": 230.937254166528, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + }, + { + "precision": "fp16", + "status": "OK", + "steady": { + "duration_sec": 178.550102114, + "samples": 20, + "avg_temp_c": 70.9, + "p95_temp_c": 72, + "avg_power_w": 505.99399999999997, + "p95_power_w": 517.3545, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 95, + "avg_mem_usage_pct": 24.5, + "clock_cv_pct": 0, + "power_cv_pct": 3.5486071584451433, + "temp_cv_pct": 2.6349142020126104, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 607.5168247338326, + "weighted_teraops_per_sec": 303.7584123669163, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + }, + { + "precision": "fp32", + "status": "OK", + "steady": { + "duration_sec": 231.450409797, + "samples": 18, + "avg_temp_c": 71, + "p95_temp_c": 71, + "avg_power_w": 517.5183333333332, + "p95_power_w": 517.706, + "avg_graphics_clock_mhz": 2422, + "p95_graphics_clock_mhz": 2422, + "avg_memory_clock_mhz": 12481, + "p95_memory_clock_mhz": 12481, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 34, + "clock_cv_pct": 0, + "power_cv_pct": 0.02004226308569274, + "temp_cv_pct": 0, + "clock_drift_pct": 0 + }, + "teraops_per_sec": 424.4014891008, + "weighted_teraops_per_sec": 424.4014891008, + "ecc": { + "corrected": 0, + "uncorrected": 0 + } + } + ], + "cooldown": { + "duration_sec": 0, + "samples": 0, + "avg_temp_c": 0, + "p95_temp_c": 0, + "avg_power_w": 0, + "p95_power_w": 0, + "avg_graphics_clock_mhz": 0, + "p95_graphics_clock_mhz": 0, + "avg_memory_clock_mhz": 0, + "p95_memory_clock_mhz": 0, + "avg_usage_pct": 0, + "avg_mem_usage_pct": 0, + "clock_cv_pct": 0, + "power_cv_pct": 0, + "temp_cv_pct": 0, + "clock_drift_pct": 0 + }, + "throttle_counters": { + "sw_power_cap_us": 0, + "sw_thermal_slowdown_us": 0, + "sync_boost_us": 0, + "hw_thermal_slowdown_us": 0, + "hw_power_brake_slowdown_us": 0 + }, + "ecc": { + "corrected": 0, + "uncorrected": 0 + }, + "precision_results": [ + { + "name": "fp16_tensor", + "category": "fp16_bf16", + "supported": true, + "lanes": 16, + "m": 11904, + "n": 11904, + "k": 11904, + "iterations": 14672, + "teraops_per_sec": 164.99729101750273, + "weight": 0.5, + "weighted_teraops_per_sec": 82.49864550875137 + }, + { + "name": "fp32_tf32", + "category": "fp32_tf32", + "supported": true, + "lanes": 16, + "m": 8320, + "n": 8320, + "k": 8320, + "iterations": 14672, + "teraops_per_sec": 56.33366906197334, + "weight": 1, + "weighted_teraops_per_sec": 56.33366906197334 + }, + { + "name": "fp64", + "category": "fp64", + "supported": false, + "weight": 2, + "notes": "benchmark_disabled" + }, + { + "name": "fp8_e4m3", + "category": "fp8", + "supported": true, + "lanes": 16, + "m": 13696, + "n": 13696, + "k": 13696, + "iterations": 14672, + "teraops_per_sec": 251.2923694080546, + "weight": 0.25, + "weighted_teraops_per_sec": 62.82309235201365 + }, + { + "name": "fp8_e5m2", + "category": "fp8", + "supported": false, + "weight": 0.25, + "notes": "unsupported" + }, + { + "name": "int8_tensor", + "category": "int8", + "supported": true, + "lanes": 16, + "m": 10624, + "n": 10624, + "k": 10624, + "iterations": 14672, + "teraops_per_sec": 117.29034003436885, + "weight": 0.25, + "weighted_teraops_per_sec": 29.322585008592213 + } + ], + "scores": { + "compute_score": 1355.8707734809586, + "synthetic_score": 1286.5773759015594, + "mixed_score": 230.97799193133056, + "mixed_efficiency": 0.17952903281038537, + "power_sustain_score": 75.92713919839686, + "thermal_sustain_score": 68.04928138048912, + "stability_score": 100, + "thermal_throttle_pct": 0, + "power_cap_throttle_pct": 0, + "temp_headroom_c": 19, + "interconnect_score": 3.91, + "server_quality_score": 83.1929261736658, + "composite_score": 1355.8707734809586 + } + } + ], + "interconnect": { + "status": "OK", + "attempted": true, + "supported": true, + "selected_gpu_indices": [ + 0, + 1, + 2, + 3, + 4, + 5, + 6, + 7 + ], + "avg_algbw_gbps": 2.2125000000000004, + "max_algbw_gbps": 2.24, + "avg_busbw_gbps": 3.8725, + "max_busbw_gbps": 3.91 + }, + "server_power": { + "available": false, + "notes": [ + "IPMI power reading unavailable; server-side power characterization skipped" + ] + } +} \ No newline at end of file diff --git a/perf/perf-20260417-154119/result.json b/perf/perf-20260417-154119/result.json new file mode 100644 index 0000000..beda2f2 --- /dev/null +++ b/perf/perf-20260417-154119/result.json @@ -0,0 +1,1840 @@ +{ + "benchmark_version": "2", + "generated_at": "2026-04-17T15:41:19.563694878Z", + "hostname": "debian", + "server_model": "CG480-S5063", + "benchmark_profile": "standard", + "parallel_gpus": true, + "ramp_total": 8, + "ramp_run_id": "ramp-20260417-151651", + "overall_status": "FAILED", + "selected_gpu_indices": [ + 0, + 1, + 2, + 3, + 4, + 5, + 6, + 7 + ], + "findings": [ + "0 of 8 GPU(s) passed the benchmark.", + "GPU 0 had incomplete precision coverage: int8:FAILED, fp8:FAILED, fp16:FAILED, fp32:FAILED.", + "GPU 1 had incomplete precision coverage: int8:FAILED, fp8:FAILED, fp16:FAILED, fp32:FAILED.", + "GPU 2 had incomplete precision coverage: int8:FAILED, fp8:FAILED, fp16:FAILED, fp32:FAILED.", + "GPU 3 had incomplete precision coverage: int8:FAILED, fp8:FAILED, fp16:FAILED, fp32:FAILED.", + "GPU 4 had incomplete precision coverage: int8:FAILED, fp8:FAILED, fp16:FAILED, fp32:FAILED.", + "GPU 5 had incomplete precision coverage: int8:FAILED, fp8:FAILED, fp16:FAILED, fp32:FAILED.", + "GPU 6 had incomplete precision coverage: int8:FAILED, fp8:FAILED, fp16:FAILED, fp32:FAILED.", + "GPU 7 had incomplete precision coverage: int8:FAILED, fp8:FAILED, fp16:FAILED, fp32:FAILED." + ], + "normalization": { + "status": "full", + "gpus": [ + { + "index": 0, + "persistence_mode": "applied", + "gpu_clock_lock_mhz": 1785, + "gpu_clock_lock_status": "applied", + "memory_clock_lock_mhz": 3201, + "memory_clock_lock_status": "applied" + }, + { + "index": 1, + "persistence_mode": "applied", + "gpu_clock_lock_mhz": 1785, + "gpu_clock_lock_status": "applied", + "memory_clock_lock_mhz": 3201, + "memory_clock_lock_status": "applied" + }, + { + "index": 2, + "persistence_mode": "applied", + "gpu_clock_lock_mhz": 1785, + "gpu_clock_lock_status": "applied", + "memory_clock_lock_mhz": 3201, + "memory_clock_lock_status": "applied" + }, + { + "index": 3, + "persistence_mode": "applied", + "gpu_clock_lock_mhz": 1785, + "gpu_clock_lock_status": "applied", + "memory_clock_lock_mhz": 3201, + "memory_clock_lock_status": "applied" + }, + { + "index": 4, + "persistence_mode": "applied", + "gpu_clock_lock_mhz": 1785, + "gpu_clock_lock_status": "applied", + "memory_clock_lock_mhz": 3201, + "memory_clock_lock_status": "applied" + }, + { + "index": 5, + "persistence_mode": "applied", + "gpu_clock_lock_mhz": 1785, + "gpu_clock_lock_status": "applied", + "memory_clock_lock_mhz": 3201, + "memory_clock_lock_status": "applied" + }, + { + "index": 6, + "persistence_mode": "applied", + "gpu_clock_lock_mhz": 1785, + "gpu_clock_lock_status": "applied", + "memory_clock_lock_mhz": 3201, + "memory_clock_lock_status": "applied" + }, + { + "index": 7, + "persistence_mode": "applied", + "gpu_clock_lock_mhz": 1785, + "gpu_clock_lock_status": "applied", + "memory_clock_lock_mhz": 3201, + "memory_clock_lock_status": "applied" + } + ] + }, + "host_config": { + "cpu_model": "Intel(R) Xeon(R) 6505P", + "cpu_sockets": 2, + "cpu_cores": 24, + "cpu_threads": 48, + "mem_total_gib": 125.17120742797852 + }, + "cpu_load": { + "avg_pct": 13.3, + "max_pct": 20.1, + "p95_pct": 19.1, + "samples": 65, + "status": "ok" + }, + "cooling": { + "available": true, + "avg_fan_rpm": 12551.062569676678, + "fan_duty_cycle_available": true, + "fan_duty_cycle_estimated": true, + "avg_fan_duty_cycle_pct": 74.86946212697437, + "p95_fan_duty_cycle_pct": 96.68469785575046, + "notes": [ + "fan duty cycle is estimated from the highest fan RPM observed since boot; treat it as an approximation, not a direct PWM reading" + ] + }, + "gpus": [ + { + "index": 0, + "uuid": "GPU-9514fbcc-bb3d-8faf-3e8b-f59b3dcd3bfb", + "name": "NVIDIA H200 NVL", + "bus_id": "00000000:10:00.0", + "vbios": "96.00.D9.00.0E", + "compute_capability": "9.0", + "status": "UNSUPPORTED", + "power_limit_w": 600, + "default_power_limit_w": 600, + "max_graphics_clock_mhz": 1785, + "max_memory_clock_mhz": 3201, + "locked_graphics_clock_mhz": 1785, + "locked_memory_clock_mhz": 3201, + "baseline": { + "duration_sec": 17.70195119, + "samples": 2, + "avg_temp_c": 42.5, + "p95_temp_c": 43.85, + "avg_power_w": 97.315, + "p95_power_w": 98.0395, + "avg_graphics_clock_mhz": 1635, + "p95_graphics_clock_mhz": 1635, + "avg_memory_clock_mhz": 3201, + "p95_memory_clock_mhz": 3201, + "avg_usage_pct": 0, + "avg_mem_usage_pct": 0, + "clock_cv_pct": 0, + "power_cv_pct": 0.8272106047371934, + "temp_cv_pct": 3.5294117647058822, + "clock_drift_pct": 0 + }, + "steady": { + "duration_sec": 527.65309417, + "samples": 45, + "avg_temp_c": 61.8, + "p95_temp_c": 65.8, + "avg_power_w": 468.82244444444456, + "p95_power_w": 507.108, + "avg_graphics_clock_mhz": 1635, + "p95_graphics_clock_mhz": 1635, + "avg_memory_clock_mhz": 3201, + "p95_memory_clock_mhz": 3201, + "avg_usage_pct": 95.55555555555556, + "avg_mem_usage_pct": 43.111111111111114, + "clock_cv_pct": 0, + "power_cv_pct": 19.23666310098599, + "temp_cv_pct": 7.6629128954382075, + "clock_drift_pct": 0 + }, + "precision_steady": [ + { + "precision": "int8", + "status": "FAILED", + "steady": { + "duration_sec": 58.529044441, + "samples": 13, + "avg_temp_c": 56.69230769230769, + "p95_temp_c": 64, + "avg_power_w": 502.67538461538453, + "p95_power_w": 533.738, + "avg_graphics_clock_mhz": 1635, + "p95_graphics_clock_mhz": 1635, + "avg_memory_clock_mhz": 3201, + "p95_memory_clock_mhz": 3201, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 79.07692307692308, + "clock_cv_pct": 0, + "power_cv_pct": 15.340700843700555, + "temp_cv_pct": 13.206848694593024, + "clock_drift_pct": 0 + }, + "ecc": { + "corrected": 0, + "uncorrected": 0 + }, + "notes": "phase produced no output" + }, + { + "precision": "fp8", + "status": "FAILED", + "steady": { + "duration_sec": 115.978129508, + "samples": 10, + "avg_temp_c": 66.1, + "p95_temp_c": 67, + "avg_power_w": 554.813, + "p95_power_w": 563.286, + "avg_graphics_clock_mhz": 1635, + "p95_graphics_clock_mhz": 1635, + "avg_memory_clock_mhz": 3201, + "p95_memory_clock_mhz": 3201, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 53.6, + "clock_cv_pct": 0, + "power_cv_pct": 2.4256976823456045, + "temp_cv_pct": 2.38725171528888, + "clock_drift_pct": 0 + }, + "ecc": { + "corrected": 0, + "uncorrected": 0 + }, + "notes": "phase produced no output" + }, + { + "precision": "fp16", + "status": "FAILED", + "steady": { + "duration_sec": 179.082805727, + "samples": 11, + "avg_temp_c": 64.63636363636364, + "p95_temp_c": 67, + "avg_power_w": 516.5, + "p95_power_w": 562.2349999999999, + "avg_graphics_clock_mhz": 1635, + "p95_graphics_clock_mhz": 1635, + "avg_memory_clock_mhz": 3201, + "p95_memory_clock_mhz": 3201, + "avg_usage_pct": 91.27272727272727, + "avg_mem_usage_pct": 42.63636363636363, + "clock_cv_pct": 0, + "power_cv_pct": 9.649207157978053, + "temp_cv_pct": 3.862033816524888, + "clock_drift_pct": 0 + }, + "ecc": { + "corrected": 0, + "uncorrected": 0 + }, + "notes": "phase produced no output" + }, + { + "precision": "fp32", + "status": "FAILED", + "steady": { + "duration_sec": 204.385589702, + "samples": 4, + "avg_temp_c": 63, + "p95_temp_c": 63, + "avg_power_w": 495.315, + "p95_power_w": 497.57349999999997, + "avg_graphics_clock_mhz": 1635, + "p95_graphics_clock_mhz": 1635, + "avg_memory_clock_mhz": 3201, + "p95_memory_clock_mhz": 3201, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 44.25, + "clock_cv_pct": 0, + "power_cv_pct": 0.3479587927999076, + "temp_cv_pct": 0, + "clock_drift_pct": 0 + }, + "ecc": { + "corrected": 0, + "uncorrected": 0 + }, + "notes": "phase produced no output" + } + ], + "precision_failures": [ + "int8:FAILED", + "fp8:FAILED", + "fp16:FAILED", + "fp32:FAILED" + ], + "cooldown": { + "duration_sec": 0, + "samples": 0, + "avg_temp_c": 0, + "p95_temp_c": 0, + "avg_power_w": 0, + "p95_power_w": 0, + "avg_graphics_clock_mhz": 0, + "p95_graphics_clock_mhz": 0, + "avg_memory_clock_mhz": 0, + "p95_memory_clock_mhz": 0, + "avg_usage_pct": 0, + "avg_mem_usage_pct": 0, + "clock_cv_pct": 0, + "power_cv_pct": 0, + "temp_cv_pct": 0, + "clock_drift_pct": 0 + }, + "throttle_counters": { + "sw_power_cap_us": 499976, + "sw_thermal_slowdown_us": 499976, + "sync_boost_us": 0, + "hw_thermal_slowdown_us": 0, + "hw_power_brake_slowdown_us": 0 + }, + "ecc": { + "corrected": 0, + "uncorrected": 0 + }, + "scores": { + "compute_score": 0, + "power_sustain_score": 79.1773266423819, + "thermal_sustain_score": 77.01126131368538, + "stability_score": 99.81049064033768, + "thermal_throttle_pct": 0.09475467983116138, + "power_cap_throttle_pct": 0.09475467983116138, + "temp_headroom_c": 24.200000000000003, + "interconnect_score": 0, + "server_quality_score": 86.78077264295526, + "composite_score": 0 + }, + "notes": [ + "precision plan failed: signal: killed" + ] + }, + { + "index": 1, + "uuid": "GPU-bd48250e-65fc-018c-cad1-38b51deb8654", + "name": "NVIDIA H200 NVL", + "bus_id": "00000000:11:00.0", + "vbios": "96.00.D9.00.0E", + "compute_capability": "9.0", + "status": "UNSUPPORTED", + "power_limit_w": 600, + "default_power_limit_w": 600, + "max_graphics_clock_mhz": 1785, + "max_memory_clock_mhz": 3201, + "locked_graphics_clock_mhz": 1785, + "locked_memory_clock_mhz": 3201, + "baseline": { + "duration_sec": 17.70195119, + "samples": 2, + "avg_temp_c": 45, + "p95_temp_c": 46.8, + "avg_power_w": 101.125, + "p95_power_w": 101.9665, + "avg_graphics_clock_mhz": 1635, + "p95_graphics_clock_mhz": 1635, + "avg_memory_clock_mhz": 3201, + "p95_memory_clock_mhz": 3201, + "avg_usage_pct": 0, + "avg_mem_usage_pct": 0, + "clock_cv_pct": 0, + "power_cv_pct": 0.9245982694684818, + "temp_cv_pct": 4.444444444444445, + "clock_drift_pct": 0 + }, + "steady": { + "duration_sec": 527.65309417, + "samples": 45, + "avg_temp_c": 65.33333333333333, + "p95_temp_c": 69, + "avg_power_w": 488.67600000000004, + "p95_power_w": 528.658, + "avg_graphics_clock_mhz": 1635, + "p95_graphics_clock_mhz": 1635, + "avg_memory_clock_mhz": 3201, + "p95_memory_clock_mhz": 3201, + "avg_usage_pct": 95.55555555555556, + "avg_mem_usage_pct": 43.24444444444445, + "clock_cv_pct": 0, + "power_cv_pct": 18.798043777423782, + "temp_cv_pct": 7.553777764621119, + "clock_drift_pct": 0 + }, + "precision_steady": [ + { + "precision": "int8", + "status": "FAILED", + "steady": { + "duration_sec": 58.529044441, + "samples": 13, + "avg_temp_c": 59.23076923076923, + "p95_temp_c": 67, + "avg_power_w": 514.8653846153846, + "p95_power_w": 545.828, + "avg_graphics_clock_mhz": 1635, + "p95_graphics_clock_mhz": 1635, + "avg_memory_clock_mhz": 3201, + "p95_memory_clock_mhz": 3201, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 79, + "clock_cv_pct": 0, + "power_cv_pct": 15.74138305807383, + "temp_cv_pct": 13.541413400246311, + "clock_drift_pct": 0 + }, + "ecc": { + "corrected": 0, + "uncorrected": 0 + }, + "notes": "phase produced no output" + }, + { + "precision": "fp8", + "status": "FAILED", + "steady": { + "duration_sec": 115.978129508, + "samples": 10, + "avg_temp_c": 69.8, + "p95_temp_c": 71, + "avg_power_w": 578.1009999999999, + "p95_power_w": 587.2345, + "avg_graphics_clock_mhz": 1635, + "p95_graphics_clock_mhz": 1635, + "avg_memory_clock_mhz": 3201, + "p95_memory_clock_mhz": 3201, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 53.7, + "clock_cv_pct": 0, + "power_cv_pct": 2.6721987904928524, + "temp_cv_pct": 2.200901360420805, + "clock_drift_pct": 0 + }, + "ecc": { + "corrected": 0, + "uncorrected": 0 + }, + "notes": "phase produced no output" + }, + { + "precision": "fp16", + "status": "FAILED", + "steady": { + "duration_sec": 179.082805727, + "samples": 11, + "avg_temp_c": 68.63636363636364, + "p95_temp_c": 71, + "avg_power_w": 539.5336363636363, + "p95_power_w": 587.6099999999999, + "avg_graphics_clock_mhz": 1635, + "p95_graphics_clock_mhz": 1635, + "avg_memory_clock_mhz": 3201, + "p95_memory_clock_mhz": 3201, + "avg_usage_pct": 91.18181818181819, + "avg_mem_usage_pct": 43.27272727272727, + "clock_cv_pct": 0, + "power_cv_pct": 9.66483315772293, + "temp_cv_pct": 3.6369616470850277, + "clock_drift_pct": 0 + }, + "ecc": { + "corrected": 0, + "uncorrected": 0 + }, + "notes": "phase produced no output" + }, + { + "precision": "fp32", + "status": "FAILED", + "steady": { + "duration_sec": 204.385589702, + "samples": 4, + "avg_temp_c": 67, + "p95_temp_c": 67, + "avg_power_w": 518.345, + "p95_power_w": 520.1735, + "avg_graphics_clock_mhz": 1635, + "p95_graphics_clock_mhz": 1635, + "avg_memory_clock_mhz": 3201, + "p95_memory_clock_mhz": 3201, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 47.25, + "clock_cv_pct": 0, + "power_cv_pct": 0.41658246692557344, + "temp_cv_pct": 0, + "clock_drift_pct": 0 + }, + "ecc": { + "corrected": 0, + "uncorrected": 0 + }, + "notes": "phase produced no output" + } + ], + "precision_failures": [ + "int8:FAILED", + "fp8:FAILED", + "fp16:FAILED", + "fp32:FAILED" + ], + "cooldown": { + "duration_sec": 0, + "samples": 0, + "avg_temp_c": 0, + "p95_temp_c": 0, + "avg_power_w": 0, + "p95_power_w": 0, + "avg_graphics_clock_mhz": 0, + "p95_graphics_clock_mhz": 0, + "avg_memory_clock_mhz": 0, + "p95_memory_clock_mhz": 0, + "avg_usage_pct": 0, + "avg_mem_usage_pct": 0, + "clock_cv_pct": 0, + "power_cv_pct": 0, + "temp_cv_pct": 0, + "clock_drift_pct": 0 + }, + "throttle_counters": { + "sw_power_cap_us": 599991, + "sw_thermal_slowdown_us": 599991, + "sync_boost_us": 0, + "hw_thermal_slowdown_us": 0, + "hw_power_brake_slowdown_us": 0 + }, + "ecc": { + "corrected": 0, + "uncorrected": 0 + }, + "scores": { + "compute_score": 0, + "power_sustain_score": 78.62875189508861, + "thermal_sustain_score": 77.33866670613665, + "stability_score": 99.77258126347434, + "thermal_throttle_pct": 0.11370936826283333, + "power_cap_throttle_pct": 0.11370936826283333, + "temp_headroom_c": 21, + "interconnect_score": 0, + "server_quality_score": 86.69925808575731, + "composite_score": 0 + }, + "notes": [ + "precision plan failed: signal: killed" + ] + }, + { + "index": 2, + "uuid": "GPU-eb2c2fb8-6cfb-8cc4-cfd7-9c5d2e6af0fe", + "name": "NVIDIA H200 NVL", + "bus_id": "00000000:37:00.0", + "vbios": "96.00.D9.00.0E", + "compute_capability": "9.0", + "status": "UNSUPPORTED", + "power_limit_w": 600, + "default_power_limit_w": 600, + "max_graphics_clock_mhz": 1785, + "max_memory_clock_mhz": 3201, + "locked_graphics_clock_mhz": 1785, + "locked_memory_clock_mhz": 3201, + "baseline": { + "duration_sec": 17.70195119, + "samples": 2, + "avg_temp_c": 44.5, + "p95_temp_c": 45.85, + "avg_power_w": 100.03, + "p95_power_w": 100.876, + "avg_graphics_clock_mhz": 1635, + "p95_graphics_clock_mhz": 1635, + "avg_memory_clock_mhz": 3201, + "p95_memory_clock_mhz": 3201, + "avg_usage_pct": 0, + "avg_mem_usage_pct": 0, + "clock_cv_pct": 0, + "power_cv_pct": 0.9397180845746254, + "temp_cv_pct": 3.3707865168539324, + "clock_drift_pct": 0 + }, + "steady": { + "duration_sec": 527.65309417, + "samples": 45, + "avg_temp_c": 63.48888888888889, + "p95_temp_c": 67, + "avg_power_w": 476.53400000000005, + "p95_power_w": 515.906, + "avg_graphics_clock_mhz": 1635, + "p95_graphics_clock_mhz": 1635, + "avg_memory_clock_mhz": 3201, + "p95_memory_clock_mhz": 3201, + "avg_usage_pct": 95.55555555555556, + "avg_mem_usage_pct": 43.48888888888889, + "clock_cv_pct": 0, + "power_cv_pct": 19.191615084599853, + "temp_cv_pct": 7.591104158300821, + "clock_drift_pct": 0 + }, + "precision_steady": [ + { + "precision": "int8", + "status": "FAILED", + "steady": { + "duration_sec": 58.529044441, + "samples": 13, + "avg_temp_c": 57, + "p95_temp_c": 65, + "avg_power_w": 494.6261538461539, + "p95_power_w": 533.464, + "avg_graphics_clock_mhz": 1635, + "p95_graphics_clock_mhz": 1635, + "avg_memory_clock_mhz": 3201, + "p95_memory_clock_mhz": 3201, + "avg_usage_pct": 92.3076923076923, + "avg_mem_usage_pct": 72.92307692307692, + "clock_cv_pct": 0, + "power_cv_pct": 23.348279478191564, + "temp_cv_pct": 15.433074708770722, + "clock_drift_pct": 0 + }, + "ecc": { + "corrected": 0, + "uncorrected": 0 + }, + "notes": "phase produced no output" + }, + { + "precision": "fp8", + "status": "FAILED", + "steady": { + "duration_sec": 115.978129508, + "samples": 10, + "avg_temp_c": 67.3, + "p95_temp_c": 68, + "avg_power_w": 558.755, + "p95_power_w": 566.4755, + "avg_graphics_clock_mhz": 1635, + "p95_graphics_clock_mhz": 1635, + "avg_memory_clock_mhz": 3201, + "p95_memory_clock_mhz": 3201, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 53.5, + "clock_cv_pct": 0, + "power_cv_pct": 2.30306505897872, + "temp_cv_pct": 1.7643896117441185, + "clock_drift_pct": 0 + }, + "ecc": { + "corrected": 0, + "uncorrected": 0 + }, + "notes": "phase produced no output" + }, + { + "precision": "fp16", + "status": "FAILED", + "steady": { + "duration_sec": 179.082805727, + "samples": 11, + "avg_temp_c": 66.72727272727273, + "p95_temp_c": 68, + "avg_power_w": 537.6118181818182, + "p95_power_w": 567.235, + "avg_graphics_clock_mhz": 1635, + "p95_graphics_clock_mhz": 1635, + "avg_memory_clock_mhz": 3201, + "p95_memory_clock_mhz": 3201, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 49.09090909090909, + "clock_cv_pct": 0, + "power_cv_pct": 5.885991260052247, + "temp_cv_pct": 2.1281334266775622, + "clock_drift_pct": 0 + }, + "ecc": { + "corrected": 0, + "uncorrected": 0 + }, + "notes": "phase produced no output" + }, + { + "precision": "fp32", + "status": "FAILED", + "steady": { + "duration_sec": 204.385589702, + "samples": 4, + "avg_temp_c": 65, + "p95_temp_c": 65, + "avg_power_w": 502.59499999999997, + "p95_power_w": 504.221, + "avg_graphics_clock_mhz": 1635, + "p95_graphics_clock_mhz": 1635, + "avg_memory_clock_mhz": 3201, + "p95_memory_clock_mhz": 3201, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 46.25, + "clock_cv_pct": 0, + "power_cv_pct": 0.3359471213122686, + "temp_cv_pct": 0, + "clock_drift_pct": 0 + }, + "ecc": { + "corrected": 0, + "uncorrected": 0 + }, + "notes": "phase produced no output" + } + ], + "precision_failures": [ + "int8:FAILED", + "fp8:FAILED", + "fp16:FAILED", + "fp32:FAILED" + ], + "cooldown": { + "duration_sec": 0, + "samples": 0, + "avg_temp_c": 0, + "p95_temp_c": 0, + "avg_power_w": 0, + "p95_power_w": 0, + "avg_graphics_clock_mhz": 0, + "p95_graphics_clock_mhz": 0, + "avg_memory_clock_mhz": 0, + "p95_memory_clock_mhz": 0, + "avg_usage_pct": 0, + "avg_mem_usage_pct": 0, + "clock_cv_pct": 0, + "power_cv_pct": 0, + "temp_cv_pct": 0, + "clock_drift_pct": 0 + }, + "throttle_counters": { + "sw_power_cap_us": 499938, + "sw_thermal_slowdown_us": 499938, + "sync_boost_us": 0, + "hw_thermal_slowdown_us": 0, + "hw_power_brake_slowdown_us": 0 + }, + "ecc": { + "corrected": 0, + "uncorrected": 0 + }, + "scores": { + "compute_score": 0, + "power_sustain_score": 76.0950378110989, + "thermal_sustain_score": 77.22668752509753, + "stability_score": 99.81050504374038, + "thermal_throttle_pct": 0.09474747812981255, + "power_cap_throttle_pct": 0.09474747812981255, + "temp_headroom_c": 23, + "interconnect_score": 0, + "server_quality_score": 85.9207196183551, + "composite_score": 0 + }, + "notes": [ + "precision plan failed: signal: killed" + ] + }, + { + "index": 3, + "uuid": "GPU-554e6f2c-13e9-fc9e-6aff-3bfe8148e3ac", + "name": "NVIDIA H200 NVL", + "bus_id": "00000000:38:00.0", + "vbios": "96.00.D9.00.0E", + "compute_capability": "9.0", + "status": "UNSUPPORTED", + "power_limit_w": 600, + "default_power_limit_w": 600, + "max_graphics_clock_mhz": 1785, + "max_memory_clock_mhz": 3201, + "locked_graphics_clock_mhz": 1785, + "locked_memory_clock_mhz": 3201, + "baseline": { + "duration_sec": 17.70195119, + "samples": 2, + "avg_temp_c": 43, + "p95_temp_c": 44.8, + "avg_power_w": 97.98, + "p95_power_w": 98.88000000000001, + "avg_graphics_clock_mhz": 1635, + "p95_graphics_clock_mhz": 1635, + "avg_memory_clock_mhz": 3201, + "p95_memory_clock_mhz": 3201, + "avg_usage_pct": 0, + "avg_mem_usage_pct": 0, + "clock_cv_pct": 0, + "power_cv_pct": 1.0206164523372117, + "temp_cv_pct": 4.651162790697675, + "clock_drift_pct": 0 + }, + "steady": { + "duration_sec": 527.65309417, + "samples": 45, + "avg_temp_c": 62.044444444444444, + "p95_temp_c": 66, + "avg_power_w": 469.41733333333315, + "p95_power_w": 506.536, + "avg_graphics_clock_mhz": 1635, + "p95_graphics_clock_mhz": 1635, + "avg_memory_clock_mhz": 3201, + "p95_memory_clock_mhz": 3201, + "avg_usage_pct": 95.55555555555556, + "avg_mem_usage_pct": 43.53333333333333, + "clock_cv_pct": 0, + "power_cv_pct": 18.603656113661604, + "temp_cv_pct": 7.844248396404321, + "clock_drift_pct": 0 + }, + "precision_steady": [ + { + "precision": "int8", + "status": "FAILED", + "steady": { + "duration_sec": 58.529044441, + "samples": 13, + "avg_temp_c": 55.61538461538461, + "p95_temp_c": 63, + "avg_power_w": 480.88615384615383, + "p95_power_w": 518.248, + "avg_graphics_clock_mhz": 1635, + "p95_graphics_clock_mhz": 1635, + "avg_memory_clock_mhz": 3201, + "p95_memory_clock_mhz": 3201, + "avg_usage_pct": 92.3076923076923, + "avg_mem_usage_pct": 71.3076923076923, + "clock_cv_pct": 0, + "power_cv_pct": 23.280253452924775, + "temp_cv_pct": 15.282132577519375, + "clock_drift_pct": 0 + }, + "ecc": { + "corrected": 0, + "uncorrected": 0 + }, + "notes": "phase produced no output" + }, + { + "precision": "fp8", + "status": "FAILED", + "steady": { + "duration_sec": 115.978129508, + "samples": 10, + "avg_temp_c": 65.9, + "p95_temp_c": 67, + "avg_power_w": 547.229, + "p95_power_w": 556.2850000000001, + "avg_graphics_clock_mhz": 1635, + "p95_graphics_clock_mhz": 1635, + "avg_memory_clock_mhz": 3201, + "p95_memory_clock_mhz": 3201, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 52.7, + "clock_cv_pct": 0, + "power_cv_pct": 2.662484706533015, + "temp_cv_pct": 2.394496788779893, + "clock_drift_pct": 0 + }, + "ecc": { + "corrected": 0, + "uncorrected": 0 + }, + "notes": "phase produced no output" + }, + { + "precision": "fp16", + "status": "FAILED", + "steady": { + "duration_sec": 179.082805727, + "samples": 11, + "avg_temp_c": 64.9090909090909, + "p95_temp_c": 67, + "avg_power_w": 531.3863636363636, + "p95_power_w": 555.175, + "avg_graphics_clock_mhz": 1635, + "p95_graphics_clock_mhz": 1635, + "avg_memory_clock_mhz": 3201, + "p95_memory_clock_mhz": 3201, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 70, + "clock_cv_pct": 0, + "power_cv_pct": 4.786766568300306, + "temp_cv_pct": 3.565244274890156, + "clock_drift_pct": 0 + }, + "ecc": { + "corrected": 0, + "uncorrected": 0 + }, + "notes": "phase produced no output" + }, + { + "precision": "fp32", + "status": "FAILED", + "steady": { + "duration_sec": 204.385589702, + "samples": 4, + "avg_temp_c": 62, + "p95_temp_c": 62, + "avg_power_w": 504.3775, + "p95_power_w": 506.0845, + "avg_graphics_clock_mhz": 1635, + "p95_graphics_clock_mhz": 1635, + "avg_memory_clock_mhz": 3201, + "p95_memory_clock_mhz": 3201, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 97.75, + "clock_cv_pct": 0, + "power_cv_pct": 0.27955383595035244, + "temp_cv_pct": 0, + "clock_drift_pct": 0 + }, + "ecc": { + "corrected": 0, + "uncorrected": 0 + }, + "notes": "phase produced no output" + } + ], + "precision_failures": [ + "int8:FAILED", + "fp8:FAILED", + "fp16:FAILED", + "fp32:FAILED" + ], + "cooldown": { + "duration_sec": 0, + "samples": 0, + "avg_temp_c": 0, + "p95_temp_c": 0, + "avg_power_w": 0, + "p95_power_w": 0, + "avg_graphics_clock_mhz": 0, + "p95_graphics_clock_mhz": 0, + "avg_memory_clock_mhz": 0, + "p95_memory_clock_mhz": 0, + "avg_usage_pct": 0, + "avg_mem_usage_pct": 0, + "clock_cv_pct": 0, + "power_cv_pct": 0, + "temp_cv_pct": 0, + "clock_drift_pct": 0 + }, + "throttle_counters": { + "sw_power_cap_us": 599992, + "sw_thermal_slowdown_us": 599992, + "sync_boost_us": 0, + "hw_thermal_slowdown_us": 0, + "hw_power_brake_slowdown_us": 0 + }, + "ecc": { + "corrected": 0, + "uncorrected": 0 + }, + "scores": { + "compute_score": 0, + "power_sustain_score": 76.74320607721866, + "thermal_sustain_score": 76.46725481078704, + "stability_score": 99.77258088443742, + "thermal_throttle_pct": 0.11370955778128987, + "power_cap_throttle_pct": 0.11370955778128987, + "temp_headroom_c": 24, + "interconnect_score": 0, + "server_quality_score": 85.87217062017668, + "composite_score": 0 + }, + "notes": [ + "precision plan failed: signal: killed" + ] + }, + { + "index": 4, + "uuid": "GPU-fcacb1de-4691-5cce-a38e-a193d88d7f77", + "name": "NVIDIA H200 NVL", + "bus_id": "00000000:8F:00.0", + "vbios": "96.00.D9.00.0E", + "compute_capability": "9.0", + "status": "UNSUPPORTED", + "power_limit_w": 600, + "default_power_limit_w": 600, + "max_graphics_clock_mhz": 1785, + "max_memory_clock_mhz": 3201, + "locked_graphics_clock_mhz": 1785, + "locked_memory_clock_mhz": 3201, + "baseline": { + "duration_sec": 17.70195119, + "samples": 2, + "avg_temp_c": 45, + "p95_temp_c": 46.8, + "avg_power_w": 102.435, + "p95_power_w": 103.38449999999999, + "avg_graphics_clock_mhz": 1635, + "p95_graphics_clock_mhz": 1635, + "avg_memory_clock_mhz": 3201, + "p95_memory_clock_mhz": 3201, + "avg_usage_pct": 0, + "avg_mem_usage_pct": 0, + "clock_cv_pct": 0, + "power_cv_pct": 1.0299214135793429, + "temp_cv_pct": 4.444444444444445, + "clock_drift_pct": 0 + }, + "steady": { + "duration_sec": 527.65309417, + "samples": 45, + "avg_temp_c": 67.04444444444445, + "p95_temp_c": 70, + "avg_power_w": 503.0633333333334, + "p95_power_w": 539.196, + "avg_graphics_clock_mhz": 1635, + "p95_graphics_clock_mhz": 1635, + "avg_memory_clock_mhz": 3201, + "p95_memory_clock_mhz": 3201, + "avg_usage_pct": 94.13333333333334, + "avg_mem_usage_pct": 47.06666666666667, + "clock_cv_pct": 0, + "power_cv_pct": 20.99256889123879, + "temp_cv_pct": 7.4938176418875795, + "clock_drift_pct": 0 + }, + "precision_steady": [ + { + "precision": "int8", + "status": "FAILED", + "steady": { + "duration_sec": 58.529044441, + "samples": 13, + "avg_temp_c": 57.69230769230769, + "p95_temp_c": 66, + "avg_power_w": 506.95846153846145, + "p95_power_w": 551.5600000000001, + "avg_graphics_clock_mhz": 1635, + "p95_graphics_clock_mhz": 1635, + "avg_memory_clock_mhz": 3201, + "p95_memory_clock_mhz": 3201, + "avg_usage_pct": 92.3076923076923, + "avg_mem_usage_pct": 72.92307692307692, + "clock_cv_pct": 0, + "power_cv_pct": 23.340903336422265, + "temp_cv_pct": 15.657444093962319, + "clock_drift_pct": 0 + }, + "ecc": { + "corrected": 0, + "uncorrected": 0 + }, + "notes": "phase produced no output" + }, + { + "precision": "fp8", + "status": "FAILED", + "steady": { + "duration_sec": 115.978129508, + "samples": 10, + "avg_temp_c": 68.9, + "p95_temp_c": 70, + "avg_power_w": 581.2620000000001, + "p95_power_w": 590.2625, + "avg_graphics_clock_mhz": 1635, + "p95_graphics_clock_mhz": 1635, + "avg_memory_clock_mhz": 3201, + "p95_memory_clock_mhz": 3201, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 53.6, + "clock_cv_pct": 0, + "power_cv_pct": 2.54415611867442, + "temp_cv_pct": 2.2902371317938313, + "clock_drift_pct": 0 + }, + "ecc": { + "corrected": 0, + "uncorrected": 0 + }, + "notes": "phase produced no output" + }, + { + "precision": "fp16", + "status": "FAILED", + "steady": { + "duration_sec": 179.082805727, + "samples": 11, + "avg_temp_c": 68.72727272727273, + "p95_temp_c": 71, + "avg_power_w": 563.2963636363637, + "p95_power_w": 591.37, + "avg_graphics_clock_mhz": 1635, + "p95_graphics_clock_mhz": 1635, + "avg_memory_clock_mhz": 3201, + "p95_memory_clock_mhz": 3201, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 70.36363636363636, + "clock_cv_pct": 0, + "power_cv_pct": 5.34325196906135, + "temp_cv_pct": 3.4033545847271447, + "clock_drift_pct": 0 + }, + "ecc": { + "corrected": 0, + "uncorrected": 0 + }, + "notes": "phase produced no output" + }, + { + "precision": "fp32", + "status": "FAILED", + "steady": { + "duration_sec": 204.385589702, + "samples": 4, + "avg_temp_c": 65.25, + "p95_temp_c": 65.85, + "avg_power_w": 528.115, + "p95_power_w": 529.024, + "avg_graphics_clock_mhz": 1635, + "p95_graphics_clock_mhz": 1635, + "avg_memory_clock_mhz": 3201, + "p95_memory_clock_mhz": 3201, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 98, + "clock_cv_pct": 0, + "power_cv_pct": 0.17344903498675804, + "temp_cv_pct": 0.6636209990685353, + "clock_drift_pct": 0 + }, + "ecc": { + "corrected": 0, + "uncorrected": 0 + }, + "notes": "phase produced no output" + } + ], + "precision_failures": [ + "int8:FAILED", + "fp8:FAILED", + "fp16:FAILED", + "fp32:FAILED" + ], + "cooldown": { + "duration_sec": 0, + "samples": 0, + "avg_temp_c": 0, + "p95_temp_c": 0, + "avg_power_w": 0, + "p95_power_w": 0, + "avg_graphics_clock_mhz": 0, + "p95_graphics_clock_mhz": 0, + "avg_memory_clock_mhz": 0, + "p95_memory_clock_mhz": 0, + "avg_usage_pct": 0, + "avg_mem_usage_pct": 0, + "clock_cv_pct": 0, + "power_cv_pct": 0, + "temp_cv_pct": 0, + "clock_drift_pct": 0 + }, + "throttle_counters": { + "sw_power_cap_us": 500008, + "sw_thermal_slowdown_us": 500008, + "sync_boost_us": 0, + "hw_thermal_slowdown_us": 0, + "hw_power_brake_slowdown_us": 0 + }, + "ecc": { + "corrected": 0, + "uncorrected": 0 + }, + "scores": { + "compute_score": 0, + "power_sustain_score": 76.4486796556414, + "thermal_sustain_score": 77.51854707433726, + "stability_score": 99.81047851115646, + "thermal_throttle_pct": 0.09476074442177093, + "power_cap_throttle_pct": 0.09476074442177093, + "temp_headroom_c": 20, + "interconnect_score": 0, + "server_quality_score": 86.1143594234562, + "composite_score": 0 + }, + "notes": [ + "precision plan failed: signal: killed" + ] + }, + { + "index": 5, + "uuid": "GPU-ecb4d90e-0ece-a1e7-c0d5-271d304c4699", + "name": "NVIDIA H200 NVL", + "bus_id": "00000000:90:00.0", + "vbios": "96.00.D9.00.0E", + "compute_capability": "9.0", + "status": "UNSUPPORTED", + "power_limit_w": 600, + "default_power_limit_w": 600, + "max_graphics_clock_mhz": 1785, + "max_memory_clock_mhz": 3201, + "locked_graphics_clock_mhz": 1785, + "locked_memory_clock_mhz": 3201, + "baseline": { + "duration_sec": 17.70195119, + "samples": 2, + "avg_temp_c": 43.5, + "p95_temp_c": 44.85, + "avg_power_w": 93.75, + "p95_power_w": 97.611, + "avg_graphics_clock_mhz": 1635, + "p95_graphics_clock_mhz": 1635, + "avg_memory_clock_mhz": 3201, + "p95_memory_clock_mhz": 3201, + "avg_usage_pct": 0, + "avg_mem_usage_pct": 0, + "clock_cv_pct": 0, + "power_cv_pct": 4.576000000000007, + "temp_cv_pct": 3.4482758620689653, + "clock_drift_pct": 0 + }, + "steady": { + "duration_sec": 527.65309417, + "samples": 45, + "avg_temp_c": 64.42222222222222, + "p95_temp_c": 67, + "avg_power_w": 486.561111111111, + "p95_power_w": 518.428, + "avg_graphics_clock_mhz": 1635, + "p95_graphics_clock_mhz": 1635, + "avg_memory_clock_mhz": 3201, + "p95_memory_clock_mhz": 3201, + "avg_usage_pct": 93.91111111111111, + "avg_mem_usage_pct": 47.422222222222224, + "clock_cv_pct": 0, + "power_cv_pct": 20.87603045254485, + "temp_cv_pct": 7.788767452172025, + "clock_drift_pct": 0 + }, + "precision_steady": [ + { + "precision": "int8", + "status": "FAILED", + "steady": { + "duration_sec": 58.529044441, + "samples": 13, + "avg_temp_c": 56.23076923076923, + "p95_temp_c": 64, + "avg_power_w": 493.1276923076922, + "p95_power_w": 532.274, + "avg_graphics_clock_mhz": 1635, + "p95_graphics_clock_mhz": 1635, + "avg_memory_clock_mhz": 3201, + "p95_memory_clock_mhz": 3201, + "avg_usage_pct": 92.3076923076923, + "avg_mem_usage_pct": 72.92307692307692, + "clock_cv_pct": 0, + "power_cv_pct": 23.41905944690355, + "temp_cv_pct": 15.72414013187525, + "clock_drift_pct": 0 + }, + "ecc": { + "corrected": 0, + "uncorrected": 0 + }, + "notes": "phase produced no output" + }, + { + "precision": "fp8", + "status": "FAILED", + "steady": { + "duration_sec": 115.978129508, + "samples": 10, + "avg_temp_c": 66.6, + "p95_temp_c": 68, + "avg_power_w": 559.5139999999999, + "p95_power_w": 567.345, + "avg_graphics_clock_mhz": 1635, + "p95_graphics_clock_mhz": 1635, + "avg_memory_clock_mhz": 3201, + "p95_memory_clock_mhz": 3201, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 53.5, + "clock_cv_pct": 0, + "power_cv_pct": 2.440278136766094, + "temp_cv_pct": 2.1445731016645193, + "clock_drift_pct": 0 + }, + "ecc": { + "corrected": 0, + "uncorrected": 0 + }, + "notes": "phase produced no output" + }, + { + "precision": "fp16", + "status": "FAILED", + "steady": { + "duration_sec": 179.082805727, + "samples": 11, + "avg_temp_c": 66, + "p95_temp_c": 68, + "avg_power_w": 541.8245454545454, + "p95_power_w": 568.165, + "avg_graphics_clock_mhz": 1635, + "p95_graphics_clock_mhz": 1635, + "avg_memory_clock_mhz": 3201, + "p95_memory_clock_mhz": 3201, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 70.36363636363636, + "clock_cv_pct": 0, + "power_cv_pct": 5.253750976085873, + "temp_cv_pct": 3.3570406630727105, + "clock_drift_pct": 0 + }, + "ecc": { + "corrected": 0, + "uncorrected": 0 + }, + "notes": "phase produced no output" + }, + { + "precision": "fp32", + "status": "FAILED", + "steady": { + "duration_sec": 204.385589702, + "samples": 4, + "avg_temp_c": 63, + "p95_temp_c": 63, + "avg_power_w": 510.2925, + "p95_power_w": 512.052, + "avg_graphics_clock_mhz": 1635, + "p95_graphics_clock_mhz": 1635, + "avg_memory_clock_mhz": 3201, + "p95_memory_clock_mhz": 3201, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 97.75, + "clock_cv_pct": 0, + "power_cv_pct": 0.28016761975385435, + "temp_cv_pct": 0, + "clock_drift_pct": 0 + }, + "ecc": { + "corrected": 0, + "uncorrected": 0 + }, + "notes": "phase produced no output" + } + ], + "precision_failures": [ + "int8:FAILED", + "fp8:FAILED", + "fp16:FAILED", + "fp32:FAILED" + ], + "cooldown": { + "duration_sec": 0, + "samples": 0, + "avg_temp_c": 0, + "p95_temp_c": 0, + "avg_power_w": 0, + "p95_power_w": 0, + "avg_graphics_clock_mhz": 0, + "p95_graphics_clock_mhz": 0, + "avg_memory_clock_mhz": 0, + "p95_memory_clock_mhz": 0, + "avg_usage_pct": 0, + "avg_mem_usage_pct": 0, + "clock_cv_pct": 0, + "power_cv_pct": 0, + "temp_cv_pct": 0, + "clock_drift_pct": 0 + }, + "throttle_counters": { + "sw_power_cap_us": 600022, + "sw_thermal_slowdown_us": 600022, + "sync_boost_us": 0, + "hw_thermal_slowdown_us": 0, + "hw_power_brake_slowdown_us": 0 + }, + "ecc": { + "corrected": 0, + "uncorrected": 0 + }, + "scores": { + "compute_score": 0, + "power_sustain_score": 76.45505786536796, + "thermal_sustain_score": 76.63369764348393, + "stability_score": 99.77256951333003, + "thermal_throttle_pct": 0.11371524333498631, + "power_cap_throttle_pct": 0.11371524333498631, + "temp_headroom_c": 23, + "interconnect_score": 0, + "server_quality_score": 85.83565445798757, + "composite_score": 0 + }, + "notes": [ + "precision plan failed: signal: killed" + ] + }, + { + "index": 6, + "uuid": "GPU-3a515237-7b67-0348-2d57-baa3936aca1c", + "name": "NVIDIA H200 NVL", + "bus_id": "00000000:B7:00.0", + "vbios": "96.00.D9.00.0E", + "compute_capability": "9.0", + "status": "UNSUPPORTED", + "power_limit_w": 600, + "default_power_limit_w": 600, + "max_graphics_clock_mhz": 1785, + "max_memory_clock_mhz": 3201, + "locked_graphics_clock_mhz": 1785, + "locked_memory_clock_mhz": 3201, + "baseline": { + "duration_sec": 17.70195119, + "samples": 2, + "avg_temp_c": 43.5, + "p95_temp_c": 44.85, + "avg_power_w": 91.945, + "p95_power_w": 98.1415, + "avg_graphics_clock_mhz": 1635, + "p95_graphics_clock_mhz": 1635, + "avg_memory_clock_mhz": 3201, + "p95_memory_clock_mhz": 3201, + "avg_usage_pct": 0, + "avg_mem_usage_pct": 0, + "clock_cv_pct": 0, + "power_cv_pct": 7.48817227690467, + "temp_cv_pct": 3.4482758620689653, + "clock_drift_pct": 0 + }, + "steady": { + "duration_sec": 527.65309417, + "samples": 45, + "avg_temp_c": 63.888888888888886, + "p95_temp_c": 68, + "avg_power_w": 479.58555555555563, + "p95_power_w": 519.832, + "avg_graphics_clock_mhz": 1635, + "p95_graphics_clock_mhz": 1635, + "avg_memory_clock_mhz": 3201, + "p95_memory_clock_mhz": 3201, + "avg_usage_pct": 95.55555555555556, + "avg_mem_usage_pct": 45.44444444444444, + "clock_cv_pct": 0, + "power_cv_pct": 19.36181817888047, + "temp_cv_pct": 7.612545609822358, + "clock_drift_pct": 0 + }, + "precision_steady": [ + { + "precision": "int8", + "status": "FAILED", + "steady": { + "duration_sec": 58.529044441, + "samples": 13, + "avg_temp_c": 56.76923076923077, + "p95_temp_c": 65, + "avg_power_w": 492, + "p95_power_w": 533.042, + "avg_graphics_clock_mhz": 1635, + "p95_graphics_clock_mhz": 1635, + "avg_memory_clock_mhz": 3201, + "p95_memory_clock_mhz": 3201, + "avg_usage_pct": 92.3076923076923, + "avg_mem_usage_pct": 71.61538461538461, + "clock_cv_pct": 0, + "power_cv_pct": 23.323904491680764, + "temp_cv_pct": 15.953522362540005, + "clock_drift_pct": 0 + }, + "ecc": { + "corrected": 0, + "uncorrected": 0 + }, + "notes": "phase produced no output" + }, + { + "precision": "fp8", + "status": "FAILED", + "steady": { + "duration_sec": 115.978129508, + "samples": 10, + "avg_temp_c": 67.3, + "p95_temp_c": 68.55, + "avg_power_w": 547.4779999999998, + "p95_power_w": 569.2435, + "avg_graphics_clock_mhz": 1635, + "p95_graphics_clock_mhz": 1635, + "avg_memory_clock_mhz": 3201, + "p95_memory_clock_mhz": 3201, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 54.7, + "clock_cv_pct": 0, + "power_cv_pct": 7.537292735081571, + "temp_cv_pct": 1.9990526072917847, + "clock_drift_pct": 0 + }, + "ecc": { + "corrected": 0, + "uncorrected": 0 + }, + "notes": "phase produced no output" + }, + { + "precision": "fp16", + "status": "FAILED", + "steady": { + "duration_sec": 179.082805727, + "samples": 11, + "avg_temp_c": 67.63636363636364, + "p95_temp_c": 69, + "avg_power_w": 543.4218181818181, + "p95_power_w": 569.115, + "avg_graphics_clock_mhz": 1635, + "p95_graphics_clock_mhz": 1635, + "avg_memory_clock_mhz": 3201, + "p95_memory_clock_mhz": 3201, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 48.45454545454545, + "clock_cv_pct": 0, + "power_cv_pct": 5.105532606248768, + "temp_cv_pct": 2.0206043519318424, + "clock_drift_pct": 0 + }, + "ecc": { + "corrected": 0, + "uncorrected": 0 + }, + "notes": "phase produced no output" + }, + { + "precision": "fp32", + "status": "FAILED", + "steady": { + "duration_sec": 204.385589702, + "samples": 4, + "avg_temp_c": 65.5, + "p95_temp_c": 66, + "avg_power_w": 514.1374999999999, + "p95_power_w": 515.1445, + "avg_graphics_clock_mhz": 1635, + "p95_graphics_clock_mhz": 1635, + "avg_memory_clock_mhz": 3201, + "p95_memory_clock_mhz": 3201, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 47, + "clock_cv_pct": 0, + "power_cv_pct": 0.19371300061215918, + "temp_cv_pct": 0.7633587786259541, + "clock_drift_pct": 0 + }, + "ecc": { + "corrected": 0, + "uncorrected": 0 + }, + "notes": "phase produced no output" + } + ], + "precision_failures": [ + "int8:FAILED", + "fp8:FAILED", + "fp16:FAILED", + "fp32:FAILED" + ], + "cooldown": { + "duration_sec": 0, + "samples": 0, + "avg_temp_c": 0, + "p95_temp_c": 0, + "avg_power_w": 0, + "p95_power_w": 0, + "avg_graphics_clock_mhz": 0, + "p95_graphics_clock_mhz": 0, + "avg_memory_clock_mhz": 0, + "p95_memory_clock_mhz": 0, + "avg_usage_pct": 0, + "avg_mem_usage_pct": 0, + "clock_cv_pct": 0, + "power_cv_pct": 0, + "temp_cv_pct": 0, + "clock_drift_pct": 0 + }, + "throttle_counters": { + "sw_power_cap_us": 600038, + "sw_thermal_slowdown_us": 600038, + "sync_boost_us": 0, + "hw_thermal_slowdown_us": 0, + "hw_power_brake_slowdown_us": 0 + }, + "ecc": { + "corrected": 0, + "uncorrected": 0 + }, + "scores": { + "compute_score": 0, + "power_sustain_score": 72.87966787478256, + "thermal_sustain_score": 77.16236317053293, + "stability_score": 99.77256344873942, + "thermal_throttle_pct": 0.11371827563029109, + "power_cap_throttle_pct": 0.11371827563029109, + "temp_headroom_c": 22, + "interconnect_score": 0, + "server_quality_score": 84.92163469309041, + "composite_score": 0 + }, + "notes": [ + "precision plan failed: signal: killed" + ] + }, + { + "index": 7, + "uuid": "GPU-5ebe5195-b37b-2a61-3563-b50fd3b3b736", + "name": "NVIDIA H200 NVL", + "bus_id": "00000000:B8:00.0", + "vbios": "96.00.D9.00.0E", + "compute_capability": "9.0", + "status": "UNSUPPORTED", + "power_limit_w": 600, + "default_power_limit_w": 600, + "max_graphics_clock_mhz": 1785, + "max_memory_clock_mhz": 3201, + "locked_graphics_clock_mhz": 1785, + "locked_memory_clock_mhz": 3201, + "baseline": { + "duration_sec": 17.70195119, + "samples": 2, + "avg_temp_c": 42.5, + "p95_temp_c": 43.85, + "avg_power_w": 88.02, + "p95_power_w": 97.371, + "avg_graphics_clock_mhz": 1635, + "p95_graphics_clock_mhz": 1635, + "avg_memory_clock_mhz": 3201, + "p95_memory_clock_mhz": 3201, + "avg_usage_pct": 0, + "avg_mem_usage_pct": 0, + "clock_cv_pct": 0, + "power_cv_pct": 11.804135423767327, + "temp_cv_pct": 3.5294117647058822, + "clock_drift_pct": 0 + }, + "steady": { + "duration_sec": 527.65309417, + "samples": 45, + "avg_temp_c": 64.31111111111112, + "p95_temp_c": 67, + "avg_power_w": 483.15111111111116, + "p95_power_w": 513.216, + "avg_graphics_clock_mhz": 1635, + "p95_graphics_clock_mhz": 1635, + "avg_memory_clock_mhz": 3201, + "p95_memory_clock_mhz": 3201, + "avg_usage_pct": 94.04444444444445, + "avg_mem_usage_pct": 47.17777777777778, + "clock_cv_pct": 0, + "power_cv_pct": 20.70718453101131, + "temp_cv_pct": 7.9545354916488, + "clock_drift_pct": 0 + }, + "precision_steady": [ + { + "precision": "int8", + "status": "FAILED", + "steady": { + "duration_sec": 58.529044441, + "samples": 13, + "avg_temp_c": 55.92307692307692, + "p95_temp_c": 64, + "avg_power_w": 492.15923076923076, + "p95_power_w": 530.96, + "avg_graphics_clock_mhz": 1635, + "p95_graphics_clock_mhz": 1635, + "avg_memory_clock_mhz": 3201, + "p95_memory_clock_mhz": 3201, + "avg_usage_pct": 92.3076923076923, + "avg_mem_usage_pct": 72.92307692307692, + "clock_cv_pct": 0, + "power_cv_pct": 23.35025789536203, + "temp_cv_pct": 15.923934991725334, + "clock_drift_pct": 0 + }, + "ecc": { + "corrected": 0, + "uncorrected": 0 + }, + "notes": "phase produced no output" + }, + { + "precision": "fp8", + "status": "FAILED", + "steady": { + "duration_sec": 115.978129508, + "samples": 10, + "avg_temp_c": 66.3, + "p95_temp_c": 67.55, + "avg_power_w": 557.518, + "p95_power_w": 565.1195, + "avg_graphics_clock_mhz": 1635, + "p95_graphics_clock_mhz": 1635, + "avg_memory_clock_mhz": 3201, + "p95_memory_clock_mhz": 3201, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 53.4, + "clock_cv_pct": 0, + "power_cv_pct": 2.3506960550068565, + "temp_cv_pct": 2.02920423032786, + "clock_drift_pct": 0 + }, + "ecc": { + "corrected": 0, + "uncorrected": 0 + }, + "notes": "phase produced no output" + }, + { + "precision": "fp16", + "status": "FAILED", + "steady": { + "duration_sec": 179.082805727, + "samples": 11, + "avg_temp_c": 65.9090909090909, + "p95_temp_c": 68, + "avg_power_w": 540.4381818181818, + "p95_power_w": 565.825, + "avg_graphics_clock_mhz": 1635, + "p95_graphics_clock_mhz": 1635, + "avg_memory_clock_mhz": 3201, + "p95_memory_clock_mhz": 3201, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 70.18181818181819, + "clock_cv_pct": 0, + "power_cv_pct": 5.09693172900808, + "temp_cv_pct": 3.51115091347803, + "clock_drift_pct": 0 + }, + "ecc": { + "corrected": 0, + "uncorrected": 0 + }, + "notes": "phase produced no output" + }, + { + "precision": "fp32", + "status": "FAILED", + "steady": { + "duration_sec": 204.385589702, + "samples": 4, + "avg_temp_c": 63, + "p95_temp_c": 63, + "avg_power_w": 509.42, + "p95_power_w": 511.6965, + "avg_graphics_clock_mhz": 1635, + "p95_graphics_clock_mhz": 1635, + "avg_memory_clock_mhz": 3201, + "p95_memory_clock_mhz": 3201, + "avg_usage_pct": 100, + "avg_mem_usage_pct": 97.25, + "clock_cv_pct": 0, + "power_cv_pct": 0.3365042478140501, + "temp_cv_pct": 0, + "clock_drift_pct": 0 + }, + "ecc": { + "corrected": 0, + "uncorrected": 0 + }, + "notes": "phase produced no output" + } + ], + "precision_failures": [ + "int8:FAILED", + "fp8:FAILED", + "fp16:FAILED", + "fp32:FAILED" + ], + "cooldown": { + "duration_sec": 0, + "samples": 0, + "avg_temp_c": 0, + "p95_temp_c": 0, + "avg_power_w": 0, + "p95_power_w": 0, + "avg_graphics_clock_mhz": 0, + "p95_graphics_clock_mhz": 0, + "avg_memory_clock_mhz": 0, + "p95_memory_clock_mhz": 0, + "avg_usage_pct": 0, + "avg_mem_usage_pct": 0, + "clock_cv_pct": 0, + "power_cv_pct": 0, + "temp_cv_pct": 0, + "clock_drift_pct": 0 + }, + "throttle_counters": { + "sw_power_cap_us": 499987, + "sw_thermal_slowdown_us": 499987, + "sync_boost_us": 0, + "hw_thermal_slowdown_us": 0, + "hw_power_brake_slowdown_us": 0 + }, + "ecc": { + "corrected": 0, + "uncorrected": 0 + }, + "scores": { + "compute_score": 0, + "power_sustain_score": 76.64920755460673, + "thermal_sustain_score": 76.13639352505359, + "stability_score": 99.81048647093164, + "thermal_throttle_pct": 0.09475676453418341, + "power_cap_throttle_pct": 0.09475676453418341, + "temp_headroom_c": 23, + "interconnect_score": 0, + "server_quality_score": 85.75987491227076, + "composite_score": 0 + }, + "notes": [ + "precision plan failed: signal: killed" + ] + } + ], + "interconnect": { + "status": "UNSUPPORTED", + "attempted": true, + "supported": false, + "selected_gpu_indices": [ + 0, + 1, + 2, + 3, + 4, + 5, + 6, + 7 + ], + "notes": [ + "" + ] + }, + "server_power": { + "available": false, + "notes": [ + "IPMI power reading unavailable; server-side power characterization skipped" + ] + } +} \ No newline at end of file diff --git a/power/power-20260414-202612/result.json b/power/power-20260414-202612/result.json new file mode 100644 index 0000000..87d349f --- /dev/null +++ b/power/power-20260414-202612/result.json @@ -0,0 +1,42 @@ +{ + "benchmark_version": "2", + "generated_at": "2026-04-14T20:26:13.061692275Z", + "hostname": "debian", + "server_model": "G5500 V7", + "benchmark_profile": "standard", + "selected_gpu_indices": [ + 0 + ], + "recommended_slot_order": [ + 0 + ], + "ramp_steps": [ + { + "step_index": 1, + "gpu_indices": [ + 0 + ], + "total_observed_power_w": 600.33, + "avg_observed_power_w": 600.33, + "min_power_realization_pct": 100.01682691106228, + "avg_power_realization_pct": 100.01682691106228, + "status": "OK" + } + ], + "overall_status": "OK", + "findings": [ + "Recommended slot order for installation based on single-card targeted_power: 0." + ], + "gpus": [ + { + "index": 0, + "name": "NVIDIA RTX PRO 6000 Blackwell Server Edition", + "bus_id": "00000000:4B:00.0", + "applied_power_limit_w": 600, + "max_observed_power_w": 600.229, + "max_observed_temp_c": 78, + "calibration_attempts": 1, + "status": "OK" + } + ] +} \ No newline at end of file diff --git a/power/power-20260414-203047/result.json b/power/power-20260414-203047/result.json new file mode 100644 index 0000000..92916cd --- /dev/null +++ b/power/power-20260414-203047/result.json @@ -0,0 +1,74 @@ +{ + "benchmark_version": "2", + "generated_at": "2026-04-14T20:30:47.900594506Z", + "hostname": "debian", + "server_model": "G5500 V7", + "benchmark_profile": "standard", + "selected_gpu_indices": [ + 0, + 1 + ], + "recommended_slot_order": [ + 0, + 1 + ], + "ramp_steps": [ + { + "step_index": 1, + "gpu_indices": [ + 0 + ], + "total_observed_power_w": 600.315, + "avg_observed_power_w": 600.315, + "min_power_realization_pct": 100.00891278217911, + "avg_power_realization_pct": 100.00891278217911, + "status": "OK" + }, + { + "step_index": 2, + "gpu_indices": [ + 0, + 1 + ], + "total_observed_power_w": 1200.545, + "avg_observed_power_w": 600.2725, + "min_power_realization_pct": 99.99975010891087, + "avg_power_realization_pct": 100.0086224302427, + "status": "OK" + } + ], + "overall_status": "OK", + "findings": [ + "Recommended slot order for installation based on single-card targeted_power: 0,1." + ], + "gpus": [ + { + "index": 0, + "name": "NVIDIA RTX PRO 6000 Blackwell Server Edition", + "bus_id": "00000000:4B:00.0", + "applied_power_limit_w": 600, + "max_observed_power_w": 600.2615, + "max_observed_temp_c": 80, + "calibration_attempts": 1, + "status": "OK", + "occupied_slots": [ + 1 + ], + "occupied_slots_note": "Slot recommendation was measured while slots 1 were populated; airflow in a different chassis fill pattern may differ." + }, + { + "index": 1, + "name": "NVIDIA RTX PRO 6000 Blackwell Server Edition", + "bus_id": "00000000:4C:00.0", + "applied_power_limit_w": 600, + "max_observed_power_w": 600.18, + "max_observed_temp_c": 80, + "calibration_attempts": 1, + "status": "OK", + "occupied_slots": [ + 0 + ], + "occupied_slots_note": "Slot recommendation was measured while slots 0 were populated; airflow in a different chassis fill pattern may differ." + } + ] +} \ No newline at end of file diff --git a/power/power-20260414-203715/result.json b/power/power-20260414-203715/result.json new file mode 100644 index 0000000..35f8348 --- /dev/null +++ b/power/power-20260414-203715/result.json @@ -0,0 +1,106 @@ +{ + "benchmark_version": "2", + "generated_at": "2026-04-14T20:37:15.331157966Z", + "hostname": "debian", + "server_model": "G5500 V7", + "benchmark_profile": "standard", + "selected_gpu_indices": [ + 0, + 1, + 2 + ], + "recommended_slot_order": [ + 2, + 1, + 0 + ], + "ramp_steps": [ + { + "step_index": 1, + "gpu_indices": [ + 2 + ], + "total_observed_power_w": 600.34, + "avg_observed_power_w": 600.34, + "min_power_realization_pct": 100.00399789444225, + "avg_power_realization_pct": 100.00399789444225, + "status": "OK" + }, + { + "step_index": 2, + "gpu_indices": [ + 2, + 1 + ], + "total_observed_power_w": 1200.4384999999997, + "avg_observed_power_w": 600.2192499999999, + "min_power_realization_pct": 99.98342402916037, + "avg_power_realization_pct": 99.98800563327433, + "status": "OK" + }, + { + "step_index": 3, + "gpu_indices": [ + 2, + 1, + 0 + ], + "total_observed_power_w": 1800.6169999999997, + "avg_observed_power_w": 600.2056666666666, + "min_power_realization_pct": 99.97567947547624, + "avg_power_realization_pct": 99.98731186778974, + "status": "OK" + } + ], + "overall_status": "OK", + "findings": [ + "Recommended slot order for installation based on single-card targeted_power: 2,1,0." + ], + "gpus": [ + { + "index": 2, + "name": "NVIDIA RTX PRO 6000 Blackwell Server Edition", + "bus_id": "00000000:4E:00.0", + "applied_power_limit_w": 600, + "max_observed_power_w": 600.316, + "max_observed_temp_c": 78, + "calibration_attempts": 1, + "status": "OK", + "occupied_slots": [ + 0, + 1 + ], + "occupied_slots_note": "Slot recommendation was measured while slots 0,1 were populated; airflow in a different chassis fill pattern may differ." + }, + { + "index": 1, + "name": "NVIDIA RTX PRO 6000 Blackwell Server Edition", + "bus_id": "00000000:4C:00.0", + "applied_power_limit_w": 600, + "max_observed_power_w": 600.2665, + "max_observed_temp_c": 80, + "calibration_attempts": 1, + "status": "OK", + "occupied_slots": [ + 0, + 2 + ], + "occupied_slots_note": "Slot recommendation was measured while slots 0,2 were populated; airflow in a different chassis fill pattern may differ." + }, + { + "index": 0, + "name": "NVIDIA RTX PRO 6000 Blackwell Server Edition", + "bus_id": "00000000:4B:00.0", + "applied_power_limit_w": 600, + "max_observed_power_w": 600.263, + "max_observed_temp_c": 79, + "calibration_attempts": 1, + "status": "OK", + "occupied_slots": [ + 1, + 2 + ], + "occupied_slots_note": "Slot recommendation was measured while slots 1,2 were populated; airflow in a different chassis fill pattern may differ." + } + ] +} \ No newline at end of file diff --git a/power/power-20260414-204624/result.json b/power/power-20260414-204624/result.json new file mode 100644 index 0000000..049365a --- /dev/null +++ b/power/power-20260414-204624/result.json @@ -0,0 +1,141 @@ +{ + "benchmark_version": "2", + "generated_at": "2026-04-14T20:46:24.371826136Z", + "hostname": "debian", + "server_model": "G5500 V7", + "benchmark_profile": "standard", + "selected_gpu_indices": [ + 0, + 1, + 2, + 3 + ], + "recommended_slot_order": [ + 2, + 0, + 1, + 3 + ], + "ramp_steps": [ + { + "step_index": 1, + "gpu_indices": [ + 2 + ], + "total_observed_power_w": 600.234, + "avg_observed_power_w": 600.234, + "min_power_realization_pct": 100.00066641120904, + "avg_power_realization_pct": 100.00066641120904, + "status": "OK" + }, + { + "step_index": 2, + "gpu_indices": [ + 2, + 0 + ], + "total_observed_power_w": 1200.6415, + "avg_observed_power_w": 600.32075, + "min_power_realization_pct": 100.01924430689255, + "avg_power_realization_pct": 100.01949336948013, + "status": "OK" + }, + { + "step_index": 3, + "gpu_indices": [ + 2, + 0, + 1 + ], + "total_observed_power_w": 1800.88, + "avg_observed_power_w": 600.2933333333334, + "min_power_realization_pct": 100.01249645933652, + "avg_power_realization_pct": 100.01679993305292, + "status": "OK" + }, + { + "step_index": 4, + "gpu_indices": [ + 2, + 0, + 1, + 3 + ], + "total_observed_power_w": 2400.9950000000003, + "avg_observed_power_w": 600.2487500000001, + "min_power_realization_pct": 99.9960848341469, + "avg_power_realization_pct": 100.01093465827952, + "status": "OK" + } + ], + "overall_status": "OK", + "findings": [ + "Recommended slot order for installation based on single-card targeted_power: 2,0,1,3." + ], + "gpus": [ + { + "index": 2, + "name": "NVIDIA RTX PRO 6000 Blackwell Server Edition", + "bus_id": "00000000:4E:00.0", + "applied_power_limit_w": 600, + "max_observed_power_w": 600.23, + "max_observed_temp_c": 81, + "calibration_attempts": 1, + "status": "OK", + "occupied_slots": [ + 0, + 1, + 3 + ], + "occupied_slots_note": "Slot recommendation was measured while slots 0,1,3 were populated; airflow in a different chassis fill pattern may differ." + }, + { + "index": 0, + "name": "NVIDIA RTX PRO 6000 Blackwell Server Edition", + "bus_id": "00000000:4B:00.0", + "applied_power_limit_w": 600, + "max_observed_power_w": 600.1775, + "max_observed_temp_c": 80, + "calibration_attempts": 1, + "status": "OK", + "occupied_slots": [ + 1, + 2, + 3 + ], + "occupied_slots_note": "Slot recommendation was measured while slots 1,2,3 were populated; airflow in a different chassis fill pattern may differ." + }, + { + "index": 1, + "name": "NVIDIA RTX PRO 6000 Blackwell Server Edition", + "bus_id": "00000000:4C:00.0", + "applied_power_limit_w": 600, + "max_observed_power_w": 600.17, + "max_observed_temp_c": 81, + "calibration_attempts": 1, + "status": "OK", + "occupied_slots": [ + 0, + 2, + 3 + ], + "occupied_slots_note": "Slot recommendation was measured while slots 0,2,3 were populated; airflow in a different chassis fill pattern may differ." + }, + { + "index": 3, + "name": "NVIDIA RTX PRO 6000 Blackwell Server Edition", + "bus_id": "00000000:4F:00.0", + "applied_power_limit_w": 600, + "max_observed_power_w": 600.155, + "max_observed_temp_c": 80, + "calibration_attempts": 1, + "status": "OK", + "occupied_slots": [ + 0, + 1, + 2 + ], + "occupied_slots_note": "Slot recommendation was measured while slots 0,1,2 were populated; airflow in a different chassis fill pattern may differ." + } + ] +} \ No newline at end of file diff --git a/power/power-20260416-044811/result.json b/power/power-20260416-044811/result.json new file mode 100644 index 0000000..5312db3 --- /dev/null +++ b/power/power-20260416-044811/result.json @@ -0,0 +1,240 @@ +{ + "benchmark_version": "2", + "generated_at": "2026-04-16T04:48:11.362162338Z", + "hostname": "debian", + "server_model": "G5500 V7", + "benchmark_profile": "standard", + "selected_gpu_indices": [ + 0, + 1, + 2, + 3, + 4, + 5, + 6, + 7 + ], + "recommended_slot_order": [ + 0, + 4, + 1, + 2, + 6, + 5, + 7, + 3 + ], + "ramp_steps": [ + { + "step_index": 1, + "gpu_indices": [ + 0 + ], + "new_gpu_index": 0, + "new_gpu_stable_limit_w": 600, + "total_observed_power_w": 600.34, + "avg_observed_power_w": 600.34, + "status": "OK" + }, + { + "step_index": 2, + "gpu_indices": [ + 0, + 4 + ], + "new_gpu_index": 4, + "new_gpu_stable_limit_w": 600, + "total_observed_power_w": 600.2125, + "avg_observed_power_w": 300.10625, + "status": "OK" + }, + { + "step_index": 3, + "gpu_indices": [ + 0, + 4, + 1 + ], + "new_gpu_index": 1, + "new_gpu_stable_limit_w": 600, + "total_observed_power_w": 600.3019999999999, + "avg_observed_power_w": 200.10066666666663, + "status": "OK" + }, + { + "step_index": 4, + "gpu_indices": [ + 0, + 4, + 1, + 2 + ], + "new_gpu_index": 2, + "new_gpu_stable_limit_w": 600, + "total_observed_power_w": 600.24, + "avg_observed_power_w": 150.06, + "status": "OK" + }, + { + "step_index": 5, + "gpu_indices": [ + 0, + 4, + 1, + 2, + 6 + ], + "new_gpu_index": 6, + "new_gpu_stable_limit_w": 600, + "total_observed_power_w": 600.23, + "avg_observed_power_w": 120.046, + "status": "OK" + }, + { + "step_index": 6, + "gpu_indices": [ + 0, + 4, + 1, + 2, + 6, + 5 + ], + "new_gpu_index": 5, + "new_gpu_stable_limit_w": 600, + "total_observed_power_w": 600.25, + "avg_observed_power_w": 100.04166666666667, + "status": "OK" + }, + { + "step_index": 7, + "gpu_indices": [ + 0, + 4, + 1, + 2, + 6, + 5, + 7 + ], + "new_gpu_index": 7, + "new_gpu_stable_limit_w": 600, + "total_observed_power_w": 600.206, + "avg_observed_power_w": 85.74371428571429, + "status": "OK" + }, + { + "step_index": 8, + "gpu_indices": [ + 0, + 4, + 1, + 2, + 6, + 5, + 7, + 3 + ], + "new_gpu_index": 3, + "new_gpu_stable_limit_w": 600, + "total_observed_power_w": 600.131, + "avg_observed_power_w": 75.016375, + "status": "OK" + } + ], + "overall_status": "OK", + "platform_max_tdp_w": 4800, + "findings": [ + "Recommended slot order for installation based on single-card targeted_power: 0,4,1,2,6,5,7,3." + ], + "gpus": [ + { + "index": 0, + "name": "NVIDIA RTX PRO 6000 Blackwell Server Edition", + "bus_id": "00000000:4B:00.0", + "applied_power_limit_w": 600, + "stable_power_limit_w": 600, + "max_observed_power_w": 600.34, + "max_observed_temp_c": 77, + "calibration_attempts": 1, + "status": "OK" + }, + { + "index": 4, + "name": "NVIDIA RTX PRO 6000 Blackwell Server Edition", + "bus_id": "00000000:CB:00.0", + "applied_power_limit_w": 600, + "stable_power_limit_w": 600, + "max_observed_power_w": 600.3290000000001, + "max_observed_temp_c": 76, + "calibration_attempts": 1, + "status": "OK" + }, + { + "index": 1, + "name": "NVIDIA RTX PRO 6000 Blackwell Server Edition", + "bus_id": "00000000:4C:00.0", + "applied_power_limit_w": 600, + "stable_power_limit_w": 600, + "max_observed_power_w": 600.3225, + "max_observed_temp_c": 78, + "calibration_attempts": 1, + "status": "OK" + }, + { + "index": 2, + "name": "NVIDIA RTX PRO 6000 Blackwell Server Edition", + "bus_id": "00000000:4E:00.0", + "applied_power_limit_w": 600, + "stable_power_limit_w": 600, + "max_observed_power_w": 600.307, + "max_observed_temp_c": 77, + "calibration_attempts": 1, + "status": "OK" + }, + { + "index": 6, + "name": "NVIDIA RTX PRO 6000 Blackwell Server Edition", + "bus_id": "00000000:CE:00.0", + "applied_power_limit_w": 600, + "stable_power_limit_w": 600, + "max_observed_power_w": 600.3009999999999, + "max_observed_temp_c": 75, + "calibration_attempts": 1, + "status": "OK" + }, + { + "index": 5, + "name": "NVIDIA RTX PRO 6000 Blackwell Server Edition", + "bus_id": "00000000:CC:00.0", + "applied_power_limit_w": 600, + "stable_power_limit_w": 600, + "max_observed_power_w": 600.244, + "max_observed_temp_c": 76, + "calibration_attempts": 1, + "status": "OK" + }, + { + "index": 7, + "name": "NVIDIA RTX PRO 6000 Blackwell Server Edition", + "bus_id": "00000000:CF:00.0", + "applied_power_limit_w": 600, + "stable_power_limit_w": 600, + "max_observed_power_w": 600.231, + "max_observed_temp_c": 76, + "calibration_attempts": 1, + "status": "OK" + }, + { + "index": 3, + "name": "NVIDIA RTX PRO 6000 Blackwell Server Edition", + "bus_id": "00000000:4F:00.0", + "applied_power_limit_w": 600, + "stable_power_limit_w": 600, + "max_observed_power_w": 600.206, + "max_observed_temp_c": 78, + "calibration_attempts": 1, + "status": "OK" + } + ] +} \ No newline at end of file diff --git a/power/power-20260416-053129/result.json b/power/power-20260416-053129/result.json new file mode 100644 index 0000000..7fe627e --- /dev/null +++ b/power/power-20260416-053129/result.json @@ -0,0 +1,240 @@ +{ + "benchmark_version": "2", + "generated_at": "2026-04-16T05:31:29.452895631Z", + "hostname": "debian", + "server_model": "G5500 V7", + "benchmark_profile": "stability", + "selected_gpu_indices": [ + 0, + 1, + 2, + 3, + 4, + 5, + 6, + 7 + ], + "recommended_slot_order": [ + 4, + 0, + 1, + 5, + 6, + 3, + 7, + 2 + ], + "ramp_steps": [ + { + "step_index": 1, + "gpu_indices": [ + 4 + ], + "new_gpu_index": 4, + "new_gpu_stable_limit_w": 600, + "total_observed_power_w": 600.42, + "avg_observed_power_w": 600.42, + "status": "OK" + }, + { + "step_index": 2, + "gpu_indices": [ + 4, + 0 + ], + "new_gpu_index": 0, + "new_gpu_stable_limit_w": 600, + "total_observed_power_w": 600.274, + "avg_observed_power_w": 300.137, + "status": "OK" + }, + { + "step_index": 3, + "gpu_indices": [ + 4, + 0, + 1 + ], + "new_gpu_index": 1, + "new_gpu_stable_limit_w": 600, + "total_observed_power_w": 600.17, + "avg_observed_power_w": 200.05666666666664, + "status": "OK" + }, + { + "step_index": 4, + "gpu_indices": [ + 4, + 0, + 1, + 5 + ], + "new_gpu_index": 5, + "new_gpu_stable_limit_w": 600, + "total_observed_power_w": 600.373, + "avg_observed_power_w": 150.09325, + "status": "OK" + }, + { + "step_index": 5, + "gpu_indices": [ + 4, + 0, + 1, + 5, + 6 + ], + "new_gpu_index": 6, + "new_gpu_stable_limit_w": 600, + "total_observed_power_w": 600.179, + "avg_observed_power_w": 120.0358, + "status": "OK" + }, + { + "step_index": 6, + "gpu_indices": [ + 4, + 0, + 1, + 5, + 6, + 3 + ], + "new_gpu_index": 3, + "new_gpu_stable_limit_w": 600, + "total_observed_power_w": 600.3275000000001, + "avg_observed_power_w": 100.05458333333335, + "status": "OK" + }, + { + "step_index": 7, + "gpu_indices": [ + 4, + 0, + 1, + 5, + 6, + 3, + 7 + ], + "new_gpu_index": 7, + "new_gpu_stable_limit_w": 600, + "total_observed_power_w": 600.222, + "avg_observed_power_w": 85.746, + "status": "OK" + }, + { + "step_index": 8, + "gpu_indices": [ + 4, + 0, + 1, + 5, + 6, + 3, + 7, + 2 + ], + "new_gpu_index": 2, + "new_gpu_stable_limit_w": 600, + "total_observed_power_w": 600.18, + "avg_observed_power_w": 75.0225, + "status": "OK" + } + ], + "overall_status": "OK", + "platform_max_tdp_w": 4800, + "findings": [ + "Recommended slot order for installation based on single-card targeted_power: 4,0,1,5,6,3,7,2." + ], + "gpus": [ + { + "index": 4, + "name": "NVIDIA RTX PRO 6000 Blackwell Server Edition", + "bus_id": "00000000:CB:00.0", + "applied_power_limit_w": 600, + "stable_power_limit_w": 600, + "max_observed_power_w": 600.42, + "max_observed_temp_c": 74, + "calibration_attempts": 1, + "status": "OK" + }, + { + "index": 0, + "name": "NVIDIA RTX PRO 6000 Blackwell Server Edition", + "bus_id": "00000000:4B:00.0", + "applied_power_limit_w": 600, + "stable_power_limit_w": 600, + "max_observed_power_w": 600.362, + "max_observed_temp_c": 79, + "calibration_attempts": 1, + "status": "OK" + }, + { + "index": 1, + "name": "NVIDIA RTX PRO 6000 Blackwell Server Edition", + "bus_id": "00000000:4C:00.0", + "applied_power_limit_w": 600, + "stable_power_limit_w": 600, + "max_observed_power_w": 600.3580000000001, + "max_observed_temp_c": 79.19999999999999, + "calibration_attempts": 1, + "status": "OK" + }, + { + "index": 5, + "name": "NVIDIA RTX PRO 6000 Blackwell Server Edition", + "bus_id": "00000000:CC:00.0", + "applied_power_limit_w": 600, + "stable_power_limit_w": 600, + "max_observed_power_w": 600.354, + "max_observed_temp_c": 77, + "calibration_attempts": 1, + "status": "OK" + }, + { + "index": 6, + "name": "NVIDIA RTX PRO 6000 Blackwell Server Edition", + "bus_id": "00000000:CE:00.0", + "applied_power_limit_w": 600, + "stable_power_limit_w": 600, + "max_observed_power_w": 600.3425, + "max_observed_temp_c": 76, + "calibration_attempts": 1, + "status": "OK" + }, + { + "index": 3, + "name": "NVIDIA RTX PRO 6000 Blackwell Server Edition", + "bus_id": "00000000:4F:00.0", + "applied_power_limit_w": 600, + "stable_power_limit_w": 600, + "max_observed_power_w": 600.34, + "max_observed_temp_c": 79, + "calibration_attempts": 1, + "status": "OK" + }, + { + "index": 7, + "name": "NVIDIA RTX PRO 6000 Blackwell Server Edition", + "bus_id": "00000000:CF:00.0", + "applied_power_limit_w": 600, + "stable_power_limit_w": 600, + "max_observed_power_w": 600.31, + "max_observed_temp_c": 77, + "calibration_attempts": 1, + "status": "OK" + }, + { + "index": 2, + "name": "NVIDIA RTX PRO 6000 Blackwell Server Edition", + "bus_id": "00000000:4E:00.0", + "applied_power_limit_w": 600, + "stable_power_limit_w": 600, + "max_observed_power_w": 600.2864999999999, + "max_observed_temp_c": 78, + "calibration_attempts": 1, + "status": "OK" + } + ] +} \ No newline at end of file diff --git a/power/power-20260416-223651/result.json b/power/power-20260416-223651/result.json new file mode 100644 index 0000000..de6e55f --- /dev/null +++ b/power/power-20260416-223651/result.json @@ -0,0 +1,248 @@ +{ + "benchmark_version": "2", + "generated_at": "2026-04-16T22:36:52.086533445Z", + "hostname": "debian", + "server_model": "G5500 V7", + "benchmark_profile": "stability", + "selected_gpu_indices": [ + 0, + 1, + 2, + 3, + 4, + 5, + 6, + 7 + ], + "recommended_slot_order": [ + 5, + 3, + 7, + 4, + 2, + 0, + 1, + 6 + ], + "ramp_steps": [ + { + "step_index": 1, + "gpu_indices": [ + 5 + ], + "new_gpu_index": 5, + "new_gpu_stable_limit_w": 600, + "total_observed_power_w": 600.36, + "avg_observed_power_w": 600.36, + "status": "OK" + }, + { + "step_index": 2, + "gpu_indices": [ + 5, + 3 + ], + "new_gpu_index": 3, + "new_gpu_stable_limit_w": 600, + "total_observed_power_w": 1200.4969999999998, + "avg_observed_power_w": 600.2484999999999, + "status": "OK" + }, + { + "step_index": 3, + "gpu_indices": [ + 5, + 3, + 7 + ], + "new_gpu_index": 7, + "new_gpu_stable_limit_w": 600, + "total_observed_power_w": 1800.744, + "avg_observed_power_w": 600.2479999999999, + "status": "OK" + }, + { + "step_index": 4, + "gpu_indices": [ + 5, + 3, + 7, + 4 + ], + "new_gpu_index": 4, + "new_gpu_stable_limit_w": 600, + "total_observed_power_w": 2401.026, + "avg_observed_power_w": 600.2565, + "status": "OK" + }, + { + "step_index": 5, + "gpu_indices": [ + 5, + 3, + 7, + 4, + 2 + ], + "new_gpu_index": 2, + "new_gpu_stable_limit_w": 600, + "total_observed_power_w": 3001.1769999999997, + "avg_observed_power_w": 600.2353999999999, + "status": "OK" + }, + { + "step_index": 6, + "gpu_indices": [ + 5, + 3, + 7, + 4, + 2, + 0 + ], + "new_gpu_index": 0, + "new_gpu_stable_limit_w": 600, + "total_observed_power_w": 3601.5295, + "avg_observed_power_w": 600.2549166666666, + "status": "OK" + }, + { + "step_index": 7, + "gpu_indices": [ + 5, + 3, + 7, + 4, + 2, + 0, + 1 + ], + "new_gpu_index": 1, + "new_gpu_stable_limit_w": 600, + "total_observed_power_w": 4201.840000000001, + "avg_observed_power_w": 600.2628571428573, + "status": "OK" + }, + { + "step_index": 8, + "gpu_indices": [ + 5, + 3, + 7, + 4, + 2, + 0, + 1, + 6 + ], + "new_gpu_index": 6, + "new_gpu_stable_limit_w": 600, + "total_observed_power_w": 4801.788, + "avg_observed_power_w": 600.2235, + "status": "OK" + } + ], + "overall_status": "OK", + "platform_max_tdp_w": 4800, + "server_power": { + "available": true, + "idle_w": 892, + "loaded_w": 4314.026785714285, + "delta_w": 3422.0267857142853, + "gpu_reported_sum_w": 4800, + "reporting_ratio": 0.7129222470238095 + }, + "findings": [ + "Recommended slot order for installation based on single-card targeted_power: 5,3,7,4,2,0,1,6." + ], + "gpus": [ + { + "index": 5, + "name": "NVIDIA RTX PRO 6000 Blackwell Server Edition", + "bus_id": "00000000:CC:00.0", + "applied_power_limit_w": 600, + "stable_power_limit_w": 600, + "max_observed_power_w": 600.36, + "max_observed_temp_c": 79, + "calibration_attempts": 1, + "status": "OK" + }, + { + "index": 3, + "name": "NVIDIA RTX PRO 6000 Blackwell Server Edition", + "bus_id": "00000000:4F:00.0", + "applied_power_limit_w": 600, + "stable_power_limit_w": 600, + "max_observed_power_w": 600.3225, + "max_observed_temp_c": 80, + "calibration_attempts": 1, + "status": "OK" + }, + { + "index": 7, + "name": "NVIDIA RTX PRO 6000 Blackwell Server Edition", + "bus_id": "00000000:CF:00.0", + "applied_power_limit_w": 600, + "stable_power_limit_w": 600, + "max_observed_power_w": 600.31, + "max_observed_temp_c": 78.5, + "calibration_attempts": 1, + "status": "OK" + }, + { + "index": 4, + "name": "NVIDIA RTX PRO 6000 Blackwell Server Edition", + "bus_id": "00000000:CB:00.0", + "applied_power_limit_w": 600, + "stable_power_limit_w": 600, + "max_observed_power_w": 600.2769999999999, + "max_observed_temp_c": 75, + "calibration_attempts": 1, + "status": "OK" + }, + { + "index": 2, + "name": "NVIDIA RTX PRO 6000 Blackwell Server Edition", + "bus_id": "00000000:4E:00.0", + "applied_power_limit_w": 600, + "stable_power_limit_w": 600, + "max_observed_power_w": 600.24, + "max_observed_temp_c": 79, + "calibration_attempts": 1, + "status": "OK" + }, + { + "index": 0, + "name": "NVIDIA RTX PRO 6000 Blackwell Server Edition", + "bus_id": "00000000:4B:00.0", + "applied_power_limit_w": 600, + "stable_power_limit_w": 600, + "max_observed_power_w": 600.2385, + "max_observed_temp_c": 79, + "calibration_attempts": 1, + "status": "OK" + }, + { + "index": 1, + "name": "NVIDIA RTX PRO 6000 Blackwell Server Edition", + "bus_id": "00000000:4C:00.0", + "applied_power_limit_w": 600, + "stable_power_limit_w": 600, + "max_observed_power_w": 600.23, + "max_observed_temp_c": 80, + "calibration_attempts": 1, + "status": "OK" + }, + { + "index": 6, + "name": "NVIDIA RTX PRO 6000 Blackwell Server Edition", + "bus_id": "00000000:CE:00.0", + "applied_power_limit_w": 600, + "stable_power_limit_w": 600, + "max_observed_power_w": 600.207, + "max_observed_temp_c": 77.69999999999999, + "calibration_attempts": 1, + "status": "OK" + } + ] +} \ No newline at end of file diff --git a/power/power-20260417-150143/result.json b/power/power-20260417-150143/result.json new file mode 100644 index 0000000..c2c6def --- /dev/null +++ b/power/power-20260417-150143/result.json @@ -0,0 +1,248 @@ +{ + "benchmark_version": "2", + "generated_at": "2026-04-17T15:01:44.215985718Z", + "hostname": "debian", + "server_model": "CG480-S5063", + "benchmark_profile": "standard", + "selected_gpu_indices": [ + 0, + 1, + 2, + 3, + 4, + 5, + 6, + 7 + ], + "recommended_slot_order": [ + 4, + 6, + 1, + 5, + 7, + 3, + 2, + 0 + ], + "ramp_steps": [ + { + "step_index": 1, + "gpu_indices": [ + 4 + ], + "new_gpu_index": 4, + "new_gpu_stable_limit_w": 600, + "total_observed_power_w": 536.5079999999999, + "avg_observed_power_w": 536.5079999999999, + "status": "OK" + }, + { + "step_index": 2, + "gpu_indices": [ + 4, + 6 + ], + "new_gpu_index": 6, + "new_gpu_stable_limit_w": 600, + "total_observed_power_w": 1069.88, + "avg_observed_power_w": 534.94, + "status": "OK" + }, + { + "step_index": 3, + "gpu_indices": [ + 4, + 6, + 1 + ], + "new_gpu_index": 1, + "new_gpu_stable_limit_w": 600, + "total_observed_power_w": 1598.971, + "avg_observed_power_w": 532.9903333333333, + "status": "OK" + }, + { + "step_index": 4, + "gpu_indices": [ + 4, + 6, + 1, + 5 + ], + "new_gpu_index": 5, + "new_gpu_stable_limit_w": 600, + "total_observed_power_w": 2123.74, + "avg_observed_power_w": 530.935, + "status": "OK" + }, + { + "step_index": 5, + "gpu_indices": [ + 4, + 6, + 1, + 5, + 7 + ], + "new_gpu_index": 7, + "new_gpu_stable_limit_w": 600, + "total_observed_power_w": 2643.2739999999994, + "avg_observed_power_w": 528.6547999999999, + "status": "OK" + }, + { + "step_index": 6, + "gpu_indices": [ + 4, + 6, + 1, + 5, + 7, + 3 + ], + "new_gpu_index": 3, + "new_gpu_stable_limit_w": 600, + "total_observed_power_w": 3167.317, + "avg_observed_power_w": 527.8861666666667, + "status": "OK" + }, + { + "step_index": 7, + "gpu_indices": [ + 4, + 6, + 1, + 5, + 7, + 3, + 2 + ], + "new_gpu_index": 2, + "new_gpu_stable_limit_w": 600, + "total_observed_power_w": 3696.143, + "avg_observed_power_w": 528.0204285714286, + "status": "OK" + }, + { + "step_index": 8, + "gpu_indices": [ + 4, + 6, + 1, + 5, + 7, + 3, + 2, + 0 + ], + "new_gpu_index": 0, + "new_gpu_stable_limit_w": 600, + "total_observed_power_w": 4204.626, + "avg_observed_power_w": 525.57825, + "status": "OK" + } + ], + "overall_status": "OK", + "platform_max_tdp_w": 4800, + "server_power": { + "available": true, + "idle_w": 616, + "loaded_w": 1901.0058479532163, + "delta_w": 1285.0058479532163, + "gpu_reported_sum_w": 4800, + "reporting_ratio": 0.26770955165692006 + }, + "findings": [ + "Recommended slot order for installation based on single-card targeted_power: 4,6,1,5,7,3,2,0." + ], + "gpus": [ + { + "index": 4, + "name": "NVIDIA H200 NVL", + "bus_id": "00000000:8F:00.0", + "applied_power_limit_w": 600, + "stable_power_limit_w": 600, + "max_observed_power_w": 536.5079999999999, + "max_observed_temp_c": 69.95, + "calibration_attempts": 1, + "status": "OK" + }, + { + "index": 6, + "name": "NVIDIA H200 NVL", + "bus_id": "00000000:B7:00.0", + "applied_power_limit_w": 600, + "stable_power_limit_w": 600, + "max_observed_power_w": 532.666, + "max_observed_temp_c": 70, + "calibration_attempts": 1, + "status": "OK" + }, + { + "index": 1, + "name": "NVIDIA H200 NVL", + "bus_id": "00000000:11:00.0", + "applied_power_limit_w": 600, + "stable_power_limit_w": 600, + "max_observed_power_w": 530.1025, + "max_observed_temp_c": 70, + "calibration_attempts": 1, + "status": "OK" + }, + { + "index": 5, + "name": "NVIDIA H200 NVL", + "bus_id": "00000000:90:00.0", + "applied_power_limit_w": 600, + "stable_power_limit_w": 600, + "max_observed_power_w": 525.725, + "max_observed_temp_c": 68, + "calibration_attempts": 1, + "status": "OK" + }, + { + "index": 7, + "name": "NVIDIA H200 NVL", + "bus_id": "00000000:B8:00.0", + "applied_power_limit_w": 600, + "stable_power_limit_w": 600, + "max_observed_power_w": 523.176, + "max_observed_temp_c": 69, + "calibration_attempts": 1, + "status": "OK" + }, + { + "index": 3, + "name": "NVIDIA H200 NVL", + "bus_id": "00000000:38:00.0", + "applied_power_limit_w": 600, + "stable_power_limit_w": 600, + "max_observed_power_w": 520.5989999999999, + "max_observed_temp_c": 68, + "calibration_attempts": 1, + "status": "OK" + }, + { + "index": 2, + "name": "NVIDIA H200 NVL", + "bus_id": "00000000:37:00.0", + "applied_power_limit_w": 600, + "stable_power_limit_w": 600, + "max_observed_power_w": 520.3979999999999, + "max_observed_temp_c": 68, + "calibration_attempts": 1, + "status": "OK" + }, + { + "index": 0, + "name": "NVIDIA H200 NVL", + "bus_id": "00000000:10:00.0", + "applied_power_limit_w": 600, + "stable_power_limit_w": 600, + "max_observed_power_w": 515.665, + "max_observed_temp_c": 67, + "calibration_attempts": 1, + "status": "OK" + } + ] +} \ No newline at end of file