Files
pub-beebench/perf/perf-20260416-114112/result.json
Mikhail Chusavitin 13eb0e5548 v8 bench result push
2026-04-16 13:01:42 +03:00

1238 lines
38 KiB
JSON

{
"benchmark_version": "2",
"generated_at": "2026-04-16T11:41:12.543280058Z",
"hostname": "debian",
"server_model": "MLT-S06",
"benchmark_profile": "standard",
"parallel_gpus": true,
"ramp_total": 4,
"ramp_run_id": "ramp-20260416-105042",
"overall_status": "OK",
"selected_gpu_indices": [
0,
1,
2,
3
],
"findings": [
"All 4 GPU(s) passed the benchmark.",
"GPU 0 average SM clock stayed below the requested lock target.",
"[HARD STOP] GPU 0: p95 temperature 83.0°C — only 7.0°C from shutdown threshold (90°C). Do not operate.",
"GPU 1 average SM clock stayed below the requested lock target.",
"[HARD STOP] GPU 1: p95 temperature 84.0°C — only 6.0°C from shutdown threshold (90°C). Do not operate.",
"GPU 2 average SM clock stayed below the requested lock target.",
"[HARD STOP] GPU 2: p95 temperature 82.0°C — only 8.0°C from shutdown threshold (90°C). Do not operate.",
"GPU 3 average SM clock stayed below the requested lock target.",
"[HARD STOP] GPU 3: p95 temperature 81.0°C — only 9.0°C from shutdown threshold (90°C). Do not operate.",
"Multi-GPU all_reduce max bus bandwidth: 8.5 GB/s."
],
"normalization": {
"status": "full",
"gpus": [
{
"index": 0,
"persistence_mode": "applied",
"gpu_clock_lock_mhz": 1980,
"gpu_clock_lock_status": "applied",
"memory_clock_lock_mhz": 2619,
"memory_clock_lock_status": "applied"
},
{
"index": 1,
"persistence_mode": "applied",
"gpu_clock_lock_mhz": 1980,
"gpu_clock_lock_status": "applied",
"memory_clock_lock_mhz": 2619,
"memory_clock_lock_status": "applied"
},
{
"index": 2,
"persistence_mode": "applied",
"gpu_clock_lock_mhz": 1980,
"gpu_clock_lock_status": "applied",
"memory_clock_lock_mhz": 2619,
"memory_clock_lock_status": "applied"
},
{
"index": 3,
"persistence_mode": "applied",
"gpu_clock_lock_mhz": 1980,
"gpu_clock_lock_status": "applied",
"memory_clock_lock_mhz": 2619,
"memory_clock_lock_status": "applied"
}
]
},
"host_config": {
"cpu_model": "Intel(R) Xeon(R) Gold 6430",
"cpu_sockets": 2,
"cpu_cores": 64,
"cpu_threads": 128,
"mem_total_gib": 62.53376007080078
},
"cpu_load": {
"avg_pct": 2.3,
"max_pct": 3.4,
"p95_pct": 3.3,
"samples": 97,
"status": "ok"
},
"cooling": {
"available": true,
"avg_fan_rpm": 6615.8536585365855,
"fan_duty_cycle_available": true,
"fan_duty_cycle_estimated": true,
"avg_fan_duty_cycle_pct": 88.43895180023259,
"p95_fan_duty_cycle_pct": 93.25892857142858,
"notes": [
"fan duty cycle is estimated from the highest fan RPM observed since boot; treat it as an approximation, not a direct PWM reading"
]
},
"gpus": [
{
"index": 0,
"uuid": "GPU-a87b1588-4e92-bd7b-74be-9db000808a64",
"name": "NVIDIA H100 80GB HBM3",
"bus_id": "00000000:49:00.0",
"vbios": "96.00.74.00.01",
"compute_capability": "9.0",
"backend": "cublasLt",
"status": "OK",
"power_limit_w": 700,
"default_power_limit_w": 700,
"max_graphics_clock_mhz": 1980,
"max_memory_clock_mhz": 2619,
"locked_graphics_clock_mhz": 1980,
"locked_memory_clock_mhz": 2619,
"baseline": {
"duration_sec": 17.385049678,
"samples": 1,
"avg_temp_c": 75,
"p95_temp_c": 75,
"avg_power_w": 197.2,
"p95_power_w": 197.2,
"avg_graphics_clock_mhz": 1830,
"p95_graphics_clock_mhz": 1830,
"avg_memory_clock_mhz": 2619,
"p95_memory_clock_mhz": 2619,
"avg_usage_pct": 0,
"avg_mem_usage_pct": 0,
"clock_cv_pct": 0,
"power_cv_pct": 0,
"temp_cv_pct": 0,
"clock_drift_pct": 0
},
"steady": {
"duration_sec": 662.836358356,
"samples": 20,
"avg_temp_c": 81.95,
"p95_temp_c": 83,
"avg_power_w": 675.5280000000001,
"p95_power_w": 700.8689999999999,
"avg_graphics_clock_mhz": 1236.75,
"p95_graphics_clock_mhz": 1317.0000000000005,
"avg_memory_clock_mhz": 2619,
"p95_memory_clock_mhz": 2619,
"avg_usage_pct": 95,
"avg_mem_usage_pct": 54.3,
"clock_cv_pct": 11.585634603268,
"power_cv_pct": 14.608602041360047,
"temp_cv_pct": 3.730772604322257,
"clock_drift_pct": 0
},
"precision_steady": [
{
"precision": "int8",
"status": "OK",
"steady": {
"duration_sec": 49.409457157,
"samples": 2,
"avg_temp_c": 56,
"p95_temp_c": 62.3,
"avg_power_w": 449.65,
"p95_power_w": 673.525,
"avg_graphics_clock_mhz": 1522.5,
"p95_graphics_clock_mhz": 1799.25,
"avg_memory_clock_mhz": 2619,
"p95_memory_clock_mhz": 2619,
"avg_usage_pct": 51.5,
"avg_mem_usage_pct": 43.5,
"clock_cv_pct": 20.19704433497537,
"power_cv_pct": 55.32080507061047,
"temp_cv_pct": 12.5,
"clock_drift_pct": 0
},
"teraops_per_sec": 1151.2555751079935,
"weighted_teraops_per_sec": 287.8138937769984,
"ecc": {
"corrected": 0,
"uncorrected": 0
}
},
{
"precision": "fp8",
"status": "OK",
"steady": {
"duration_sec": 98.16537359,
"samples": 2,
"avg_temp_c": 70.5,
"p95_temp_c": 72.75,
"avg_power_w": 698.5250000000001,
"p95_power_w": 699.2765,
"avg_graphics_clock_mhz": 1192.5,
"p95_graphics_clock_mhz": 1199.25,
"avg_memory_clock_mhz": 2619,
"p95_memory_clock_mhz": 2619,
"avg_usage_pct": 100,
"avg_mem_usage_pct": 75.5,
"clock_cv_pct": 0.628930817610063,
"power_cv_pct": 0.11953759707955755,
"temp_cv_pct": 3.546099290780142,
"clock_drift_pct": 0
},
"teraops_per_sec": 1418.4876727074816,
"weighted_teraops_per_sec": 354.6219181768704,
"ecc": {
"corrected": 0,
"uncorrected": 0
}
},
{
"precision": "fp16",
"status": "OK",
"steady": {
"duration_sec": 167.856971671,
"samples": 3,
"avg_temp_c": 76.66666666666667,
"p95_temp_c": 77.9,
"avg_power_w": 697.9433333333333,
"p95_power_w": 698.0640000000001,
"avg_graphics_clock_mhz": 1135,
"p95_graphics_clock_mhz": 1140,
"avg_memory_clock_mhz": 2619,
"p95_memory_clock_mhz": 2619,
"avg_usage_pct": 100,
"avg_mem_usage_pct": 64.33333333333333,
"clock_cv_pct": 0.6230015693273546,
"power_cv_pct": 0.019899100362495255,
"temp_cv_pct": 1.6268075594669307,
"clock_drift_pct": 0
},
"teraops_per_sec": 605.7576061293909,
"weighted_teraops_per_sec": 302.87880306469543,
"ecc": {
"corrected": 0,
"uncorrected": 0
}
},
{
"precision": "fp32",
"status": "OK",
"steady": {
"duration_sec": 213.685132072,
"samples": 2,
"avg_temp_c": 78.5,
"p95_temp_c": 78.95,
"avg_power_w": 699.62,
"p95_power_w": 700.061,
"avg_graphics_clock_mhz": 1185,
"p95_graphics_clock_mhz": 1185,
"avg_memory_clock_mhz": 2619,
"p95_memory_clock_mhz": 2619,
"avg_usage_pct": 100,
"avg_mem_usage_pct": 100,
"clock_cv_pct": 0,
"power_cv_pct": 0.07003802063977718,
"temp_cv_pct": 0.6369426751592357,
"clock_drift_pct": 0
},
"teraops_per_sec": 329.0028834816,
"weighted_teraops_per_sec": 329.0028834816,
"ecc": {
"corrected": 0,
"uncorrected": 0
}
}
],
"cooldown": {
"duration_sec": 0,
"samples": 0,
"avg_temp_c": 0,
"p95_temp_c": 0,
"avg_power_w": 0,
"p95_power_w": 0,
"avg_graphics_clock_mhz": 0,
"p95_graphics_clock_mhz": 0,
"avg_memory_clock_mhz": 0,
"p95_memory_clock_mhz": 0,
"avg_usage_pct": 0,
"avg_mem_usage_pct": 0,
"clock_cv_pct": 0,
"power_cv_pct": 0,
"temp_cv_pct": 0,
"clock_drift_pct": 0
},
"throttle_counters": {
"sw_power_cap_us": 199977,
"sw_thermal_slowdown_us": 199977,
"sync_boost_us": 0,
"hw_thermal_slowdown_us": 0,
"hw_power_brake_slowdown_us": 0
},
"ecc": {
"corrected": 0,
"uncorrected": 0
},
"precision_results": [
{
"name": "fp16_tensor",
"category": "fp16_bf16",
"supported": true,
"lanes": 16,
"m": 10880,
"n": 10880,
"k": 10880,
"iterations": 25760,
"teraops_per_sec": 221.17767359146666,
"weight": 0.5,
"weighted_teraops_per_sec": 110.58883679573333
},
{
"name": "fp32_tf32",
"category": "fp32_tf32",
"supported": true,
"lanes": 16,
"m": 7680,
"n": 7680,
"k": 7680,
"iterations": 25760,
"teraops_per_sec": 77.7925951488,
"weight": 1,
"weighted_teraops_per_sec": 77.7925951488
},
{
"name": "fp64",
"category": "fp64",
"supported": false,
"weight": 2,
"notes": "benchmark_disabled"
},
{
"name": "fp8_e4m3",
"category": "fp8",
"supported": true,
"lanes": 16,
"m": 12544,
"n": 12544,
"k": 12544,
"iterations": 25760,
"teraops_per_sec": 338.9711491355989,
"weight": 0.25,
"weighted_teraops_per_sec": 84.74278728389973
},
{
"name": "fp8_e5m2",
"category": "fp8",
"supported": false,
"weight": 0.25,
"notes": "unsupported"
},
{
"name": "int8_tensor",
"category": "int8",
"supported": true,
"lanes": 16,
"m": 9728,
"n": 9728,
"k": 9728,
"iterations": 25760,
"teraops_per_sec": 158.09760300018348,
"weight": 0.25,
"weighted_teraops_per_sec": 39.52440075004587
}
],
"scores": {
"compute_score": 1368.112084493708,
"synthetic_score": 1274.3174985001642,
"mixed_score": 312.6486199784789,
"mixed_efficiency": 0.24534593642985952,
"power_sustain_score": 74.84289396143863,
"thermal_sustain_score": 88.80768218703324,
"stability_score": 99.93966022005914,
"thermal_throttle_pct": 0.030169889970428448,
"power_cap_throttle_pct": 0.030169889970428448,
"temp_headroom_c": 7,
"interconnect_score": 8.51,
"server_quality_score": 89.07103693256522,
"composite_score": 1368.112084493708
},
"degradation_reasons": [
"low_sm_clock_vs_target"
]
},
{
"index": 1,
"uuid": "GPU-30b320aa-c18f-6b25-d0ed-24aeb14f1fd3",
"name": "NVIDIA H100 80GB HBM3",
"bus_id": "00000000:5A:00.0",
"vbios": "96.00.74.00.01",
"compute_capability": "9.0",
"backend": "cublasLt",
"status": "OK",
"power_limit_w": 700,
"default_power_limit_w": 700,
"max_graphics_clock_mhz": 1980,
"max_memory_clock_mhz": 2619,
"locked_graphics_clock_mhz": 1980,
"locked_memory_clock_mhz": 2619,
"baseline": {
"duration_sec": 17.385049678,
"samples": 1,
"avg_temp_c": 77,
"p95_temp_c": 77,
"avg_power_w": 195.54,
"p95_power_w": 195.54,
"avg_graphics_clock_mhz": 1830,
"p95_graphics_clock_mhz": 1830,
"avg_memory_clock_mhz": 2619,
"p95_memory_clock_mhz": 2619,
"avg_usage_pct": 0,
"avg_mem_usage_pct": 0,
"clock_cv_pct": 0,
"power_cv_pct": 0,
"temp_cv_pct": 0,
"clock_drift_pct": 0
},
"steady": {
"duration_sec": 662.836358356,
"samples": 20,
"avg_temp_c": 82.75,
"p95_temp_c": 84,
"avg_power_w": 675.284,
"p95_power_w": 698.549,
"avg_graphics_clock_mhz": 1200.75,
"p95_graphics_clock_mhz": 1260.0000000000005,
"avg_memory_clock_mhz": 2619,
"p95_memory_clock_mhz": 2619,
"avg_usage_pct": 95,
"avg_mem_usage_pct": 54.6,
"clock_cv_pct": 12.413713513714427,
"power_cv_pct": 13.360052051987486,
"temp_cv_pct": 2.6716242863364528,
"clock_drift_pct": 0
},
"precision_steady": [
{
"precision": "int8",
"status": "OK",
"steady": {
"duration_sec": 49.409457157,
"samples": 2,
"avg_temp_c": 59,
"p95_temp_c": 64.4,
"avg_power_w": 458.19500000000005,
"p95_power_w": 674.5415,
"avg_graphics_clock_mhz": 1507.5,
"p95_graphics_clock_mhz": 1797.75,
"avg_memory_clock_mhz": 2619,
"p95_memory_clock_mhz": 2619,
"avg_usage_pct": 50.5,
"avg_mem_usage_pct": 42,
"clock_cv_pct": 21.393034825870647,
"power_cv_pct": 52.463470793002976,
"temp_cv_pct": 10.16949152542373,
"clock_drift_pct": 0
},
"teraops_per_sec": 1148.3556870094847,
"weighted_teraops_per_sec": 287.08892175237116,
"ecc": {
"corrected": 0,
"uncorrected": 0
}
},
{
"precision": "fp8",
"status": "OK",
"steady": {
"duration_sec": 98.16537359,
"samples": 2,
"avg_temp_c": 72,
"p95_temp_c": 73.8,
"avg_power_w": 698.045,
"p95_power_w": 699.0485,
"avg_graphics_clock_mhz": 1140,
"p95_graphics_clock_mhz": 1167,
"avg_memory_clock_mhz": 2619,
"p95_memory_clock_mhz": 2619,
"avg_usage_pct": 100,
"avg_mem_usage_pct": 74,
"clock_cv_pct": 2.631578947368421,
"power_cv_pct": 0.15973182244697823,
"temp_cv_pct": 2.7777777777777777,
"clock_drift_pct": 0
},
"teraops_per_sec": 1416.711232290816,
"weighted_teraops_per_sec": 354.177808072704,
"ecc": {
"corrected": 0,
"uncorrected": 0
}
},
{
"precision": "fp16",
"status": "OK",
"steady": {
"duration_sec": 167.856971671,
"samples": 3,
"avg_temp_c": 77.66666666666667,
"p95_temp_c": 78.9,
"avg_power_w": 698.4033333333333,
"p95_power_w": 698.7579999999999,
"avg_graphics_clock_mhz": 1105,
"p95_graphics_clock_mhz": 1110,
"avg_memory_clock_mhz": 2619,
"p95_memory_clock_mhz": 2619,
"avg_usage_pct": 100,
"avg_mem_usage_pct": 61.666666666666664,
"clock_cv_pct": 0.6399156390828484,
"power_cv_pct": 0.04956354727495949,
"temp_cv_pct": 1.6058615393879574,
"clock_drift_pct": 0
},
"teraops_per_sec": 605.7576061293909,
"weighted_teraops_per_sec": 302.87880306469543,
"ecc": {
"corrected": 0,
"uncorrected": 0
}
},
{
"precision": "fp32",
"status": "OK",
"steady": {
"duration_sec": 213.685132072,
"samples": 2,
"avg_temp_c": 79.5,
"p95_temp_c": 79.95,
"avg_power_w": 698.665,
"p95_power_w": 698.7774999999999,
"avg_graphics_clock_mhz": 1155,
"p95_graphics_clock_mhz": 1155,
"avg_memory_clock_mhz": 2619,
"p95_memory_clock_mhz": 2619,
"avg_usage_pct": 100,
"avg_mem_usage_pct": 100,
"clock_cv_pct": 0,
"power_cv_pct": 0.017891264053587916,
"temp_cv_pct": 0.628930817610063,
"clock_drift_pct": 0
},
"teraops_per_sec": 327.9836676096,
"weighted_teraops_per_sec": 327.9836676096,
"ecc": {
"corrected": 0,
"uncorrected": 0
}
}
],
"cooldown": {
"duration_sec": 0,
"samples": 0,
"avg_temp_c": 0,
"p95_temp_c": 0,
"avg_power_w": 0,
"p95_power_w": 0,
"avg_graphics_clock_mhz": 0,
"p95_graphics_clock_mhz": 0,
"avg_memory_clock_mhz": 0,
"p95_memory_clock_mhz": 0,
"avg_usage_pct": 0,
"avg_mem_usage_pct": 0,
"clock_cv_pct": 0,
"power_cv_pct": 0,
"temp_cv_pct": 0,
"clock_drift_pct": 0
},
"throttle_counters": {
"sw_power_cap_us": 200032,
"sw_thermal_slowdown_us": 200032,
"sync_boost_us": 0,
"hw_thermal_slowdown_us": 0,
"hw_power_brake_slowdown_us": 0
},
"ecc": {
"corrected": 0,
"uncorrected": 0
},
"precision_results": [
{
"name": "fp16_tensor",
"category": "fp16_bf16",
"supported": true,
"lanes": 16,
"m": 10880,
"n": 10880,
"k": 10880,
"iterations": 24640,
"teraops_per_sec": 211.56125300053336,
"weight": 0.5,
"weighted_teraops_per_sec": 105.78062650026668
},
{
"name": "fp32_tf32",
"category": "fp32_tf32",
"supported": true,
"lanes": 16,
"m": 7680,
"n": 7680,
"k": 7680,
"iterations": 24640,
"teraops_per_sec": 74.4103084032,
"weight": 1,
"weighted_teraops_per_sec": 74.4103084032
},
{
"name": "fp64",
"category": "fp64",
"supported": false,
"weight": 2,
"notes": "benchmark_disabled"
},
{
"name": "fp8_e4m3",
"category": "fp8",
"supported": true,
"lanes": 16,
"m": 12544,
"n": 12544,
"k": 12544,
"iterations": 24640,
"teraops_per_sec": 324.23327308622504,
"weight": 0.25,
"weighted_teraops_per_sec": 81.05831827155626
},
{
"name": "fp8_e5m2",
"category": "fp8",
"supported": false,
"weight": 0.25,
"notes": "unsupported"
},
{
"name": "int8_tensor",
"category": "int8",
"supported": true,
"lanes": 16,
"m": 9728,
"n": 9728,
"k": 9728,
"iterations": 24640,
"teraops_per_sec": 151.22379417408854,
"weight": 0.25,
"weighted_teraops_per_sec": 37.805948543522135
}
],
"scores": {
"compute_score": 1361.845761014934,
"synthetic_score": 1272.1292004993704,
"mixed_score": 299.05520171854505,
"mixed_efficiency": 0.2350824126992383,
"power_sustain_score": 74.82961002466836,
"thermal_sustain_score": 91.98512714099064,
"stability_score": 99.9396436247112,
"thermal_throttle_pct": 0.030178187644402825,
"power_cap_throttle_pct": 0.030178187644402825,
"temp_headroom_c": 6,
"interconnect_score": 8.51,
"server_quality_score": 90.02027859958218,
"composite_score": 1361.845761014934
},
"degradation_reasons": [
"low_sm_clock_vs_target"
]
},
{
"index": 2,
"uuid": "GPU-0182c11c-0c2c-aafd-0ada-113b64147ee6",
"name": "NVIDIA H100 80GB HBM3",
"bus_id": "00000000:C8:00.0",
"vbios": "96.00.74.00.01",
"compute_capability": "9.0",
"backend": "cublasLt",
"status": "OK",
"power_limit_w": 700,
"default_power_limit_w": 700,
"max_graphics_clock_mhz": 1980,
"max_memory_clock_mhz": 2619,
"locked_graphics_clock_mhz": 1980,
"locked_memory_clock_mhz": 2619,
"baseline": {
"duration_sec": 17.385049678,
"samples": 1,
"avg_temp_c": 76,
"p95_temp_c": 76,
"avg_power_w": 164.84,
"p95_power_w": 164.84,
"avg_graphics_clock_mhz": 1830,
"p95_graphics_clock_mhz": 1830,
"avg_memory_clock_mhz": 2619,
"p95_memory_clock_mhz": 2619,
"avg_usage_pct": 0,
"avg_mem_usage_pct": 0,
"clock_cv_pct": 0,
"power_cv_pct": 0,
"temp_cv_pct": 0,
"clock_drift_pct": 0
},
"steady": {
"duration_sec": 662.836358356,
"samples": 20,
"avg_temp_c": 81.25,
"p95_temp_c": 82,
"avg_power_w": 675.9855,
"p95_power_w": 699.2245,
"avg_graphics_clock_mhz": 1206,
"p95_graphics_clock_mhz": 1288.5000000000005,
"avg_memory_clock_mhz": 2619,
"p95_memory_clock_mhz": 2619,
"avg_usage_pct": 95,
"avg_mem_usage_pct": 58,
"clock_cv_pct": 12.37171492617732,
"power_cv_pct": 13.413148128049624,
"temp_cv_pct": 2.7209465808534334,
"clock_drift_pct": 0
},
"precision_steady": [
{
"precision": "int8",
"status": "OK",
"steady": {
"duration_sec": 49.409457157,
"samples": 2,
"avg_temp_c": 57.5,
"p95_temp_c": 63.35,
"avg_power_w": 460.045,
"p95_power_w": 674.5464999999999,
"avg_graphics_clock_mhz": 1515,
"p95_graphics_clock_mhz": 1798.5,
"avg_memory_clock_mhz": 2619,
"p95_memory_clock_mhz": 2619,
"avg_usage_pct": 50,
"avg_mem_usage_pct": 43,
"clock_cv_pct": 20.792079207920793,
"power_cv_pct": 51.806888456564025,
"temp_cv_pct": 11.304347826086957,
"clock_drift_pct": 0
},
"teraops_per_sec": 1149.1842264662016,
"weighted_teraops_per_sec": 287.2960566165504,
"ecc": {
"corrected": 0,
"uncorrected": 0
}
},
{
"precision": "fp8",
"status": "OK",
"steady": {
"duration_sec": 98.16537359,
"samples": 2,
"avg_temp_c": 71,
"p95_temp_c": 72.8,
"avg_power_w": 698.405,
"p95_power_w": 698.5625,
"avg_graphics_clock_mhz": 1147.5,
"p95_graphics_clock_mhz": 1181.25,
"avg_memory_clock_mhz": 2619,
"p95_memory_clock_mhz": 2619,
"avg_usage_pct": 100,
"avg_mem_usage_pct": 73.5,
"clock_cv_pct": 3.2679738562091507,
"power_cv_pct": 0.0250570943793374,
"temp_cv_pct": 2.8169014084507045,
"clock_drift_pct": 0
},
"teraops_per_sec": 1417.5994524991488,
"weighted_teraops_per_sec": 354.3998631247872,
"ecc": {
"corrected": 0,
"uncorrected": 0
}
},
{
"precision": "fp16",
"status": "OK",
"steady": {
"duration_sec": 167.856971671,
"samples": 3,
"avg_temp_c": 76.66666666666667,
"p95_temp_c": 77.9,
"avg_power_w": 698.4433333333333,
"p95_power_w": 698.761,
"avg_graphics_clock_mhz": 1120,
"p95_graphics_clock_mhz": 1125,
"avg_memory_clock_mhz": 2619,
"p95_memory_clock_mhz": 2619,
"avg_usage_pct": 100,
"avg_mem_usage_pct": 62.333333333333336,
"clock_cv_pct": 0.6313453403451318,
"power_cv_pct": 0.057274192153024955,
"temp_cv_pct": 1.6268075594669307,
"clock_drift_pct": 0
},
"teraops_per_sec": 605.7576061293909,
"weighted_teraops_per_sec": 302.87880306469543,
"ecc": {
"corrected": 0,
"uncorrected": 0
}
},
{
"precision": "fp32",
"status": "OK",
"steady": {
"duration_sec": 213.685132072,
"samples": 2,
"avg_temp_c": 78.5,
"p95_temp_c": 78.95,
"avg_power_w": 699.605,
"p95_power_w": 699.9784999999999,
"avg_graphics_clock_mhz": 1162.5,
"p95_graphics_clock_mhz": 1169.25,
"avg_memory_clock_mhz": 2619,
"p95_memory_clock_mhz": 2619,
"avg_usage_pct": 100,
"avg_mem_usage_pct": 100,
"clock_cv_pct": 0.6451612903225806,
"power_cv_pct": 0.059319187255660495,
"temp_cv_pct": 0.6369426751592357,
"clock_drift_pct": 0
},
"teraops_per_sec": 328.5951971328,
"weighted_teraops_per_sec": 328.5951971328,
"ecc": {
"corrected": 0,
"uncorrected": 0
}
}
],
"cooldown": {
"duration_sec": 0,
"samples": 0,
"avg_temp_c": 0,
"p95_temp_c": 0,
"avg_power_w": 0,
"p95_power_w": 0,
"avg_graphics_clock_mhz": 0,
"p95_graphics_clock_mhz": 0,
"avg_memory_clock_mhz": 0,
"p95_memory_clock_mhz": 0,
"avg_usage_pct": 0,
"avg_mem_usage_pct": 0,
"clock_cv_pct": 0,
"power_cv_pct": 0,
"temp_cv_pct": 0,
"clock_drift_pct": 0
},
"throttle_counters": {
"sw_power_cap_us": 199451,
"sw_thermal_slowdown_us": 199451,
"sync_boost_us": 0,
"hw_thermal_slowdown_us": 0,
"hw_power_brake_slowdown_us": 0
},
"ecc": {
"corrected": 0,
"uncorrected": 0
},
"precision_results": [
{
"name": "fp16_tensor",
"category": "fp16_bf16",
"supported": true,
"lanes": 16,
"m": 10880,
"n": 10880,
"k": 10880,
"iterations": 24640,
"teraops_per_sec": 211.56125300053336,
"weight": 0.5,
"weighted_teraops_per_sec": 105.78062650026668
},
{
"name": "fp32_tf32",
"category": "fp32_tf32",
"supported": true,
"lanes": 16,
"m": 7680,
"n": 7680,
"k": 7680,
"iterations": 24640,
"teraops_per_sec": 74.4103084032,
"weight": 1,
"weighted_teraops_per_sec": 74.4103084032
},
{
"name": "fp64",
"category": "fp64",
"supported": false,
"weight": 2,
"notes": "benchmark_disabled"
},
{
"name": "fp8_e4m3",
"category": "fp8",
"supported": true,
"lanes": 16,
"m": 12544,
"n": 12544,
"k": 12544,
"iterations": 24640,
"teraops_per_sec": 324.23327308622504,
"weight": 0.25,
"weighted_teraops_per_sec": 81.05831827155626
},
{
"name": "fp8_e5m2",
"category": "fp8",
"supported": false,
"weight": 0.25,
"notes": "unsupported"
},
{
"name": "int8_tensor",
"category": "int8",
"supported": true,
"lanes": 16,
"m": 9728,
"n": 9728,
"k": 9728,
"iterations": 24640,
"teraops_per_sec": 151.22379417408854,
"weight": 0.25,
"weighted_teraops_per_sec": 37.805948543522135
}
],
"scores": {
"compute_score": 1362.8864804543962,
"synthetic_score": 1273.169919938833,
"mixed_score": 299.05520171854505,
"mixed_efficiency": 0.23489025073174255,
"power_sustain_score": 74.89376214465898,
"thermal_sustain_score": 91.8371602574397,
"stability_score": 99.93981893193225,
"thermal_throttle_pct": 0.030090534033873517,
"power_cap_throttle_pct": 0.030090534033873517,
"temp_headroom_c": 8,
"interconnect_score": 8.51,
"server_quality_score": 89.99520429340251,
"composite_score": 1362.8864804543962
},
"degradation_reasons": [
"low_sm_clock_vs_target"
]
},
{
"index": 3,
"uuid": "GPU-9ee0af22-3dda-6f5c-1a13-35c63f324216",
"name": "NVIDIA H100 80GB HBM3",
"bus_id": "00000000:D8:00.0",
"vbios": "96.00.74.00.01",
"compute_capability": "9.0",
"backend": "cublasLt",
"status": "OK",
"power_limit_w": 700,
"default_power_limit_w": 700,
"max_graphics_clock_mhz": 1980,
"max_memory_clock_mhz": 2619,
"locked_graphics_clock_mhz": 1980,
"locked_memory_clock_mhz": 2619,
"baseline": {
"duration_sec": 17.385049678,
"samples": 1,
"avg_temp_c": 74,
"p95_temp_c": 74,
"avg_power_w": 128.02,
"p95_power_w": 128.02,
"avg_graphics_clock_mhz": 1980,
"p95_graphics_clock_mhz": 1980,
"avg_memory_clock_mhz": 2619,
"p95_memory_clock_mhz": 2619,
"avg_usage_pct": 0,
"avg_mem_usage_pct": 0,
"clock_cv_pct": 0,
"power_cv_pct": 0,
"temp_cv_pct": 0,
"clock_drift_pct": 0
},
"steady": {
"duration_sec": 662.836358356,
"samples": 20,
"avg_temp_c": 79.6,
"p95_temp_c": 81,
"avg_power_w": 672.5364999999999,
"p95_power_w": 699.371,
"avg_graphics_clock_mhz": 1232.25,
"p95_graphics_clock_mhz": 1302.7500000000005,
"avg_memory_clock_mhz": 2619,
"p95_memory_clock_mhz": 2619,
"avg_usage_pct": 95,
"avg_mem_usage_pct": 54.8,
"clock_cv_pct": 11.48562205303889,
"power_cv_pct": 13.917412682040126,
"temp_cv_pct": 2.3300548983657547,
"clock_drift_pct": 0
},
"precision_steady": [
{
"precision": "int8",
"status": "OK",
"steady": {
"duration_sec": 49.409457157,
"samples": 2,
"avg_temp_c": 55.5,
"p95_temp_c": 61.35,
"avg_power_w": 454.36,
"p95_power_w": 674.293,
"avg_graphics_clock_mhz": 1522.5,
"p95_graphics_clock_mhz": 1799.25,
"avg_memory_clock_mhz": 2619,
"p95_memory_clock_mhz": 2619,
"avg_usage_pct": 50,
"avg_mem_usage_pct": 42.5,
"clock_cv_pct": 20.19704433497537,
"power_cv_pct": 53.78334360419051,
"temp_cv_pct": 11.711711711711711,
"clock_drift_pct": 0
},
"teraops_per_sec": 1148.7699567378434,
"weighted_teraops_per_sec": 287.19248918446084,
"ecc": {
"corrected": 0,
"uncorrected": 0
}
},
{
"precision": "fp8",
"status": "OK",
"steady": {
"duration_sec": 98.16537359,
"samples": 2,
"avg_temp_c": 69,
"p95_temp_c": 70.8,
"avg_power_w": 698.125,
"p95_power_w": 698.7325,
"avg_graphics_clock_mhz": 1170,
"p95_graphics_clock_mhz": 1197,
"avg_memory_clock_mhz": 2619,
"p95_memory_clock_mhz": 2619,
"avg_usage_pct": 100,
"avg_mem_usage_pct": 72,
"clock_cv_pct": 2.564102564102564,
"power_cv_pct": 0.09668755595344022,
"temp_cv_pct": 2.898550724637681,
"clock_drift_pct": 0
},
"teraops_per_sec": 1417.5994524991488,
"weighted_teraops_per_sec": 354.3998631247872,
"ecc": {
"corrected": 0,
"uncorrected": 0
}
},
{
"precision": "fp16",
"status": "OK",
"steady": {
"duration_sec": 167.856971671,
"samples": 3,
"avg_temp_c": 74.66666666666667,
"p95_temp_c": 75.9,
"avg_power_w": 699.2833333333334,
"p95_power_w": 699.814,
"avg_graphics_clock_mhz": 1140,
"p95_graphics_clock_mhz": 1153.5,
"avg_memory_clock_mhz": 2619,
"p95_memory_clock_mhz": 2619,
"avg_usage_pct": 100,
"avg_mem_usage_pct": 61.666666666666664,
"clock_cv_pct": 1.07433760648385,
"power_cv_pct": 0.06628059905455665,
"temp_cv_pct": 1.6703827619526521,
"clock_drift_pct": 0
},
"teraops_per_sec": 605.7576061293909,
"weighted_teraops_per_sec": 302.87880306469543,
"ecc": {
"corrected": 0,
"uncorrected": 0
}
},
{
"precision": "fp32",
"status": "OK",
"steady": {
"duration_sec": 213.685132072,
"samples": 2,
"avg_temp_c": 76.5,
"p95_temp_c": 76.95,
"avg_power_w": 698.54,
"p95_power_w": 698.963,
"avg_graphics_clock_mhz": 1177.5,
"p95_graphics_clock_mhz": 1184.25,
"avg_memory_clock_mhz": 2619,
"p95_memory_clock_mhz": 2619,
"avg_usage_pct": 100,
"avg_mem_usage_pct": 100,
"clock_cv_pct": 0.6369426751592357,
"power_cv_pct": 0.06728319065479006,
"temp_cv_pct": 0.6535947712418301,
"clock_drift_pct": 0
},
"teraops_per_sec": 328.5951971328,
"weighted_teraops_per_sec": 328.5951971328,
"ecc": {
"corrected": 0,
"uncorrected": 0
}
}
],
"cooldown": {
"duration_sec": 0,
"samples": 0,
"avg_temp_c": 0,
"p95_temp_c": 0,
"avg_power_w": 0,
"p95_power_w": 0,
"avg_graphics_clock_mhz": 0,
"p95_graphics_clock_mhz": 0,
"avg_memory_clock_mhz": 0,
"p95_memory_clock_mhz": 0,
"avg_usage_pct": 0,
"avg_mem_usage_pct": 0,
"clock_cv_pct": 0,
"power_cv_pct": 0,
"temp_cv_pct": 0,
"clock_drift_pct": 0
},
"throttle_counters": {
"sw_power_cap_us": 199962,
"sw_thermal_slowdown_us": 199962,
"sync_boost_us": 0,
"hw_thermal_slowdown_us": 0,
"hw_power_brake_slowdown_us": 0
},
"ecc": {
"corrected": 0,
"uncorrected": 0
},
"precision_results": [
{
"name": "fp16_tensor",
"category": "fp16_bf16",
"supported": true,
"lanes": 16,
"m": 10880,
"n": 10880,
"k": 10880,
"iterations": 25744,
"teraops_per_sec": 221.04029615445333,
"weight": 0.5,
"weighted_teraops_per_sec": 110.52014807722666
},
{
"name": "fp32_tf32",
"category": "fp32_tf32",
"supported": true,
"lanes": 16,
"m": 7680,
"n": 7680,
"k": 7680,
"iterations": 25744,
"teraops_per_sec": 77.74427676672,
"weight": 1,
"weighted_teraops_per_sec": 77.74427676672
},
{
"name": "fp64",
"category": "fp64",
"supported": false,
"weight": 2,
"notes": "benchmark_disabled"
},
{
"name": "fp8_e4m3",
"category": "fp8",
"supported": true,
"lanes": 16,
"m": 12544,
"n": 12544,
"k": 12544,
"iterations": 25744,
"teraops_per_sec": 338.7606080491793,
"weight": 0.25,
"weighted_teraops_per_sec": 84.69015201229483
},
{
"name": "fp8_e5m2",
"category": "fp8",
"supported": false,
"weight": 0.25,
"notes": "unsupported"
},
{
"name": "int8_tensor",
"category": "int8",
"supported": true,
"lanes": 16,
"m": 9728,
"n": 9728,
"k": 9728,
"iterations": 25744,
"teraops_per_sec": 157.99940573123925,
"weight": 0.25,
"weighted_teraops_per_sec": 39.49985143280981
}
],
"scores": {
"compute_score": 1366.8026809934588,
"synthetic_score": 1273.0663525067434,
"mixed_score": 312.4544282890513,
"mixed_efficiency": 0.2454345193192876,
"power_sustain_score": 74.8273114907529,
"thermal_sustain_score": 93.00983530490274,
"stability_score": 99.93966474606313,
"thermal_throttle_pct": 0.03016762696843544,
"power_cap_throttle_pct": 0.03016762696843544,
"temp_headroom_c": 9,
"interconnect_score": 8.51,
"server_quality_score": 90.32700993712194,
"composite_score": 1366.8026809934588
},
"degradation_reasons": [
"low_sm_clock_vs_target"
]
}
],
"interconnect": {
"status": "OK",
"attempted": true,
"supported": true,
"selected_gpu_indices": [
0,
1,
2,
3
],
"avg_algbw_gbps": 5.59,
"max_algbw_gbps": 5.67,
"avg_busbw_gbps": 8.3875,
"max_busbw_gbps": 8.51
},
"server_power": {
"available": false,
"notes": [
"IPMI power reading unavailable; server-side power characterization skipped"
]
}
}