Files
Mikhail Chusavitin 9880f77de7 add new mlt results
2026-04-16 15:35:51 +03:00

1238 lines
38 KiB
JSON

{
"benchmark_version": "2",
"generated_at": "2026-04-16T14:21:13.433467372Z",
"hostname": "debian",
"server_model": "MLT-S06",
"benchmark_profile": "standard",
"parallel_gpus": true,
"ramp_total": 4,
"ramp_run_id": "ramp-20260416-133118",
"overall_status": "OK",
"selected_gpu_indices": [
0,
1,
2,
3
],
"findings": [
"All 4 GPU(s) passed the benchmark.",
"GPU 0 average SM clock stayed below the requested lock target.",
"[HARD STOP] GPU 0: p95 temperature 85.0°C — only 5.0°C from shutdown threshold (90°C). Do not operate.",
"GPU 1 average SM clock stayed below the requested lock target.",
"[HARD STOP] GPU 1: p95 temperature 85.0°C — only 5.0°C from shutdown threshold (90°C). Do not operate.",
"GPU 2 average SM clock stayed below the requested lock target.",
"[HARD STOP] GPU 2: p95 temperature 83.0°C — only 7.0°C from shutdown threshold (90°C). Do not operate.",
"GPU 3 average SM clock stayed below the requested lock target.",
"[HARD STOP] GPU 3: p95 temperature 82.0°C — only 8.0°C from shutdown threshold (90°C). Do not operate.",
"Multi-GPU all_reduce max bus bandwidth: 8.6 GB/s."
],
"normalization": {
"status": "full",
"gpus": [
{
"index": 0,
"persistence_mode": "applied",
"gpu_clock_lock_mhz": 1980,
"gpu_clock_lock_status": "applied",
"memory_clock_lock_mhz": 2619,
"memory_clock_lock_status": "applied"
},
{
"index": 1,
"persistence_mode": "applied",
"gpu_clock_lock_mhz": 1980,
"gpu_clock_lock_status": "applied",
"memory_clock_lock_mhz": 2619,
"memory_clock_lock_status": "applied"
},
{
"index": 2,
"persistence_mode": "applied",
"gpu_clock_lock_mhz": 1980,
"gpu_clock_lock_status": "applied",
"memory_clock_lock_mhz": 2619,
"memory_clock_lock_status": "applied"
},
{
"index": 3,
"persistence_mode": "applied",
"gpu_clock_lock_mhz": 1980,
"gpu_clock_lock_status": "applied",
"memory_clock_lock_mhz": 2619,
"memory_clock_lock_status": "applied"
}
]
},
"host_config": {
"cpu_model": "Intel(R) Xeon(R) Gold 6430",
"cpu_sockets": 2,
"cpu_cores": 64,
"cpu_threads": 128,
"mem_total_gib": 62.53376007080078
},
"cpu_load": {
"avg_pct": 2.5,
"max_pct": 3.4,
"p95_pct": 3.3,
"samples": 88,
"status": "ok"
},
"cooling": {
"available": true,
"avg_fan_rpm": 6445.138888888889,
"fan_duty_cycle_available": true,
"fan_duty_cycle_estimated": true,
"avg_fan_duty_cycle_pct": 87.26521164021146,
"p95_fan_duty_cycle_pct": 95.65252976190474,
"notes": [
"fan duty cycle is estimated from the highest fan RPM observed since boot; treat it as an approximation, not a direct PWM reading"
]
},
"gpus": [
{
"index": 0,
"uuid": "GPU-a87b1588-4e92-bd7b-74be-9db000808a64",
"name": "NVIDIA H100 80GB HBM3",
"bus_id": "00000000:49:00.0",
"vbios": "96.00.74.00.01",
"compute_capability": "9.0",
"backend": "cublasLt",
"status": "OK",
"power_limit_w": 700,
"default_power_limit_w": 700,
"max_graphics_clock_mhz": 1980,
"max_memory_clock_mhz": 2619,
"locked_graphics_clock_mhz": 1980,
"locked_memory_clock_mhz": 2619,
"baseline": {
"duration_sec": 20.487515832,
"samples": 1,
"avg_temp_c": 69,
"p95_temp_c": 69,
"avg_power_w": 181.66,
"p95_power_w": 181.66,
"avg_graphics_clock_mhz": 1830,
"p95_graphics_clock_mhz": 1830,
"avg_memory_clock_mhz": 2619,
"p95_memory_clock_mhz": 2619,
"avg_usage_pct": 0,
"avg_mem_usage_pct": 0,
"clock_cv_pct": 0,
"power_cv_pct": 0,
"temp_cv_pct": 0,
"clock_drift_pct": 0
},
"steady": {
"duration_sec": 715.865398029,
"samples": 21,
"avg_temp_c": 81.23809523809524,
"p95_temp_c": 85,
"avg_power_w": 629.2452380952379,
"p95_power_w": 697.96,
"avg_graphics_clock_mhz": 1300.7142857142858,
"p95_graphics_clock_mhz": 1830,
"avg_memory_clock_mhz": 2619,
"p95_memory_clock_mhz": 2619,
"avg_usage_pct": 85.71428571428571,
"avg_mem_usage_pct": 50.61904761904762,
"clock_cv_pct": 17.027510138414932,
"power_cv_pct": 25.700013778114617,
"temp_cv_pct": 8.408169321004037,
"clock_drift_pct": 0
},
"precision_steady": [
{
"precision": "int8",
"status": "OK",
"steady": {
"duration_sec": 51.349862924,
"samples": 2,
"avg_temp_c": 65.5,
"p95_temp_c": 70.45,
"avg_power_w": 458.21500000000003,
"p95_power_w": 675.1015,
"avg_graphics_clock_mhz": 1507.5,
"p95_graphics_clock_mhz": 1797.75,
"avg_memory_clock_mhz": 2619,
"p95_memory_clock_mhz": 2619,
"avg_usage_pct": 50.5,
"avg_mem_usage_pct": 42.5,
"clock_cv_pct": 21.393034825870647,
"power_cv_pct": 52.59212378468623,
"temp_cv_pct": 8.396946564885496,
"clock_drift_pct": 0
},
"teraops_per_sec": 1149.1842264662016,
"weighted_teraops_per_sec": 287.2960566165504,
"ecc": {
"corrected": 0,
"uncorrected": 0
}
},
{
"precision": "fp8",
"status": "OK",
"steady": {
"duration_sec": 112.097913814,
"samples": 3,
"avg_temp_c": 76.66666666666667,
"p95_temp_c": 78.8,
"avg_power_w": 698.3166666666667,
"p95_power_w": 699.505,
"avg_graphics_clock_mhz": 1155,
"p95_graphics_clock_mhz": 1182,
"avg_memory_clock_mhz": 2619,
"p95_memory_clock_mhz": 2619,
"avg_usage_pct": 100,
"avg_mem_usage_pct": 71.33333333333333,
"clock_cv_pct": 2.1207703400720157,
"power_cv_pct": 0.14121311398533568,
"temp_cv_pct": 2.6801800012908594,
"clock_drift_pct": 0
},
"teraops_per_sec": 1417.5994524991488,
"weighted_teraops_per_sec": 354.3998631247872,
"ecc": {
"corrected": 0,
"uncorrected": 0
}
},
{
"precision": "fp16",
"status": "OK",
"steady": {
"duration_sec": 170.809433267,
"samples": 3,
"avg_temp_c": 80.33333333333333,
"p95_temp_c": 80.9,
"avg_power_w": 698.3166666666666,
"p95_power_w": 698.579,
"avg_graphics_clock_mhz": 1150,
"p95_graphics_clock_mhz": 1167,
"avg_memory_clock_mhz": 2619,
"p95_memory_clock_mhz": 2619,
"avg_usage_pct": 100,
"avg_mem_usage_pct": 76,
"clock_cv_pct": 1.2297509238026914,
"power_cv_pct": 0.033365917310299316,
"temp_cv_pct": 0.5868106067938154,
"clock_drift_pct": 0
},
"teraops_per_sec": 605.7576061293909,
"weighted_teraops_per_sec": 302.87880306469543,
"ecc": {
"corrected": 0,
"uncorrected": 0
}
},
{
"precision": "fp32",
"status": "OK",
"steady": {
"duration_sec": 234.458143018,
"samples": 2,
"avg_temp_c": 81,
"p95_temp_c": 81,
"avg_power_w": 699.075,
"p95_power_w": 699.3315,
"avg_graphics_clock_mhz": 1185,
"p95_graphics_clock_mhz": 1185,
"avg_memory_clock_mhz": 2619,
"p95_memory_clock_mhz": 2619,
"avg_usage_pct": 100,
"avg_mem_usage_pct": 100,
"clock_cv_pct": 0,
"power_cv_pct": 0.04076815792297321,
"temp_cv_pct": 0,
"clock_drift_pct": 0
},
"teraops_per_sec": 329.0028834816,
"weighted_teraops_per_sec": 329.0028834816,
"ecc": {
"corrected": 0,
"uncorrected": 0
}
}
],
"cooldown": {
"duration_sec": 0,
"samples": 0,
"avg_temp_c": 0,
"p95_temp_c": 0,
"avg_power_w": 0,
"p95_power_w": 0,
"avg_graphics_clock_mhz": 0,
"p95_graphics_clock_mhz": 0,
"avg_memory_clock_mhz": 0,
"p95_memory_clock_mhz": 0,
"avg_usage_pct": 0,
"avg_mem_usage_pct": 0,
"clock_cv_pct": 0,
"power_cv_pct": 0,
"temp_cv_pct": 0,
"clock_drift_pct": 0
},
"throttle_counters": {
"sw_power_cap_us": 100016,
"sw_thermal_slowdown_us": 100016,
"sync_boost_us": 0,
"hw_thermal_slowdown_us": 0,
"hw_power_brake_slowdown_us": 0
},
"ecc": {
"corrected": 0,
"uncorrected": 0
},
"precision_results": [
{
"name": "fp16_tensor",
"category": "fp16_bf16",
"supported": true,
"lanes": 16,
"m": 10880,
"n": 10880,
"k": 10880,
"iterations": 25760,
"teraops_per_sec": 221.17767359146666,
"weight": 0.5,
"weighted_teraops_per_sec": 110.58883679573333
},
{
"name": "fp32_tf32",
"category": "fp32_tf32",
"supported": true,
"lanes": 16,
"m": 7680,
"n": 7680,
"k": 7680,
"iterations": 25760,
"teraops_per_sec": 77.7925951488,
"weight": 1,
"weighted_teraops_per_sec": 77.7925951488
},
{
"name": "fp64",
"category": "fp64",
"supported": false,
"weight": 2,
"notes": "benchmark_disabled"
},
{
"name": "fp8_e4m3",
"category": "fp8",
"supported": true,
"lanes": 16,
"m": 12544,
"n": 12544,
"k": 12544,
"iterations": 25760,
"teraops_per_sec": 338.9711491355989,
"weight": 0.25,
"weighted_teraops_per_sec": 84.74278728389973
},
{
"name": "fp8_e5m2",
"category": "fp8",
"supported": false,
"weight": 0.25,
"notes": "unsupported"
},
{
"name": "int8_tensor",
"category": "int8",
"supported": true,
"lanes": 16,
"m": 9728,
"n": 9728,
"k": 9728,
"iterations": 25760,
"teraops_per_sec": 158.09760300018348,
"weight": 0.25,
"weighted_teraops_per_sec": 39.52440075004587
}
],
"scores": {
"compute_score": 1367.3721922811767,
"synthetic_score": 1273.577606287633,
"mixed_score": 312.6486199784789,
"mixed_efficiency": 0.2454884715583389,
"power_sustain_score": 74.83848960808605,
"thermal_sustain_score": 74.77549203698788,
"stability_score": 99.97205731684326,
"thermal_throttle_pct": 0.013971341578371458,
"power_cap_throttle_pct": 0.013971341578371458,
"temp_headroom_c": 5,
"interconnect_score": 8.55,
"server_quality_score": 84.87301742025949,
"composite_score": 1367.3721922811767
},
"degradation_reasons": [
"low_sm_clock_vs_target"
]
},
{
"index": 1,
"uuid": "GPU-30b320aa-c18f-6b25-d0ed-24aeb14f1fd3",
"name": "NVIDIA H100 80GB HBM3",
"bus_id": "00000000:5A:00.0",
"vbios": "96.00.74.00.01",
"compute_capability": "9.0",
"backend": "cublasLt",
"status": "OK",
"power_limit_w": 700,
"default_power_limit_w": 700,
"max_graphics_clock_mhz": 1980,
"max_memory_clock_mhz": 2619,
"locked_graphics_clock_mhz": 1980,
"locked_memory_clock_mhz": 2619,
"baseline": {
"duration_sec": 20.487515832,
"samples": 1,
"avg_temp_c": 71,
"p95_temp_c": 71,
"avg_power_w": 173.85,
"p95_power_w": 173.85,
"avg_graphics_clock_mhz": 1830,
"p95_graphics_clock_mhz": 1830,
"avg_memory_clock_mhz": 2619,
"p95_memory_clock_mhz": 2619,
"avg_usage_pct": 0,
"avg_mem_usage_pct": 0,
"clock_cv_pct": 0,
"power_cv_pct": 0,
"temp_cv_pct": 0,
"clock_drift_pct": 0
},
"steady": {
"duration_sec": 715.865398029,
"samples": 21,
"avg_temp_c": 82.61904761904762,
"p95_temp_c": 85,
"avg_power_w": 634.0671428571428,
"p95_power_w": 698.06,
"avg_graphics_clock_mhz": 1260,
"p95_graphics_clock_mhz": 1830,
"avg_memory_clock_mhz": 2619,
"p95_memory_clock_mhz": 2619,
"avg_usage_pct": 85.71428571428571,
"avg_mem_usage_pct": 52.714285714285715,
"clock_cv_pct": 18.78719361094068,
"power_cv_pct": 23.244958976113367,
"temp_cv_pct": 5.633692511025891,
"clock_drift_pct": 0
},
"precision_steady": [
{
"precision": "int8",
"status": "OK",
"steady": {
"duration_sec": 51.349862924,
"samples": 2,
"avg_temp_c": 68.5,
"p95_temp_c": 72.55,
"avg_power_w": 472.435,
"p95_power_w": 675.3625,
"avg_graphics_clock_mhz": 1492.5,
"p95_graphics_clock_mhz": 1796.25,
"avg_memory_clock_mhz": 2619,
"p95_memory_clock_mhz": 2619,
"avg_usage_pct": 50,
"avg_mem_usage_pct": 41.5,
"clock_cv_pct": 22.613065326633166,
"power_cv_pct": 47.72614222062294,
"temp_cv_pct": 6.569343065693431,
"clock_drift_pct": 0
},
"teraops_per_sec": 1146.6986080960512,
"weighted_teraops_per_sec": 286.6746520240128,
"ecc": {
"corrected": 0,
"uncorrected": 0
}
},
{
"precision": "fp8",
"status": "OK",
"steady": {
"duration_sec": 112.097913814,
"samples": 3,
"avg_temp_c": 78.66666666666667,
"p95_temp_c": 79.9,
"avg_power_w": 697.9699999999999,
"p95_power_w": 698.582,
"avg_graphics_clock_mhz": 1085,
"p95_graphics_clock_mhz": 1134,
"avg_memory_clock_mhz": 2619,
"p95_memory_clock_mhz": 2619,
"avg_usage_pct": 100,
"avg_mem_usage_pct": 67,
"clock_cv_pct": 3.9642051921855423,
"power_cv_pct": 0.08413735466916311,
"temp_cv_pct": 1.5854480452431954,
"clock_drift_pct": 0
},
"teraops_per_sec": 1414.9347918741505,
"weighted_teraops_per_sec": 353.7336979685376,
"ecc": {
"corrected": 0,
"uncorrected": 0
}
},
{
"precision": "fp16",
"status": "OK",
"steady": {
"duration_sec": 170.809433267,
"samples": 3,
"avg_temp_c": 82,
"p95_temp_c": 82,
"avg_power_w": 698.6133333333333,
"p95_power_w": 698.958,
"avg_graphics_clock_mhz": 1095,
"p95_graphics_clock_mhz": 1095,
"avg_memory_clock_mhz": 2619,
"p95_memory_clock_mhz": 2619,
"avg_usage_pct": 100,
"avg_mem_usage_pct": 74.66666666666667,
"clock_cv_pct": 0,
"power_cv_pct": 0.04337475447501179,
"temp_cv_pct": 0,
"clock_drift_pct": 0
},
"teraops_per_sec": 605.7576061293909,
"weighted_teraops_per_sec": 302.87880306469543,
"ecc": {
"corrected": 0,
"uncorrected": 0
}
},
{
"precision": "fp32",
"status": "OK",
"steady": {
"duration_sec": 234.458143018,
"samples": 2,
"avg_temp_c": 81,
"p95_temp_c": 81,
"avg_power_w": 649.905,
"p95_power_w": 662.7615000000001,
"avg_graphics_clock_mhz": 1072.5,
"p95_graphics_clock_mhz": 1079.25,
"avg_memory_clock_mhz": 2619,
"p95_memory_clock_mhz": 2619,
"avg_usage_pct": 100,
"avg_mem_usage_pct": 99,
"clock_cv_pct": 0.6993006993006993,
"power_cv_pct": 2.1980135558273943,
"temp_cv_pct": 0,
"clock_drift_pct": 0
},
"teraops_per_sec": 328.3913539584,
"weighted_teraops_per_sec": 328.3913539584,
"ecc": {
"corrected": 0,
"uncorrected": 0
}
}
],
"cooldown": {
"duration_sec": 0,
"samples": 0,
"avg_temp_c": 0,
"p95_temp_c": 0,
"avg_power_w": 0,
"p95_power_w": 0,
"avg_graphics_clock_mhz": 0,
"p95_graphics_clock_mhz": 0,
"avg_memory_clock_mhz": 0,
"p95_memory_clock_mhz": 0,
"avg_usage_pct": 0,
"avg_mem_usage_pct": 0,
"clock_cv_pct": 0,
"power_cv_pct": 0,
"temp_cv_pct": 0,
"clock_drift_pct": 0
},
"throttle_counters": {
"sw_power_cap_us": 99988,
"sw_thermal_slowdown_us": 99988,
"sync_boost_us": 0,
"hw_thermal_slowdown_us": 0,
"hw_power_brake_slowdown_us": 0
},
"ecc": {
"corrected": 0,
"uncorrected": 0
},
"precision_results": [
{
"name": "fp16_tensor",
"category": "fp16_bf16",
"supported": true,
"lanes": 16,
"m": 10880,
"n": 10880,
"k": 10880,
"iterations": 24624,
"teraops_per_sec": 211.42387556352,
"weight": 0.5,
"weighted_teraops_per_sec": 105.71193778176
},
{
"name": "fp32_tf32",
"category": "fp32_tf32",
"supported": true,
"lanes": 16,
"m": 7680,
"n": 7680,
"k": 7680,
"iterations": 24624,
"teraops_per_sec": 74.36199002112,
"weight": 1,
"weighted_teraops_per_sec": 74.36199002112
},
{
"name": "fp64",
"category": "fp64",
"supported": false,
"weight": 2,
"notes": "benchmark_disabled"
},
{
"name": "fp8_e4m3",
"category": "fp8",
"supported": true,
"lanes": 16,
"m": 12544,
"n": 12544,
"k": 12544,
"iterations": 24624,
"teraops_per_sec": 324.02273199980544,
"weight": 0.25,
"weighted_teraops_per_sec": 81.00568299995136
},
{
"name": "fp8_e5m2",
"category": "fp8",
"supported": false,
"weight": 0.25,
"notes": "unsupported"
},
{
"name": "int8_tensor",
"category": "int8",
"supported": true,
"lanes": 16,
"m": 9728,
"n": 9728,
"k": 9728,
"iterations": 24624,
"teraops_per_sec": 151.1255969051443,
"weight": 0.25,
"weighted_teraops_per_sec": 37.78139922628608
}
],
"scores": {
"compute_score": 1361.336810024381,
"synthetic_score": 1271.678507015646,
"mixed_score": 298.86101002911744,
"mixed_efficiency": 0.23501302285156925,
"power_sustain_score": 73.25585575127133,
"thermal_sustain_score": 83.09892246692233,
"stability_score": 99.9720651395429,
"thermal_throttle_pct": 0.013967430228545486,
"power_cap_throttle_pct": 0.013967430228545486,
"temp_headroom_c": 5,
"interconnect_score": 8.55,
"server_quality_score": 86.89525952127526,
"composite_score": 1361.336810024381
},
"degradation_reasons": [
"low_sm_clock_vs_target"
]
},
{
"index": 2,
"uuid": "GPU-0182c11c-0c2c-aafd-0ada-113b64147ee6",
"name": "NVIDIA H100 80GB HBM3",
"bus_id": "00000000:C8:00.0",
"vbios": "96.00.74.00.01",
"compute_capability": "9.0",
"backend": "cublasLt",
"status": "OK",
"power_limit_w": 700,
"default_power_limit_w": 700,
"max_graphics_clock_mhz": 1980,
"max_memory_clock_mhz": 2619,
"locked_graphics_clock_mhz": 1980,
"locked_memory_clock_mhz": 2619,
"baseline": {
"duration_sec": 20.487515832,
"samples": 1,
"avg_temp_c": 66,
"p95_temp_c": 66,
"avg_power_w": 145.93,
"p95_power_w": 145.93,
"avg_graphics_clock_mhz": 1830,
"p95_graphics_clock_mhz": 1830,
"avg_memory_clock_mhz": 2619,
"p95_memory_clock_mhz": 2619,
"avg_usage_pct": 0,
"avg_mem_usage_pct": 0,
"clock_cv_pct": 0,
"power_cv_pct": 0,
"temp_cv_pct": 0,
"clock_drift_pct": 0
},
"steady": {
"duration_sec": 715.865398029,
"samples": 21,
"avg_temp_c": 80.61904761904762,
"p95_temp_c": 83,
"avg_power_w": 636.3133333333332,
"p95_power_w": 701.39,
"avg_graphics_clock_mhz": 1260,
"p95_graphics_clock_mhz": 1830,
"avg_memory_clock_mhz": 2619,
"p95_memory_clock_mhz": 2619,
"avg_usage_pct": 85.71428571428571,
"avg_mem_usage_pct": 50.19047619047619,
"clock_cv_pct": 18.653808797627907,
"power_cv_pct": 23.841801321120794,
"temp_cv_pct": 6.969375376219228,
"clock_drift_pct": 0
},
"precision_steady": [
{
"precision": "int8",
"status": "OK",
"steady": {
"duration_sec": 51.349862924,
"samples": 2,
"avg_temp_c": 66.5,
"p95_temp_c": 70.55,
"avg_power_w": 471.405,
"p95_power_w": 676.0065,
"avg_graphics_clock_mhz": 1500,
"p95_graphics_clock_mhz": 1797,
"avg_memory_clock_mhz": 2619,
"p95_memory_clock_mhz": 2619,
"avg_usage_pct": 50,
"avg_mem_usage_pct": 41.5,
"clock_cv_pct": 22,
"power_cv_pct": 48.224987006926106,
"temp_cv_pct": 6.7669172932330826,
"clock_drift_pct": 0
},
"teraops_per_sec": 1147.527147552768,
"weighted_teraops_per_sec": 286.881786888192,
"ecc": {
"corrected": 0,
"uncorrected": 0
}
},
{
"precision": "fp8",
"status": "OK",
"steady": {
"duration_sec": 112.097913814,
"samples": 3,
"avg_temp_c": 76,
"p95_temp_c": 77.8,
"avg_power_w": 699.94,
"p95_power_w": 701.489,
"avg_graphics_clock_mhz": 1140,
"p95_graphics_clock_mhz": 1153.5,
"avg_memory_clock_mhz": 2619,
"p95_memory_clock_mhz": 2619,
"avg_usage_pct": 100,
"avg_mem_usage_pct": 68.33333333333333,
"clock_cv_pct": 1.07433760648385,
"power_cv_pct": 0.18365617738503892,
"temp_cv_pct": 2.1486752129677,
"clock_drift_pct": 0
},
"teraops_per_sec": 1414.9347918741505,
"weighted_teraops_per_sec": 353.7336979685376,
"ecc": {
"corrected": 0,
"uncorrected": 0
}
},
{
"precision": "fp16",
"status": "OK",
"steady": {
"duration_sec": 170.809433267,
"samples": 3,
"avg_temp_c": 79.66666666666667,
"p95_temp_c": 80,
"avg_power_w": 698.0733333333333,
"p95_power_w": 698.9,
"avg_graphics_clock_mhz": 1140,
"p95_graphics_clock_mhz": 1191,
"avg_memory_clock_mhz": 2619,
"p95_memory_clock_mhz": 2619,
"avg_usage_pct": 100,
"avg_mem_usage_pct": 75,
"clock_cv_pct": 3.7216146378239348,
"power_cv_pct": 0.14423331175591858,
"temp_cv_pct": 0.5917211558046422,
"clock_drift_pct": 0
},
"teraops_per_sec": 605.7576061293909,
"weighted_teraops_per_sec": 302.87880306469543,
"ecc": {
"corrected": 0,
"uncorrected": 0
}
},
{
"precision": "fp32",
"status": "OK",
"steady": {
"duration_sec": 234.458143018,
"samples": 2,
"avg_temp_c": 80,
"p95_temp_c": 80,
"avg_power_w": 699.12,
"p95_power_w": 699.237,
"avg_graphics_clock_mhz": 1155,
"p95_graphics_clock_mhz": 1155,
"avg_memory_clock_mhz": 2619,
"p95_memory_clock_mhz": 2619,
"avg_usage_pct": 100,
"avg_mem_usage_pct": 100,
"clock_cv_pct": 0,
"power_cv_pct": 0.018594804897584888,
"temp_cv_pct": 0,
"clock_drift_pct": 0
},
"teraops_per_sec": 327.9836676096,
"weighted_teraops_per_sec": 327.9836676096,
"ecc": {
"corrected": 0,
"uncorrected": 0
}
}
],
"cooldown": {
"duration_sec": 0,
"samples": 0,
"avg_temp_c": 0,
"p95_temp_c": 0,
"avg_power_w": 0,
"p95_power_w": 0,
"avg_graphics_clock_mhz": 0,
"p95_graphics_clock_mhz": 0,
"avg_memory_clock_mhz": 0,
"p95_memory_clock_mhz": 0,
"avg_usage_pct": 0,
"avg_mem_usage_pct": 0,
"clock_cv_pct": 0,
"power_cv_pct": 0,
"temp_cv_pct": 0,
"clock_drift_pct": 0
},
"throttle_counters": {
"sw_power_cap_us": 200011,
"sw_thermal_slowdown_us": 200012,
"sync_boost_us": 0,
"hw_thermal_slowdown_us": 0,
"hw_power_brake_slowdown_us": 0
},
"ecc": {
"corrected": 0,
"uncorrected": 0
},
"precision_results": [
{
"name": "fp16_tensor",
"category": "fp16_bf16",
"supported": true,
"lanes": 16,
"m": 10880,
"n": 10880,
"k": 10880,
"iterations": 24640,
"teraops_per_sec": 211.56125300053336,
"weight": 0.5,
"weighted_teraops_per_sec": 105.78062650026668
},
{
"name": "fp32_tf32",
"category": "fp32_tf32",
"supported": true,
"lanes": 16,
"m": 7680,
"n": 7680,
"k": 7680,
"iterations": 24640,
"teraops_per_sec": 74.4103084032,
"weight": 1,
"weighted_teraops_per_sec": 74.4103084032
},
{
"name": "fp64",
"category": "fp64",
"supported": false,
"weight": 2,
"notes": "benchmark_disabled"
},
{
"name": "fp8_e4m3",
"category": "fp8",
"supported": true,
"lanes": 16,
"m": 12544,
"n": 12544,
"k": 12544,
"iterations": 24640,
"teraops_per_sec": 324.23327308622504,
"weight": 0.25,
"weighted_teraops_per_sec": 81.05831827155626
},
{
"name": "fp8_e5m2",
"category": "fp8",
"supported": false,
"weight": 0.25,
"notes": "unsupported"
},
{
"name": "int8_tensor",
"category": "int8",
"supported": true,
"lanes": 16,
"m": 9728,
"n": 9728,
"k": 9728,
"iterations": 24640,
"teraops_per_sec": 151.22379417408854,
"weight": 0.25,
"weighted_teraops_per_sec": 37.805948543522135
}
],
"scores": {
"compute_score": 1361.1945160465887,
"synthetic_score": 1271.477955531025,
"mixed_score": 299.05520171854505,
"mixed_efficiency": 0.2352028207942044,
"power_sustain_score": 74.7401367794711,
"thermal_sustain_score": 79.09187387134232,
"stability_score": 99.94412036102018,
"thermal_throttle_pct": 0.027939889335438648,
"power_cap_throttle_pct": 0.02793974964437344,
"temp_headroom_c": 7,
"interconnect_score": 8.55,
"server_quality_score": 86.1272513396521,
"composite_score": 1361.1945160465887
},
"degradation_reasons": [
"low_sm_clock_vs_target"
]
},
{
"index": 3,
"uuid": "GPU-9ee0af22-3dda-6f5c-1a13-35c63f324216",
"name": "NVIDIA H100 80GB HBM3",
"bus_id": "00000000:D8:00.0",
"vbios": "96.00.74.00.01",
"compute_capability": "9.0",
"backend": "cublasLt",
"status": "OK",
"power_limit_w": 700,
"default_power_limit_w": 700,
"max_graphics_clock_mhz": 1980,
"max_memory_clock_mhz": 2619,
"locked_graphics_clock_mhz": 1980,
"locked_memory_clock_mhz": 2619,
"baseline": {
"duration_sec": 20.487515832,
"samples": 1,
"avg_temp_c": 64,
"p95_temp_c": 64,
"avg_power_w": 112.32,
"p95_power_w": 112.32,
"avg_graphics_clock_mhz": 1980,
"p95_graphics_clock_mhz": 1980,
"avg_memory_clock_mhz": 2619,
"p95_memory_clock_mhz": 2619,
"avg_usage_pct": 0,
"avg_mem_usage_pct": 0,
"clock_cv_pct": 0,
"power_cv_pct": 0,
"temp_cv_pct": 0,
"clock_drift_pct": 0
},
"steady": {
"duration_sec": 715.865398029,
"samples": 21,
"avg_temp_c": 78.95238095238095,
"p95_temp_c": 82,
"avg_power_w": 615.5780952380953,
"p95_power_w": 699.76,
"avg_graphics_clock_mhz": 1307.142857142857,
"p95_graphics_clock_mhz": 1830,
"avg_memory_clock_mhz": 2619,
"p95_memory_clock_mhz": 2619,
"avg_usage_pct": 80.95238095238095,
"avg_mem_usage_pct": 47.476190476190474,
"clock_cv_pct": 19.6037061362318,
"power_cv_pct": 28.346418909802996,
"temp_cv_pct": 8.351205756656684,
"clock_drift_pct": 0
},
"precision_steady": [
{
"precision": "int8",
"status": "OK",
"steady": {
"duration_sec": 51.349862924,
"samples": 2,
"avg_temp_c": 64.5,
"p95_temp_c": 68.55,
"avg_power_w": 466.385,
"p95_power_w": 675.7744999999999,
"avg_graphics_clock_mhz": 1507.5,
"p95_graphics_clock_mhz": 1797.75,
"avg_memory_clock_mhz": 2619,
"p95_memory_clock_mhz": 2619,
"avg_usage_pct": 50,
"avg_mem_usage_pct": 41.5,
"clock_cv_pct": 21.393034825870647,
"power_cv_pct": 49.88475186809181,
"temp_cv_pct": 6.976744186046512,
"clock_drift_pct": 0
},
"teraops_per_sec": 1147.1128778244095,
"weighted_teraops_per_sec": 286.77821945610236,
"ecc": {
"corrected": 0,
"uncorrected": 0
}
},
{
"precision": "fp8",
"status": "OK",
"steady": {
"duration_sec": 112.097913814,
"samples": 3,
"avg_temp_c": 75,
"p95_temp_c": 76.8,
"avg_power_w": 698.8933333333334,
"p95_power_w": 699.885,
"avg_graphics_clock_mhz": 1140,
"p95_graphics_clock_mhz": 1167,
"avg_memory_clock_mhz": 2619,
"p95_memory_clock_mhz": 2619,
"avg_usage_pct": 100,
"avg_mem_usage_pct": 66.66666666666667,
"clock_cv_pct": 2.1486752129677,
"power_cv_pct": 0.11879844120756695,
"temp_cv_pct": 2.1773242158072694,
"clock_drift_pct": 0
},
"teraops_per_sec": 1415.8230120824833,
"weighted_teraops_per_sec": 353.9557530206208,
"ecc": {
"corrected": 0,
"uncorrected": 0
}
},
{
"precision": "fp16",
"status": "OK",
"steady": {
"duration_sec": 170.809433267,
"samples": 3,
"avg_temp_c": 78.66666666666667,
"p95_temp_c": 79,
"avg_power_w": 698.1666666666666,
"p95_power_w": 698.7339999999999,
"avg_graphics_clock_mhz": 1145,
"p95_graphics_clock_mhz": 1167,
"avg_memory_clock_mhz": 2619,
"p95_memory_clock_mhz": 2619,
"avg_usage_pct": 100,
"avg_mem_usage_pct": 74.66666666666667,
"clock_cv_pct": 1.6339115226087082,
"power_cv_pct": 0.0725584540138954,
"temp_cv_pct": 0.5992430349038538,
"clock_drift_pct": 0
},
"teraops_per_sec": 605.7576061293909,
"weighted_teraops_per_sec": 302.87880306469543,
"ecc": {
"corrected": 0,
"uncorrected": 0
}
},
{
"precision": "fp32",
"status": "OK",
"steady": {
"duration_sec": 234.458143018,
"samples": 2,
"avg_temp_c": 79,
"p95_temp_c": 79,
"avg_power_w": 698.85,
"p95_power_w": 698.967,
"avg_graphics_clock_mhz": 1162.5,
"p95_graphics_clock_mhz": 1169.25,
"avg_memory_clock_mhz": 2619,
"p95_memory_clock_mhz": 2619,
"avg_usage_pct": 100,
"avg_mem_usage_pct": 100,
"clock_cv_pct": 0.6451612903225806,
"power_cv_pct": 0.01860198898189818,
"temp_cv_pct": 0,
"clock_drift_pct": 0
},
"teraops_per_sec": 328.3913539584,
"weighted_teraops_per_sec": 328.3913539584,
"ecc": {
"corrected": 0,
"uncorrected": 0
}
}
],
"cooldown": {
"duration_sec": 0,
"samples": 0,
"avg_temp_c": 0,
"p95_temp_c": 0,
"avg_power_w": 0,
"p95_power_w": 0,
"avg_graphics_clock_mhz": 0,
"p95_graphics_clock_mhz": 0,
"avg_memory_clock_mhz": 0,
"p95_memory_clock_mhz": 0,
"avg_usage_pct": 0,
"avg_mem_usage_pct": 0,
"clock_cv_pct": 0,
"power_cv_pct": 0,
"temp_cv_pct": 0,
"clock_drift_pct": 0
},
"throttle_counters": {
"sw_power_cap_us": 200033,
"sw_thermal_slowdown_us": 200033,
"sync_boost_us": 0,
"hw_thermal_slowdown_us": 0,
"hw_power_brake_slowdown_us": 0
},
"ecc": {
"corrected": 0,
"uncorrected": 0
},
"precision_results": [
{
"name": "fp16_tensor",
"category": "fp16_bf16",
"supported": true,
"lanes": 16,
"m": 10880,
"n": 10880,
"k": 10880,
"iterations": 24640,
"teraops_per_sec": 211.56125300053336,
"weight": 0.5,
"weighted_teraops_per_sec": 105.78062650026668
},
{
"name": "fp32_tf32",
"category": "fp32_tf32",
"supported": true,
"lanes": 16,
"m": 7680,
"n": 7680,
"k": 7680,
"iterations": 24640,
"teraops_per_sec": 74.4103084032,
"weight": 1,
"weighted_teraops_per_sec": 74.4103084032
},
{
"name": "fp64",
"category": "fp64",
"supported": false,
"weight": 2,
"notes": "benchmark_disabled"
},
{
"name": "fp8_e4m3",
"category": "fp8",
"supported": true,
"lanes": 16,
"m": 12544,
"n": 12544,
"k": 12544,
"iterations": 24640,
"teraops_per_sec": 324.23327308622504,
"weight": 0.25,
"weighted_teraops_per_sec": 81.05831827155626
},
{
"name": "fp8_e5m2",
"category": "fp8",
"supported": false,
"weight": 0.25,
"notes": "unsupported"
},
{
"name": "int8_tensor",
"category": "int8",
"supported": true,
"lanes": 16,
"m": 9728,
"n": 9728,
"k": 9728,
"iterations": 24640,
"teraops_per_sec": 151.22379417408854,
"weight": 0.25,
"weighted_teraops_per_sec": 37.805948543522135
}
],
"scores": {
"compute_score": 1361.7206900153822,
"synthetic_score": 1272.0041294998186,
"mixed_score": 299.05520171854505,
"mixed_efficiency": 0.23510552739804425,
"power_sustain_score": 74.84253083684747,
"thermal_sustain_score": 74.94638273002994,
"stability_score": 99.94411435430439,
"thermal_throttle_pct": 0.027942822847808132,
"power_cap_throttle_pct": 0.027942822847808132,
"temp_headroom_c": 8,
"interconnect_score": 8.55,
"server_quality_score": 84.91431981178498,
"composite_score": 1361.7206900153822
},
"degradation_reasons": [
"low_sm_clock_vs_target"
]
}
],
"interconnect": {
"status": "OK",
"attempted": true,
"supported": true,
"selected_gpu_indices": [
0,
1,
2,
3
],
"avg_algbw_gbps": 5.61,
"max_algbw_gbps": 5.7,
"avg_busbw_gbps": 8.415,
"max_busbw_gbps": 8.55
},
"server_power": {
"available": false,
"notes": [
"IPMI power reading unavailable; server-side power characterization skipped"
]
}
}