2024-04-10
This commit is contained in:
575
gpu-benchmark-20260410-184145/result.json
Executable file
575
gpu-benchmark-20260410-184145/result.json
Executable file
@@ -0,0 +1,575 @@
|
||||
{
|
||||
"benchmark_version": "1",
|
||||
"generated_at": "2026-04-10T18:41:45.128862028Z",
|
||||
"hostname": "debian",
|
||||
"server_model": "G5500 V7",
|
||||
"benchmark_profile": "standard",
|
||||
"overall_status": "PARTIAL",
|
||||
"selected_gpu_indices": [
|
||||
0,
|
||||
1,
|
||||
2,
|
||||
3
|
||||
],
|
||||
"findings": [
|
||||
"All 4 GPU(s) passed the benchmark.",
|
||||
"Environment normalization was partial; compare results with caution.",
|
||||
"GPU 0 ran without full benchmark normalization.",
|
||||
"GPU 1 ran without full benchmark normalization.",
|
||||
"GPU 2 showed unstable clocks/power over the benchmark window.",
|
||||
"GPU 2 ran without full benchmark normalization.",
|
||||
"GPU 3 ran without full benchmark normalization.",
|
||||
"GPU power reporting may be unreliable: server delta 1310 W vs GPU-reported 2088 W (ratio 0.63). GPU telemetry likely over-reports actual consumption."
|
||||
],
|
||||
"warnings": [
|
||||
"gpu inventory query failed: nvidia-smi gpu info (index,uuid,name,pci.bus_id,vbios_version): exit status 2"
|
||||
],
|
||||
"normalization": {
|
||||
"status": "partial",
|
||||
"gpus": [
|
||||
{
|
||||
"index": 0,
|
||||
"persistence_mode": "applied",
|
||||
"gpu_clock_lock_status": "skipped",
|
||||
"notes": [
|
||||
"graphics clock lock skipped: gpu inventory unavailable or MaxGraphicsClockMHz=0"
|
||||
]
|
||||
},
|
||||
{
|
||||
"index": 1,
|
||||
"persistence_mode": "applied",
|
||||
"gpu_clock_lock_status": "skipped",
|
||||
"notes": [
|
||||
"graphics clock lock skipped: gpu inventory unavailable or MaxGraphicsClockMHz=0"
|
||||
]
|
||||
},
|
||||
{
|
||||
"index": 2,
|
||||
"persistence_mode": "applied",
|
||||
"gpu_clock_lock_status": "skipped",
|
||||
"notes": [
|
||||
"graphics clock lock skipped: gpu inventory unavailable or MaxGraphicsClockMHz=0"
|
||||
]
|
||||
},
|
||||
{
|
||||
"index": 3,
|
||||
"persistence_mode": "applied",
|
||||
"gpu_clock_lock_status": "skipped",
|
||||
"notes": [
|
||||
"graphics clock lock skipped: gpu inventory unavailable or MaxGraphicsClockMHz=0"
|
||||
]
|
||||
}
|
||||
]
|
||||
},
|
||||
"gpus": [
|
||||
{
|
||||
"index": 0,
|
||||
"compute_capability": "12.0",
|
||||
"backend": "cublasLt",
|
||||
"status": "OK",
|
||||
"baseline": {
|
||||
"duration_sec": 15.64054741,
|
||||
"samples": 16,
|
||||
"avg_temp_c": 32,
|
||||
"p95_temp_c": 32,
|
||||
"avg_power_w": 35.71249999999999,
|
||||
"p95_power_w": 35.9375,
|
||||
"avg_graphics_clock_mhz": 180,
|
||||
"p95_graphics_clock_mhz": 180,
|
||||
"avg_memory_clock_mhz": 405,
|
||||
"p95_memory_clock_mhz": 405,
|
||||
"avg_usage_pct": 0,
|
||||
"avg_mem_usage_pct": 0,
|
||||
"clock_cv_pct": 0,
|
||||
"power_cv_pct": 0.38374434928010487,
|
||||
"temp_cv_pct": 0,
|
||||
"clock_drift_pct": 0
|
||||
},
|
||||
"steady": {
|
||||
"duration_sec": 517.039794776,
|
||||
"samples": 517,
|
||||
"avg_temp_c": 71.82978723404256,
|
||||
"p95_temp_c": 73,
|
||||
"avg_power_w": 526.566344294004,
|
||||
"p95_power_w": 537.342,
|
||||
"avg_graphics_clock_mhz": 2421.6382978723404,
|
||||
"p95_graphics_clock_mhz": 2422,
|
||||
"avg_memory_clock_mhz": 12481,
|
||||
"p95_memory_clock_mhz": 12481,
|
||||
"avg_usage_pct": 99.52417794970987,
|
||||
"avg_mem_usage_pct": 39.276595744680854,
|
||||
"clock_cv_pct": 0.33928654551992987,
|
||||
"power_cv_pct": 6.134300387584527,
|
||||
"temp_cv_pct": 1.6164905348919567,
|
||||
"clock_drift_pct": 0.059851874611918786
|
||||
},
|
||||
"cooldown": {
|
||||
"duration_sec": 120.692879388,
|
||||
"samples": 117,
|
||||
"avg_temp_c": 45.46153846153846,
|
||||
"p95_temp_c": 54.19999999999999,
|
||||
"avg_power_w": 40.62282051282055,
|
||||
"p95_power_w": 55.827999999999996,
|
||||
"avg_graphics_clock_mhz": 200.30769230769232,
|
||||
"p95_graphics_clock_mhz": 180,
|
||||
"avg_memory_clock_mhz": 1643.5641025641025,
|
||||
"p95_memory_clock_mhz": 12481,
|
||||
"avg_usage_pct": 0,
|
||||
"avg_mem_usage_pct": 0,
|
||||
"clock_cv_pct": 95.08186420156572,
|
||||
"power_cv_pct": 13.397079812097019,
|
||||
"temp_cv_pct": 8.815261908432287,
|
||||
"clock_drift_pct": 31.35192004208311
|
||||
},
|
||||
"throttle_counters": {
|
||||
"sw_power_cap_us": 0,
|
||||
"sw_thermal_slowdown_us": 0,
|
||||
"sync_boost_us": 0,
|
||||
"hw_thermal_slowdown_us": 0,
|
||||
"hw_power_brake_slowdown_us": 0
|
||||
},
|
||||
"precision_results": [
|
||||
{
|
||||
"name": "fp16_tensor",
|
||||
"category": "fp16_bf16",
|
||||
"supported": true,
|
||||
"lanes": 16,
|
||||
"m": 11904,
|
||||
"n": 11904,
|
||||
"k": 11904,
|
||||
"iterations": 27840,
|
||||
"teraops_per_sec": 195.675631386624
|
||||
},
|
||||
{
|
||||
"name": "fp32_tf32",
|
||||
"category": "fp32_tf32",
|
||||
"supported": true,
|
||||
"lanes": 16,
|
||||
"m": 8320,
|
||||
"n": 8320,
|
||||
"k": 8320,
|
||||
"iterations": 27840,
|
||||
"teraops_per_sec": 66.807922688
|
||||
},
|
||||
{
|
||||
"name": "fp64",
|
||||
"category": "fp64",
|
||||
"supported": false,
|
||||
"notes": "unsupported"
|
||||
},
|
||||
{
|
||||
"name": "fp8_e4m3",
|
||||
"category": "fp8",
|
||||
"supported": true,
|
||||
"lanes": 16,
|
||||
"m": 13696,
|
||||
"n": 13696,
|
||||
"k": 13696,
|
||||
"iterations": 27840,
|
||||
"teraops_per_sec": 298.015759794176
|
||||
},
|
||||
{
|
||||
"name": "fp8_e5m2",
|
||||
"category": "fp8",
|
||||
"supported": false,
|
||||
"notes": "unsupported"
|
||||
}
|
||||
],
|
||||
"scores": {
|
||||
"compute_score": 560.4993138688001,
|
||||
"power_sustain_score": 0,
|
||||
"thermal_sustain_score": 100,
|
||||
"stability_score": 86.25454929352739,
|
||||
"interconnect_score": 0,
|
||||
"composite_score": 432.9908197154495
|
||||
},
|
||||
"degradation_reasons": [
|
||||
"normalization_partial"
|
||||
]
|
||||
},
|
||||
{
|
||||
"index": 1,
|
||||
"compute_capability": "12.0",
|
||||
"backend": "cublasLt",
|
||||
"status": "OK",
|
||||
"baseline": {
|
||||
"duration_sec": 15.648620713,
|
||||
"samples": 16,
|
||||
"avg_temp_c": 33,
|
||||
"p95_temp_c": 33,
|
||||
"avg_power_w": 34.43125000000001,
|
||||
"p95_power_w": 34.83,
|
||||
"avg_graphics_clock_mhz": 180,
|
||||
"p95_graphics_clock_mhz": 180,
|
||||
"avg_memory_clock_mhz": 405,
|
||||
"p95_memory_clock_mhz": 405,
|
||||
"avg_usage_pct": 0,
|
||||
"avg_mem_usage_pct": 0,
|
||||
"clock_cv_pct": 0,
|
||||
"power_cv_pct": 0.49361738151609885,
|
||||
"temp_cv_pct": 0,
|
||||
"clock_drift_pct": 0
|
||||
},
|
||||
"steady": {
|
||||
"duration_sec": 517.039712514,
|
||||
"samples": 517,
|
||||
"avg_temp_c": 72.47969052224371,
|
||||
"p95_temp_c": 74,
|
||||
"avg_power_w": 525.4105029013539,
|
||||
"p95_power_w": 533.974,
|
||||
"avg_graphics_clock_mhz": 2422.015473887814,
|
||||
"p95_graphics_clock_mhz": 2422,
|
||||
"avg_memory_clock_mhz": 12481,
|
||||
"p95_memory_clock_mhz": 12481,
|
||||
"avg_usage_pct": 99.61315280464217,
|
||||
"avg_mem_usage_pct": 39.15860735009671,
|
||||
"clock_cv_pct": 0.014512672044927075,
|
||||
"power_cv_pct": 5.368261116854865,
|
||||
"temp_cv_pct": 1.8072124291831093,
|
||||
"clock_drift_pct": 0
|
||||
},
|
||||
"cooldown": {
|
||||
"duration_sec": 120.671014238,
|
||||
"samples": 117,
|
||||
"avg_temp_c": 45.38461538461539,
|
||||
"p95_temp_c": 54,
|
||||
"avg_power_w": 38.87683760683761,
|
||||
"p95_power_w": 53.337999999999994,
|
||||
"avg_graphics_clock_mhz": 189.5982905982906,
|
||||
"p95_graphics_clock_mhz": 180,
|
||||
"avg_memory_clock_mhz": 1643.5641025641025,
|
||||
"p95_memory_clock_mhz": 12481,
|
||||
"avg_usage_pct": 0,
|
||||
"avg_mem_usage_pct": 0,
|
||||
"clock_cv_pct": 46.5414056859924,
|
||||
"power_cv_pct": 13.395397467444464,
|
||||
"temp_cv_pct": 8.157534756058777,
|
||||
"clock_drift_pct": 17.934183593134943
|
||||
},
|
||||
"throttle_counters": {
|
||||
"sw_power_cap_us": 0,
|
||||
"sw_thermal_slowdown_us": 0,
|
||||
"sync_boost_us": 0,
|
||||
"hw_thermal_slowdown_us": 0,
|
||||
"hw_power_brake_slowdown_us": 0
|
||||
},
|
||||
"precision_results": [
|
||||
{
|
||||
"name": "fp16_tensor",
|
||||
"category": "fp16_bf16",
|
||||
"supported": true,
|
||||
"lanes": 16,
|
||||
"m": 11904,
|
||||
"n": 11904,
|
||||
"k": 11904,
|
||||
"iterations": 27840,
|
||||
"teraops_per_sec": 195.675631386624
|
||||
},
|
||||
{
|
||||
"name": "fp32_tf32",
|
||||
"category": "fp32_tf32",
|
||||
"supported": true,
|
||||
"lanes": 16,
|
||||
"m": 8320,
|
||||
"n": 8320,
|
||||
"k": 8320,
|
||||
"iterations": 27840,
|
||||
"teraops_per_sec": 66.807922688
|
||||
},
|
||||
{
|
||||
"name": "fp64",
|
||||
"category": "fp64",
|
||||
"supported": false,
|
||||
"notes": "unsupported"
|
||||
},
|
||||
{
|
||||
"name": "fp8_e4m3",
|
||||
"category": "fp8",
|
||||
"supported": true,
|
||||
"lanes": 16,
|
||||
"m": 13696,
|
||||
"n": 13696,
|
||||
"k": 13696,
|
||||
"iterations": 27840,
|
||||
"teraops_per_sec": 298.015759794176
|
||||
},
|
||||
{
|
||||
"name": "fp8_e5m2",
|
||||
"category": "fp8",
|
||||
"supported": false,
|
||||
"notes": "unsupported"
|
||||
}
|
||||
],
|
||||
"scores": {
|
||||
"compute_score": 560.4993138688001,
|
||||
"power_sustain_score": 0,
|
||||
"thermal_sustain_score": 100,
|
||||
"stability_score": 89.20542707811056,
|
||||
"interconnect_score": 0,
|
||||
"composite_score": 436.2987496625886
|
||||
},
|
||||
"degradation_reasons": [
|
||||
"normalization_partial"
|
||||
]
|
||||
},
|
||||
{
|
||||
"index": 2,
|
||||
"compute_capability": "12.0",
|
||||
"backend": "cublasLt",
|
||||
"status": "OK",
|
||||
"baseline": {
|
||||
"duration_sec": 15.646607951,
|
||||
"samples": 16,
|
||||
"avg_temp_c": 28.625,
|
||||
"p95_temp_c": 29,
|
||||
"avg_power_w": 35.14999999999999,
|
||||
"p95_power_w": 35.15,
|
||||
"avg_graphics_clock_mhz": 180,
|
||||
"p95_graphics_clock_mhz": 180,
|
||||
"avg_memory_clock_mhz": 405,
|
||||
"p95_memory_clock_mhz": 405,
|
||||
"avg_usage_pct": 0,
|
||||
"avg_mem_usage_pct": 0,
|
||||
"clock_cv_pct": 0,
|
||||
"power_cv_pct": 2.0214587077101006e-14,
|
||||
"temp_cv_pct": 1.6912591031473436,
|
||||
"clock_drift_pct": 0
|
||||
},
|
||||
"steady": {
|
||||
"duration_sec": 517.039507345,
|
||||
"samples": 517,
|
||||
"avg_temp_c": 70.29013539651838,
|
||||
"p95_temp_c": 73,
|
||||
"avg_power_w": 519.9781431334626,
|
||||
"p95_power_w": 529.014,
|
||||
"avg_graphics_clock_mhz": 2418.79497098646,
|
||||
"p95_graphics_clock_mhz": 2422,
|
||||
"avg_memory_clock_mhz": 12481,
|
||||
"p95_memory_clock_mhz": 12481,
|
||||
"avg_usage_pct": 99.42166344294004,
|
||||
"avg_mem_usage_pct": 39.353965183752415,
|
||||
"clock_cv_pct": 3.0099394503204846,
|
||||
"power_cv_pct": 6.244661163316872,
|
||||
"temp_cv_pct": 2.439779963276932,
|
||||
"clock_drift_pct": 0.530345220491747
|
||||
},
|
||||
"cooldown": {
|
||||
"duration_sec": 120.657452543,
|
||||
"samples": 117,
|
||||
"avg_temp_c": 44.623931623931625,
|
||||
"p95_temp_c": 52.19999999999999,
|
||||
"avg_power_w": 40.580256410256354,
|
||||
"p95_power_w": 54.64799999999999,
|
||||
"avg_graphics_clock_mhz": 186.07692307692307,
|
||||
"p95_graphics_clock_mhz": 180,
|
||||
"avg_memory_clock_mhz": 1643.5641025641025,
|
||||
"p95_memory_clock_mhz": 12481,
|
||||
"avg_usage_pct": 0,
|
||||
"avg_mem_usage_pct": 0,
|
||||
"clock_cv_pct": 29.666924389599842,
|
||||
"power_cv_pct": 12.772094703863496,
|
||||
"temp_cv_pct": 8.475122734640708,
|
||||
"clock_drift_pct": 12.241118033338953
|
||||
},
|
||||
"throttle_counters": {
|
||||
"sw_power_cap_us": 0,
|
||||
"sw_thermal_slowdown_us": 0,
|
||||
"sync_boost_us": 0,
|
||||
"hw_thermal_slowdown_us": 0,
|
||||
"hw_power_brake_slowdown_us": 0
|
||||
},
|
||||
"precision_results": [
|
||||
{
|
||||
"name": "fp16_tensor",
|
||||
"category": "fp16_bf16",
|
||||
"supported": true,
|
||||
"lanes": 16,
|
||||
"m": 11904,
|
||||
"n": 11904,
|
||||
"k": 11904,
|
||||
"iterations": 27840,
|
||||
"teraops_per_sec": 195.675631386624
|
||||
},
|
||||
{
|
||||
"name": "fp32_tf32",
|
||||
"category": "fp32_tf32",
|
||||
"supported": true,
|
||||
"lanes": 16,
|
||||
"m": 8320,
|
||||
"n": 8320,
|
||||
"k": 8320,
|
||||
"iterations": 27840,
|
||||
"teraops_per_sec": 66.807922688
|
||||
},
|
||||
{
|
||||
"name": "fp64",
|
||||
"category": "fp64",
|
||||
"supported": false,
|
||||
"notes": "unsupported"
|
||||
},
|
||||
{
|
||||
"name": "fp8_e4m3",
|
||||
"category": "fp8",
|
||||
"supported": true,
|
||||
"lanes": 16,
|
||||
"m": 13696,
|
||||
"n": 13696,
|
||||
"k": 13696,
|
||||
"iterations": 27840,
|
||||
"teraops_per_sec": 298.015759794176
|
||||
},
|
||||
{
|
||||
"name": "fp8_e5m2",
|
||||
"category": "fp8",
|
||||
"supported": false,
|
||||
"notes": "unsupported"
|
||||
}
|
||||
],
|
||||
"scores": {
|
||||
"compute_score": 560.4993138688001,
|
||||
"power_sustain_score": 0,
|
||||
"thermal_sustain_score": 100,
|
||||
"stability_score": 74.41022943110082,
|
||||
"interconnect_score": 0,
|
||||
"composite_score": 419.7133534031841
|
||||
},
|
||||
"degradation_reasons": [
|
||||
"variance_too_high",
|
||||
"normalization_partial"
|
||||
]
|
||||
},
|
||||
{
|
||||
"index": 3,
|
||||
"compute_capability": "12.0",
|
||||
"backend": "cublasLt",
|
||||
"status": "OK",
|
||||
"baseline": {
|
||||
"duration_sec": 15.640129253,
|
||||
"samples": 16,
|
||||
"avg_temp_c": 30.375,
|
||||
"p95_temp_c": 31,
|
||||
"avg_power_w": 34.65437499999999,
|
||||
"p95_power_w": 34.66,
|
||||
"avg_graphics_clock_mhz": 179.5,
|
||||
"p95_graphics_clock_mhz": 180,
|
||||
"avg_memory_clock_mhz": 405,
|
||||
"p95_memory_clock_mhz": 405,
|
||||
"avg_usage_pct": 0,
|
||||
"avg_mem_usage_pct": 0,
|
||||
"clock_cv_pct": 1.0788254446260215,
|
||||
"power_cv_pct": 0.01431502864571969,
|
||||
"temp_cv_pct": 1.5938203070812416,
|
||||
"clock_drift_pct": 0
|
||||
},
|
||||
"steady": {
|
||||
"duration_sec": 517.039084611,
|
||||
"samples": 517,
|
||||
"avg_temp_c": 70.26305609284333,
|
||||
"p95_temp_c": 71,
|
||||
"avg_power_w": 515.7172727272728,
|
||||
"p95_power_w": 522.364,
|
||||
"avg_graphics_clock_mhz": 2422,
|
||||
"p95_graphics_clock_mhz": 2422,
|
||||
"avg_memory_clock_mhz": 12481,
|
||||
"p95_memory_clock_mhz": 12481,
|
||||
"avg_usage_pct": 99.61315280464217,
|
||||
"avg_mem_usage_pct": 39.22437137330754,
|
||||
"clock_cv_pct": 0,
|
||||
"power_cv_pct": 5.764080613784593,
|
||||
"temp_cv_pct": 1.5613533584243726,
|
||||
"clock_drift_pct": 0
|
||||
},
|
||||
"cooldown": {
|
||||
"duration_sec": 120.710135838,
|
||||
"samples": 117,
|
||||
"avg_temp_c": 44.58974358974359,
|
||||
"p95_temp_c": 52,
|
||||
"avg_power_w": 39.0471794871795,
|
||||
"p95_power_w": 52.519999999999996,
|
||||
"avg_graphics_clock_mhz": 186.97435897435898,
|
||||
"p95_graphics_clock_mhz": 180,
|
||||
"avg_memory_clock_mhz": 1643.5641025641025,
|
||||
"p95_memory_clock_mhz": 12481,
|
||||
"avg_usage_pct": 0,
|
||||
"avg_mem_usage_pct": 0,
|
||||
"clock_cv_pct": 27.466449046011803,
|
||||
"power_cv_pct": 12.490801537100193,
|
||||
"temp_cv_pct": 8.28381511460339,
|
||||
"clock_drift_pct": 13.747521480502309
|
||||
},
|
||||
"throttle_counters": {
|
||||
"sw_power_cap_us": 0,
|
||||
"sw_thermal_slowdown_us": 0,
|
||||
"sync_boost_us": 0,
|
||||
"hw_thermal_slowdown_us": 0,
|
||||
"hw_power_brake_slowdown_us": 0
|
||||
},
|
||||
"precision_results": [
|
||||
{
|
||||
"name": "fp16_tensor",
|
||||
"category": "fp16_bf16",
|
||||
"supported": true,
|
||||
"lanes": 16,
|
||||
"m": 11904,
|
||||
"n": 11904,
|
||||
"k": 11904,
|
||||
"iterations": 27840,
|
||||
"teraops_per_sec": 195.675631386624
|
||||
},
|
||||
{
|
||||
"name": "fp32_tf32",
|
||||
"category": "fp32_tf32",
|
||||
"supported": true,
|
||||
"lanes": 16,
|
||||
"m": 8320,
|
||||
"n": 8320,
|
||||
"k": 8320,
|
||||
"iterations": 27840,
|
||||
"teraops_per_sec": 66.807922688
|
||||
},
|
||||
{
|
||||
"name": "fp64",
|
||||
"category": "fp64",
|
||||
"supported": false,
|
||||
"notes": "unsupported"
|
||||
},
|
||||
{
|
||||
"name": "fp8_e4m3",
|
||||
"category": "fp8",
|
||||
"supported": true,
|
||||
"lanes": 16,
|
||||
"m": 13696,
|
||||
"n": 13696,
|
||||
"k": 13696,
|
||||
"iterations": 27840,
|
||||
"teraops_per_sec": 298.015759794176
|
||||
},
|
||||
{
|
||||
"name": "fp8_e5m2",
|
||||
"category": "fp8",
|
||||
"supported": false,
|
||||
"notes": "unsupported"
|
||||
}
|
||||
],
|
||||
"scores": {
|
||||
"compute_score": 560.4993138688001,
|
||||
"power_sustain_score": 0,
|
||||
"thermal_sustain_score": 100,
|
||||
"stability_score": 88.47183877243081,
|
||||
"interconnect_score": 0,
|
||||
"composite_score": 435.47639817859726
|
||||
},
|
||||
"degradation_reasons": [
|
||||
"normalization_partial"
|
||||
]
|
||||
}
|
||||
],
|
||||
"server_power": {
|
||||
"available": true,
|
||||
"idle_w": 632,
|
||||
"loaded_w": 1942.2352941176468,
|
||||
"delta_w": 1310.2352941176468,
|
||||
"gpu_reported_sum_w": 2087.6722630560935,
|
||||
"reporting_ratio": 0.6276058351226187
|
||||
}
|
||||
}
|
||||
581
gpu-benchmark-20260410-193819/result.json
Executable file
581
gpu-benchmark-20260410-193819/result.json
Executable file
@@ -0,0 +1,581 @@
|
||||
{
|
||||
"benchmark_version": "1",
|
||||
"generated_at": "2026-04-10T19:38:19.724808089Z",
|
||||
"hostname": "debian",
|
||||
"server_model": "G5500 V7",
|
||||
"benchmark_profile": "standard",
|
||||
"parallel_gpus": true,
|
||||
"overall_status": "PARTIAL",
|
||||
"selected_gpu_indices": [
|
||||
0,
|
||||
1,
|
||||
2,
|
||||
3
|
||||
],
|
||||
"findings": [
|
||||
"All 4 GPU(s) passed the benchmark.",
|
||||
"Environment normalization was partial; compare results with caution.",
|
||||
"GPU 0 showed unstable clocks/power over the benchmark window.",
|
||||
"GPU 0 ran without full benchmark normalization.",
|
||||
"GPU 1 showed unstable clocks/power over the benchmark window.",
|
||||
"GPU 1 ran without full benchmark normalization.",
|
||||
"GPU 2 showed unstable clocks/power over the benchmark window.",
|
||||
"GPU 2 ran without full benchmark normalization.",
|
||||
"GPU 3 showed unstable clocks/power over the benchmark window.",
|
||||
"GPU 3 ran without full benchmark normalization."
|
||||
],
|
||||
"warnings": [
|
||||
"gpu inventory query failed: nvidia-smi gpu info (index,uuid,name,pci.bus_id,vbios_version): exit status 2"
|
||||
],
|
||||
"normalization": {
|
||||
"status": "partial",
|
||||
"gpus": [
|
||||
{
|
||||
"index": 0,
|
||||
"persistence_mode": "applied",
|
||||
"gpu_clock_lock_status": "skipped",
|
||||
"notes": [
|
||||
"graphics clock lock skipped: gpu inventory unavailable or MaxGraphicsClockMHz=0"
|
||||
]
|
||||
},
|
||||
{
|
||||
"index": 1,
|
||||
"persistence_mode": "applied",
|
||||
"gpu_clock_lock_status": "skipped",
|
||||
"notes": [
|
||||
"graphics clock lock skipped: gpu inventory unavailable or MaxGraphicsClockMHz=0"
|
||||
]
|
||||
},
|
||||
{
|
||||
"index": 2,
|
||||
"persistence_mode": "applied",
|
||||
"gpu_clock_lock_status": "skipped",
|
||||
"notes": [
|
||||
"graphics clock lock skipped: gpu inventory unavailable or MaxGraphicsClockMHz=0"
|
||||
]
|
||||
},
|
||||
{
|
||||
"index": 3,
|
||||
"persistence_mode": "applied",
|
||||
"gpu_clock_lock_status": "skipped",
|
||||
"notes": [
|
||||
"graphics clock lock skipped: gpu inventory unavailable or MaxGraphicsClockMHz=0"
|
||||
]
|
||||
}
|
||||
]
|
||||
},
|
||||
"gpus": [
|
||||
{
|
||||
"index": 0,
|
||||
"compute_capability": "12.0",
|
||||
"backend": "cublasLt",
|
||||
"status": "OK",
|
||||
"baseline": {
|
||||
"duration_sec": 15.708738197,
|
||||
"samples": 16,
|
||||
"avg_temp_c": 31.5,
|
||||
"p95_temp_c": 32,
|
||||
"avg_power_w": 35.63999999999999,
|
||||
"p95_power_w": 35.64,
|
||||
"avg_graphics_clock_mhz": 180,
|
||||
"p95_graphics_clock_mhz": 180,
|
||||
"avg_memory_clock_mhz": 405,
|
||||
"p95_memory_clock_mhz": 405,
|
||||
"avg_usage_pct": 0,
|
||||
"avg_mem_usage_pct": 0,
|
||||
"clock_cv_pct": 0,
|
||||
"power_cv_pct": 1.9936664864200346e-14,
|
||||
"temp_cv_pct": 1.5873015873015872,
|
||||
"clock_drift_pct": 0
|
||||
},
|
||||
"steady": {
|
||||
"duration_sec": 521.038266969,
|
||||
"samples": 521,
|
||||
"avg_temp_c": 71.51247600767755,
|
||||
"p95_temp_c": 72,
|
||||
"avg_power_w": 521.897197696737,
|
||||
"p95_power_w": 532,
|
||||
"avg_graphics_clock_mhz": 2405.7063339731285,
|
||||
"p95_graphics_clock_mhz": 2422,
|
||||
"avg_memory_clock_mhz": 12481,
|
||||
"p95_memory_clock_mhz": 12481,
|
||||
"avg_usage_pct": 98.69481765834932,
|
||||
"avg_mem_usage_pct": 38.351247600767756,
|
||||
"clock_cv_pct": 7.7140057202952,
|
||||
"power_cv_pct": 9.892799596716745,
|
||||
"temp_cv_pct": 2.580458060863098,
|
||||
"clock_drift_pct": 2.6961189099917497
|
||||
},
|
||||
"cooldown": {
|
||||
"duration_sec": 120.171037413,
|
||||
"samples": 116,
|
||||
"avg_temp_c": 44.310344827586206,
|
||||
"p95_temp_c": 51,
|
||||
"avg_power_w": 39.81387931034485,
|
||||
"p95_power_w": 54.0825,
|
||||
"avg_graphics_clock_mhz": 179.6551724137931,
|
||||
"p95_graphics_clock_mhz": 180,
|
||||
"avg_memory_clock_mhz": 1237.8275862068965,
|
||||
"p95_memory_clock_mhz": 12481,
|
||||
"avg_usage_pct": 0,
|
||||
"avg_mem_usage_pct": 0,
|
||||
"clock_cv_pct": 0.9043546249051633,
|
||||
"power_cv_pct": 10.379008691678044,
|
||||
"temp_cv_pct": 6.727580324493612,
|
||||
"clock_drift_pct": 0.1537279016141304
|
||||
},
|
||||
"throttle_counters": {
|
||||
"sw_power_cap_us": 0,
|
||||
"sw_thermal_slowdown_us": 0,
|
||||
"sync_boost_us": 0,
|
||||
"hw_thermal_slowdown_us": 0,
|
||||
"hw_power_brake_slowdown_us": 0
|
||||
},
|
||||
"precision_results": [
|
||||
{
|
||||
"name": "fp16_tensor",
|
||||
"category": "fp16_bf16",
|
||||
"supported": true,
|
||||
"lanes": 16,
|
||||
"m": 11904,
|
||||
"n": 11904,
|
||||
"k": 11904,
|
||||
"iterations": 27840,
|
||||
"teraops_per_sec": 195.675631386624
|
||||
},
|
||||
{
|
||||
"name": "fp32_tf32",
|
||||
"category": "fp32_tf32",
|
||||
"supported": true,
|
||||
"lanes": 16,
|
||||
"m": 8320,
|
||||
"n": 8320,
|
||||
"k": 8320,
|
||||
"iterations": 27840,
|
||||
"teraops_per_sec": 66.807922688
|
||||
},
|
||||
{
|
||||
"name": "fp64",
|
||||
"category": "fp64",
|
||||
"supported": false,
|
||||
"notes": "unsupported"
|
||||
},
|
||||
{
|
||||
"name": "fp8_e4m3",
|
||||
"category": "fp8",
|
||||
"supported": true,
|
||||
"lanes": 16,
|
||||
"m": 13696,
|
||||
"n": 13696,
|
||||
"k": 13696,
|
||||
"iterations": 27840,
|
||||
"teraops_per_sec": 298.015759794176
|
||||
},
|
||||
{
|
||||
"name": "fp8_e5m2",
|
||||
"category": "fp8",
|
||||
"supported": false,
|
||||
"notes": "unsupported"
|
||||
}
|
||||
],
|
||||
"scores": {
|
||||
"compute_score": 560.4993138688001,
|
||||
"power_sustain_score": 0,
|
||||
"thermal_sustain_score": 100,
|
||||
"stability_score": 43.96614010540221,
|
||||
"interconnect_score": 0,
|
||||
"composite_score": 385.5855710463551
|
||||
},
|
||||
"degradation_reasons": [
|
||||
"variance_too_high",
|
||||
"normalization_partial"
|
||||
]
|
||||
},
|
||||
{
|
||||
"index": 1,
|
||||
"compute_capability": "12.0",
|
||||
"backend": "cublasLt",
|
||||
"status": "OK",
|
||||
"baseline": {
|
||||
"duration_sec": 15.708738197,
|
||||
"samples": 16,
|
||||
"avg_temp_c": 34,
|
||||
"p95_temp_c": 34,
|
||||
"avg_power_w": 34.82999999999999,
|
||||
"p95_power_w": 34.83,
|
||||
"avg_graphics_clock_mhz": 179.5,
|
||||
"p95_graphics_clock_mhz": 180,
|
||||
"avg_memory_clock_mhz": 405,
|
||||
"p95_memory_clock_mhz": 405,
|
||||
"avg_usage_pct": 0,
|
||||
"avg_mem_usage_pct": 0,
|
||||
"clock_cv_pct": 1.0788254446260215,
|
||||
"power_cv_pct": 2.040030823313524e-14,
|
||||
"temp_cv_pct": 0,
|
||||
"clock_drift_pct": 0
|
||||
},
|
||||
"steady": {
|
||||
"duration_sec": 521.038266969,
|
||||
"samples": 521,
|
||||
"avg_temp_c": 71.71593090211132,
|
||||
"p95_temp_c": 72,
|
||||
"avg_power_w": 518.5774088291746,
|
||||
"p95_power_w": 528.2,
|
||||
"avg_graphics_clock_mhz": 2410.6295585412668,
|
||||
"p95_graphics_clock_mhz": 2422,
|
||||
"avg_memory_clock_mhz": 12481,
|
||||
"p95_memory_clock_mhz": 12481,
|
||||
"avg_usage_pct": 98.85220729366603,
|
||||
"avg_mem_usage_pct": 38.35892514395393,
|
||||
"clock_cv_pct": 6.24737613351838,
|
||||
"power_cv_pct": 9.166896001630583,
|
||||
"temp_cv_pct": 2.232861903238498,
|
||||
"clock_drift_pct": 1.8814711300260394
|
||||
},
|
||||
"cooldown": {
|
||||
"duration_sec": 120.171037413,
|
||||
"samples": 116,
|
||||
"avg_temp_c": 45.741379310344826,
|
||||
"p95_temp_c": 52.25,
|
||||
"avg_power_w": 38.606724137931074,
|
||||
"p95_power_w": 52.75,
|
||||
"avg_graphics_clock_mhz": 179.86206896551724,
|
||||
"p95_graphics_clock_mhz": 180,
|
||||
"avg_memory_clock_mhz": 1446.0344827586207,
|
||||
"p95_memory_clock_mhz": 12481,
|
||||
"avg_usage_pct": 0,
|
||||
"avg_mem_usage_pct": 0,
|
||||
"clock_cv_pct": 0.5789750333796595,
|
||||
"power_cv_pct": 11.580300308869425,
|
||||
"temp_cv_pct": 6.546796049282795,
|
||||
"clock_drift_pct": 0
|
||||
},
|
||||
"throttle_counters": {
|
||||
"sw_power_cap_us": 0,
|
||||
"sw_thermal_slowdown_us": 0,
|
||||
"sync_boost_us": 0,
|
||||
"hw_thermal_slowdown_us": 0,
|
||||
"hw_power_brake_slowdown_us": 0
|
||||
},
|
||||
"precision_results": [
|
||||
{
|
||||
"name": "fp16_tensor",
|
||||
"category": "fp16_bf16",
|
||||
"supported": true,
|
||||
"lanes": 16,
|
||||
"m": 11904,
|
||||
"n": 11904,
|
||||
"k": 11904,
|
||||
"iterations": 27840,
|
||||
"teraops_per_sec": 195.675631386624
|
||||
},
|
||||
{
|
||||
"name": "fp32_tf32",
|
||||
"category": "fp32_tf32",
|
||||
"supported": true,
|
||||
"lanes": 16,
|
||||
"m": 8320,
|
||||
"n": 8320,
|
||||
"k": 8320,
|
||||
"iterations": 27840,
|
||||
"teraops_per_sec": 66.807922688
|
||||
},
|
||||
{
|
||||
"name": "fp64",
|
||||
"category": "fp64",
|
||||
"supported": false,
|
||||
"notes": "unsupported"
|
||||
},
|
||||
{
|
||||
"name": "fp8_e4m3",
|
||||
"category": "fp8",
|
||||
"supported": true,
|
||||
"lanes": 16,
|
||||
"m": 13696,
|
||||
"n": 13696,
|
||||
"k": 13696,
|
||||
"iterations": 27840,
|
||||
"teraops_per_sec": 298.015759794176
|
||||
},
|
||||
{
|
||||
"name": "fp8_e5m2",
|
||||
"category": "fp8",
|
||||
"supported": false,
|
||||
"notes": "unsupported"
|
||||
}
|
||||
],
|
||||
"scores": {
|
||||
"compute_score": 560.4993138688001,
|
||||
"power_sustain_score": 0,
|
||||
"thermal_sustain_score": 100,
|
||||
"stability_score": 52.91376120261324,
|
||||
"interconnect_score": 0,
|
||||
"composite_score": 395.6158420178446
|
||||
},
|
||||
"degradation_reasons": [
|
||||
"variance_too_high",
|
||||
"normalization_partial"
|
||||
]
|
||||
},
|
||||
{
|
||||
"index": 2,
|
||||
"compute_capability": "12.0",
|
||||
"backend": "cublasLt",
|
||||
"status": "OK",
|
||||
"baseline": {
|
||||
"duration_sec": 15.708738197,
|
||||
"samples": 16,
|
||||
"avg_temp_c": 30,
|
||||
"p95_temp_c": 30,
|
||||
"avg_power_w": 35.59374999999999,
|
||||
"p95_power_w": 35.64,
|
||||
"avg_graphics_clock_mhz": 180,
|
||||
"p95_graphics_clock_mhz": 180,
|
||||
"avg_memory_clock_mhz": 405,
|
||||
"p95_memory_clock_mhz": 405,
|
||||
"avg_usage_pct": 0,
|
||||
"avg_mem_usage_pct": 0,
|
||||
"clock_cv_pct": 0,
|
||||
"power_cv_pct": 0.3638624937385677,
|
||||
"temp_cv_pct": 0,
|
||||
"clock_drift_pct": 0
|
||||
},
|
||||
"steady": {
|
||||
"duration_sec": 521.038266969,
|
||||
"samples": 521,
|
||||
"avg_temp_c": 67.8042226487524,
|
||||
"p95_temp_c": 69,
|
||||
"avg_power_w": 511.71065259117063,
|
||||
"p95_power_w": 521.61,
|
||||
"avg_graphics_clock_mhz": 2406.5124760076774,
|
||||
"p95_graphics_clock_mhz": 2422,
|
||||
"avg_memory_clock_mhz": 12481,
|
||||
"p95_memory_clock_mhz": 12481,
|
||||
"avg_usage_pct": 98.6852207293666,
|
||||
"avg_mem_usage_pct": 38.618042226487525,
|
||||
"clock_cv_pct": 7.369275290697701,
|
||||
"power_cv_pct": 9.95377772121058,
|
||||
"temp_cv_pct": 2.709178533043663,
|
||||
"clock_drift_pct": 2.5627262910499864
|
||||
},
|
||||
"cooldown": {
|
||||
"duration_sec": 120.171037413,
|
||||
"samples": 116,
|
||||
"avg_temp_c": 41.293103448275865,
|
||||
"p95_temp_c": 47.25,
|
||||
"avg_power_w": 39.30818965517238,
|
||||
"p95_power_w": 52.955,
|
||||
"avg_graphics_clock_mhz": 179.86206896551724,
|
||||
"p95_graphics_clock_mhz": 180,
|
||||
"avg_memory_clock_mhz": 1237.8275862068965,
|
||||
"p95_memory_clock_mhz": 12481,
|
||||
"avg_usage_pct": 0,
|
||||
"avg_mem_usage_pct": 0,
|
||||
"clock_cv_pct": 0.5789750333796595,
|
||||
"power_cv_pct": 9.84500039444727,
|
||||
"temp_cv_pct": 6.8127582501704795,
|
||||
"clock_drift_pct": 0
|
||||
},
|
||||
"throttle_counters": {
|
||||
"sw_power_cap_us": 0,
|
||||
"sw_thermal_slowdown_us": 0,
|
||||
"sync_boost_us": 0,
|
||||
"hw_thermal_slowdown_us": 0,
|
||||
"hw_power_brake_slowdown_us": 0
|
||||
},
|
||||
"precision_results": [
|
||||
{
|
||||
"name": "fp16_tensor",
|
||||
"category": "fp16_bf16",
|
||||
"supported": true,
|
||||
"lanes": 16,
|
||||
"m": 11904,
|
||||
"n": 11904,
|
||||
"k": 11904,
|
||||
"iterations": 27840,
|
||||
"teraops_per_sec": 195.675631386624
|
||||
},
|
||||
{
|
||||
"name": "fp32_tf32",
|
||||
"category": "fp32_tf32",
|
||||
"supported": true,
|
||||
"lanes": 16,
|
||||
"m": 8320,
|
||||
"n": 8320,
|
||||
"k": 8320,
|
||||
"iterations": 27840,
|
||||
"teraops_per_sec": 66.807922688
|
||||
},
|
||||
{
|
||||
"name": "fp64",
|
||||
"category": "fp64",
|
||||
"supported": false,
|
||||
"notes": "unsupported"
|
||||
},
|
||||
{
|
||||
"name": "fp8_e4m3",
|
||||
"category": "fp8",
|
||||
"supported": true,
|
||||
"lanes": 16,
|
||||
"m": 13696,
|
||||
"n": 13696,
|
||||
"k": 13696,
|
||||
"iterations": 27840,
|
||||
"teraops_per_sec": 298.015759794176
|
||||
},
|
||||
{
|
||||
"name": "fp8_e5m2",
|
||||
"category": "fp8",
|
||||
"supported": false,
|
||||
"notes": "unsupported"
|
||||
}
|
||||
],
|
||||
"scores": {
|
||||
"compute_score": 560.4993138688001,
|
||||
"power_sustain_score": 0,
|
||||
"thermal_sustain_score": 100,
|
||||
"stability_score": 45.48989081268807,
|
||||
"interconnect_score": 0,
|
||||
"composite_score": 387.2936934982367
|
||||
},
|
||||
"degradation_reasons": [
|
||||
"variance_too_high",
|
||||
"normalization_partial"
|
||||
]
|
||||
},
|
||||
{
|
||||
"index": 3,
|
||||
"compute_capability": "12.0",
|
||||
"backend": "cublasLt",
|
||||
"status": "OK",
|
||||
"baseline": {
|
||||
"duration_sec": 15.708738197,
|
||||
"samples": 16,
|
||||
"avg_temp_c": 34,
|
||||
"p95_temp_c": 34,
|
||||
"avg_power_w": 35.513124999999995,
|
||||
"p95_power_w": 35.64,
|
||||
"avg_graphics_clock_mhz": 180,
|
||||
"p95_graphics_clock_mhz": 180,
|
||||
"avg_memory_clock_mhz": 405,
|
||||
"p95_memory_clock_mhz": 405,
|
||||
"avg_usage_pct": 0,
|
||||
"avg_mem_usage_pct": 0,
|
||||
"clock_cv_pct": 0,
|
||||
"power_cv_pct": 0.4941532782477418,
|
||||
"temp_cv_pct": 0,
|
||||
"clock_drift_pct": 0
|
||||
},
|
||||
"steady": {
|
||||
"duration_sec": 521.038266969,
|
||||
"samples": 521,
|
||||
"avg_temp_c": 68.54126679462571,
|
||||
"p95_temp_c": 69,
|
||||
"avg_power_w": 509.9767370441462,
|
||||
"p95_power_w": 519.72,
|
||||
"avg_graphics_clock_mhz": 2404.0940499040307,
|
||||
"p95_graphics_clock_mhz": 2422,
|
||||
"avg_memory_clock_mhz": 12481,
|
||||
"p95_memory_clock_mhz": 12481,
|
||||
"avg_usage_pct": 98.7447216890595,
|
||||
"avg_mem_usage_pct": 38.42610364683301,
|
||||
"clock_cv_pct": 8.026350243134432,
|
||||
"power_cv_pct": 9.808646251646744,
|
||||
"temp_cv_pct": 2.580108116733557,
|
||||
"clock_drift_pct": 1.5637794268167964
|
||||
},
|
||||
"cooldown": {
|
||||
"duration_sec": 120.171037413,
|
||||
"samples": 116,
|
||||
"avg_temp_c": 42.077586206896555,
|
||||
"p95_temp_c": 48.25,
|
||||
"avg_power_w": 38.305517241379285,
|
||||
"p95_power_w": 51.4,
|
||||
"avg_graphics_clock_mhz": 179.79310344827587,
|
||||
"p95_graphics_clock_mhz": 180,
|
||||
"avg_memory_clock_mhz": 1341.9310344827586,
|
||||
"p95_memory_clock_mhz": 12481,
|
||||
"avg_usage_pct": 0,
|
||||
"avg_mem_usage_pct": 0,
|
||||
"clock_cv_pct": 0.7062505807258133,
|
||||
"power_cv_pct": 10.343052937274862,
|
||||
"temp_cv_pct": 7.185134807174834,
|
||||
"clock_drift_pct": 0.15349194167306543
|
||||
},
|
||||
"throttle_counters": {
|
||||
"sw_power_cap_us": 0,
|
||||
"sw_thermal_slowdown_us": 0,
|
||||
"sync_boost_us": 0,
|
||||
"hw_thermal_slowdown_us": 0,
|
||||
"hw_power_brake_slowdown_us": 0
|
||||
},
|
||||
"precision_results": [
|
||||
{
|
||||
"name": "fp16_tensor",
|
||||
"category": "fp16_bf16",
|
||||
"supported": true,
|
||||
"lanes": 16,
|
||||
"m": 11904,
|
||||
"n": 11904,
|
||||
"k": 11904,
|
||||
"iterations": 27840,
|
||||
"teraops_per_sec": 195.675631386624
|
||||
},
|
||||
{
|
||||
"name": "fp32_tf32",
|
||||
"category": "fp32_tf32",
|
||||
"supported": true,
|
||||
"lanes": 16,
|
||||
"m": 8320,
|
||||
"n": 8320,
|
||||
"k": 8320,
|
||||
"iterations": 27840,
|
||||
"teraops_per_sec": 66.807922688
|
||||
},
|
||||
{
|
||||
"name": "fp64",
|
||||
"category": "fp64",
|
||||
"supported": false,
|
||||
"notes": "unsupported"
|
||||
},
|
||||
{
|
||||
"name": "fp8_e4m3",
|
||||
"category": "fp8",
|
||||
"supported": true,
|
||||
"lanes": 16,
|
||||
"m": 13696,
|
||||
"n": 13696,
|
||||
"k": 13696,
|
||||
"iterations": 27840,
|
||||
"teraops_per_sec": 298.015759794176
|
||||
},
|
||||
{
|
||||
"name": "fp8_e5m2",
|
||||
"category": "fp8",
|
||||
"supported": false,
|
||||
"notes": "unsupported"
|
||||
}
|
||||
],
|
||||
"scores": {
|
||||
"compute_score": 560.4993138688001,
|
||||
"power_sustain_score": 0,
|
||||
"thermal_sustain_score": 100,
|
||||
"stability_score": 45.149747670535184,
|
||||
"interconnect_score": 0,
|
||||
"composite_score": 386.91239350264897
|
||||
},
|
||||
"degradation_reasons": [
|
||||
"variance_too_high",
|
||||
"normalization_partial"
|
||||
]
|
||||
}
|
||||
],
|
||||
"server_power": {
|
||||
"available": true,
|
||||
"idle_w": 670.6666666666666,
|
||||
"loaded_w": 3577.3980582524273,
|
||||
"delta_w": 2906.731391585761,
|
||||
"gpu_reported_sum_w": 2062.161996161228,
|
||||
"reporting_ratio": 1.4095553099110167
|
||||
}
|
||||
}
|
||||
573
gpu-benchmark-20260411-085938/result.json
Executable file
573
gpu-benchmark-20260411-085938/result.json
Executable file
@@ -0,0 +1,573 @@
|
||||
{
|
||||
"benchmark_version": "1",
|
||||
"generated_at": "2026-04-11T08:59:38.567052641Z",
|
||||
"hostname": "debian",
|
||||
"server_model": "G5500 V7",
|
||||
"benchmark_profile": "stability",
|
||||
"overall_status": "PARTIAL",
|
||||
"selected_gpu_indices": [
|
||||
0,
|
||||
1,
|
||||
2,
|
||||
3
|
||||
],
|
||||
"findings": [
|
||||
"All 4 GPU(s) passed the benchmark.",
|
||||
"Environment normalization was partial; compare results with caution.",
|
||||
"GPU 0 ran without full benchmark normalization.",
|
||||
"GPU 1 ran without full benchmark normalization.",
|
||||
"GPU 2 ran without full benchmark normalization.",
|
||||
"GPU 3 ran without full benchmark normalization.",
|
||||
"GPU power reporting may be unreliable: server delta 990 W vs GPU-reported 2084 W (ratio 0.47). GPU telemetry likely over-reports actual consumption."
|
||||
],
|
||||
"warnings": [
|
||||
"gpu inventory query failed: nvidia-smi gpu info (index,uuid,name,pci.bus_id,vbios_version): exit status 2"
|
||||
],
|
||||
"normalization": {
|
||||
"status": "partial",
|
||||
"gpus": [
|
||||
{
|
||||
"index": 0,
|
||||
"persistence_mode": "applied",
|
||||
"gpu_clock_lock_status": "skipped",
|
||||
"notes": [
|
||||
"graphics clock lock skipped: gpu inventory unavailable or MaxGraphicsClockMHz=0"
|
||||
]
|
||||
},
|
||||
{
|
||||
"index": 1,
|
||||
"persistence_mode": "applied",
|
||||
"gpu_clock_lock_status": "skipped",
|
||||
"notes": [
|
||||
"graphics clock lock skipped: gpu inventory unavailable or MaxGraphicsClockMHz=0"
|
||||
]
|
||||
},
|
||||
{
|
||||
"index": 2,
|
||||
"persistence_mode": "applied",
|
||||
"gpu_clock_lock_status": "skipped",
|
||||
"notes": [
|
||||
"graphics clock lock skipped: gpu inventory unavailable or MaxGraphicsClockMHz=0"
|
||||
]
|
||||
},
|
||||
{
|
||||
"index": 3,
|
||||
"persistence_mode": "applied",
|
||||
"gpu_clock_lock_status": "skipped",
|
||||
"notes": [
|
||||
"graphics clock lock skipped: gpu inventory unavailable or MaxGraphicsClockMHz=0"
|
||||
]
|
||||
}
|
||||
]
|
||||
},
|
||||
"gpus": [
|
||||
{
|
||||
"index": 0,
|
||||
"compute_capability": "12.0",
|
||||
"backend": "cublasLt",
|
||||
"status": "OK",
|
||||
"baseline": {
|
||||
"duration_sec": 30.999116342,
|
||||
"samples": 31,
|
||||
"avg_temp_c": 50,
|
||||
"p95_temp_c": 54.5,
|
||||
"avg_power_w": 104.47096774193548,
|
||||
"p95_power_w": 108.61,
|
||||
"avg_graphics_clock_mhz": 2422,
|
||||
"p95_graphics_clock_mhz": 2422,
|
||||
"avg_memory_clock_mhz": 12481,
|
||||
"p95_memory_clock_mhz": 12481,
|
||||
"avg_usage_pct": 100,
|
||||
"avg_mem_usage_pct": 0,
|
||||
"clock_cv_pct": 0,
|
||||
"power_cv_pct": 2.028975279257823,
|
||||
"temp_cv_pct": 5.003224766539689,
|
||||
"clock_drift_pct": 0
|
||||
},
|
||||
"steady": {
|
||||
"duration_sec": 3652.033401705,
|
||||
"samples": 3652,
|
||||
"avg_temp_c": 70.00602409638554,
|
||||
"p95_temp_c": 70,
|
||||
"avg_power_w": 524.3030010952905,
|
||||
"p95_power_w": 528.23,
|
||||
"avg_graphics_clock_mhz": 2422,
|
||||
"p95_graphics_clock_mhz": 2422,
|
||||
"avg_memory_clock_mhz": 12481,
|
||||
"p95_memory_clock_mhz": 12481,
|
||||
"avg_usage_pct": 99.93729463307777,
|
||||
"avg_mem_usage_pct": 39.491511500547645,
|
||||
"clock_cv_pct": 0,
|
||||
"power_cv_pct": 2.148355726733903,
|
||||
"temp_cv_pct": 0.5358272117706183,
|
||||
"clock_drift_pct": 0
|
||||
},
|
||||
"cooldown": {
|
||||
"duration_sec": 300.134211129,
|
||||
"samples": 291,
|
||||
"avg_temp_c": 38.807560137457045,
|
||||
"p95_temp_c": 46,
|
||||
"avg_power_w": 38.135498281786944,
|
||||
"p95_power_w": 39.61,
|
||||
"avg_graphics_clock_mhz": 187.59106529209623,
|
||||
"p95_graphics_clock_mhz": 180,
|
||||
"avg_memory_clock_mhz": 944.4776632302405,
|
||||
"p95_memory_clock_mhz": 405,
|
||||
"avg_usage_pct": 0,
|
||||
"avg_mem_usage_pct": 0,
|
||||
"clock_cv_pct": 64.75534616761331,
|
||||
"power_cv_pct": 9.705769321538293,
|
||||
"temp_cv_pct": 11.481450187501306,
|
||||
"clock_drift_pct": 14.989814023789192
|
||||
},
|
||||
"throttle_counters": {
|
||||
"sw_power_cap_us": 0,
|
||||
"sw_thermal_slowdown_us": 0,
|
||||
"sync_boost_us": 0,
|
||||
"hw_thermal_slowdown_us": 0,
|
||||
"hw_power_brake_slowdown_us": 0
|
||||
},
|
||||
"precision_results": [
|
||||
{
|
||||
"name": "fp16_tensor",
|
||||
"category": "fp16_bf16",
|
||||
"supported": true,
|
||||
"lanes": 16,
|
||||
"m": 11904,
|
||||
"n": 11904,
|
||||
"k": 11904,
|
||||
"iterations": 197664,
|
||||
"teraops_per_sec": 185.23959771267073
|
||||
},
|
||||
{
|
||||
"name": "fp32_tf32",
|
||||
"category": "fp32_tf32",
|
||||
"supported": true,
|
||||
"lanes": 16,
|
||||
"m": 8320,
|
||||
"n": 8320,
|
||||
"k": 8320,
|
||||
"iterations": 197664,
|
||||
"teraops_per_sec": 63.24483347797334
|
||||
},
|
||||
{
|
||||
"name": "fp64",
|
||||
"category": "fp64",
|
||||
"supported": false,
|
||||
"notes": "unsupported"
|
||||
},
|
||||
{
|
||||
"name": "fp8_e4m3",
|
||||
"category": "fp8",
|
||||
"supported": true,
|
||||
"lanes": 16,
|
||||
"m": 13696,
|
||||
"n": 13696,
|
||||
"k": 13696,
|
||||
"iterations": 197664,
|
||||
"teraops_per_sec": 282.12158593848665
|
||||
},
|
||||
{
|
||||
"name": "fp8_e5m2",
|
||||
"category": "fp8",
|
||||
"supported": false,
|
||||
"notes": "unsupported"
|
||||
}
|
||||
],
|
||||
"scores": {
|
||||
"compute_score": 530.6060171291307,
|
||||
"power_sustain_score": 0,
|
||||
"thermal_sustain_score": 100,
|
||||
"stability_score": 95.70328854653219,
|
||||
"interconnect_score": 0,
|
||||
"composite_score": 419.9250918011493
|
||||
},
|
||||
"degradation_reasons": [
|
||||
"normalization_partial"
|
||||
]
|
||||
},
|
||||
{
|
||||
"index": 1,
|
||||
"compute_capability": "12.0",
|
||||
"backend": "cublasLt",
|
||||
"status": "OK",
|
||||
"baseline": {
|
||||
"duration_sec": 30.024773184,
|
||||
"samples": 30,
|
||||
"avg_temp_c": 49,
|
||||
"p95_temp_c": 49,
|
||||
"avg_power_w": 99.5443333333333,
|
||||
"p95_power_w": 99.59,
|
||||
"avg_graphics_clock_mhz": 2423.3333333333335,
|
||||
"p95_graphics_clock_mhz": 2430,
|
||||
"avg_memory_clock_mhz": 12481,
|
||||
"p95_memory_clock_mhz": 12481,
|
||||
"avg_usage_pct": 100,
|
||||
"avg_mem_usage_pct": 0,
|
||||
"clock_cv_pct": 0.12302987496560051,
|
||||
"power_cv_pct": 0.08327227979297677,
|
||||
"temp_cv_pct": 0,
|
||||
"clock_drift_pct": 0
|
||||
},
|
||||
"steady": {
|
||||
"duration_sec": 3608.034869542,
|
||||
"samples": 3608,
|
||||
"avg_temp_c": 69.85864745011087,
|
||||
"p95_temp_c": 70,
|
||||
"avg_power_w": 519.3211474501111,
|
||||
"p95_power_w": 523.5,
|
||||
"avg_graphics_clock_mhz": 2422,
|
||||
"p95_graphics_clock_mhz": 2422,
|
||||
"avg_memory_clock_mhz": 12481,
|
||||
"p95_memory_clock_mhz": 12481,
|
||||
"avg_usage_pct": 99.94456762749445,
|
||||
"avg_mem_usage_pct": 38.920731707317074,
|
||||
"clock_cv_pct": 0,
|
||||
"power_cv_pct": 1.9854404455976928,
|
||||
"temp_cv_pct": 0.6438449280694504,
|
||||
"clock_drift_pct": 0
|
||||
},
|
||||
"cooldown": {
|
||||
"duration_sec": 300.694502766,
|
||||
"samples": 291,
|
||||
"avg_temp_c": 31.02405498281787,
|
||||
"p95_temp_c": 49.5,
|
||||
"avg_power_w": 34.87268041237119,
|
||||
"p95_power_w": 37.97,
|
||||
"avg_graphics_clock_mhz": 182.0996563573883,
|
||||
"p95_graphics_clock_mhz": 180,
|
||||
"avg_memory_clock_mhz": 902.979381443299,
|
||||
"p95_memory_clock_mhz": 405,
|
||||
"avg_usage_pct": 0,
|
||||
"avg_mem_usage_pct": 0,
|
||||
"clock_cv_pct": 17.117532557949268,
|
||||
"power_cv_pct": 11.261564470591717,
|
||||
"temp_cv_pct": 22.686094189937133,
|
||||
"clock_drift_pct": 4.900448166923811
|
||||
},
|
||||
"throttle_counters": {
|
||||
"sw_power_cap_us": 0,
|
||||
"sw_thermal_slowdown_us": 0,
|
||||
"sync_boost_us": 0,
|
||||
"hw_thermal_slowdown_us": 0,
|
||||
"hw_power_brake_slowdown_us": 0
|
||||
},
|
||||
"precision_results": [
|
||||
{
|
||||
"name": "fp16_tensor",
|
||||
"category": "fp16_bf16",
|
||||
"supported": true,
|
||||
"lanes": 16,
|
||||
"m": 11904,
|
||||
"n": 11904,
|
||||
"k": 11904,
|
||||
"iterations": 194880,
|
||||
"teraops_per_sec": 182.6305892941824
|
||||
},
|
||||
{
|
||||
"name": "fp32_tf32",
|
||||
"category": "fp32_tf32",
|
||||
"supported": true,
|
||||
"lanes": 16,
|
||||
"m": 8320,
|
||||
"n": 8320,
|
||||
"k": 8320,
|
||||
"iterations": 194880,
|
||||
"teraops_per_sec": 62.35406117546666
|
||||
},
|
||||
{
|
||||
"name": "fp64",
|
||||
"category": "fp64",
|
||||
"supported": false,
|
||||
"notes": "unsupported"
|
||||
},
|
||||
{
|
||||
"name": "fp8_e4m3",
|
||||
"category": "fp8",
|
||||
"supported": true,
|
||||
"lanes": 16,
|
||||
"m": 13696,
|
||||
"n": 13696,
|
||||
"k": 13696,
|
||||
"iterations": 194880,
|
||||
"teraops_per_sec": 278.1480424745643
|
||||
},
|
||||
{
|
||||
"name": "fp8_e5m2",
|
||||
"category": "fp8",
|
||||
"supported": false,
|
||||
"notes": "unsupported"
|
||||
}
|
||||
],
|
||||
"scores": {
|
||||
"compute_score": 523.1326929442134,
|
||||
"power_sustain_score": 0,
|
||||
"thermal_sustain_score": 100,
|
||||
"stability_score": 96.02911910880461,
|
||||
"interconnect_score": 0,
|
||||
"composite_score": 414.35155912742727
|
||||
},
|
||||
"degradation_reasons": [
|
||||
"normalization_partial"
|
||||
]
|
||||
},
|
||||
{
|
||||
"index": 2,
|
||||
"compute_capability": "12.0",
|
||||
"backend": "cublasLt",
|
||||
"status": "OK",
|
||||
"baseline": {
|
||||
"duration_sec": 30.083934487,
|
||||
"samples": 30,
|
||||
"avg_temp_c": 40.06666666666667,
|
||||
"p95_temp_c": 41,
|
||||
"avg_power_w": 104.565,
|
||||
"p95_power_w": 105.1175,
|
||||
"avg_graphics_clock_mhz": 2317.5333333333333,
|
||||
"p95_graphics_clock_mhz": 2321.4,
|
||||
"avg_memory_clock_mhz": 12481,
|
||||
"p95_memory_clock_mhz": 12481,
|
||||
"avg_usage_pct": 100,
|
||||
"avg_mem_usage_pct": 0,
|
||||
"clock_cv_pct": 0.08610666252680013,
|
||||
"power_cv_pct": 0.309119766163425,
|
||||
"temp_cv_pct": 1.6968450960375328,
|
||||
"clock_drift_pct": 0
|
||||
},
|
||||
"steady": {
|
||||
"duration_sec": 3653.036306358,
|
||||
"samples": 3653,
|
||||
"avg_temp_c": 69.79742677251573,
|
||||
"p95_temp_c": 71,
|
||||
"avg_power_w": 521.0794552422657,
|
||||
"p95_power_w": 525.36,
|
||||
"avg_graphics_clock_mhz": 2422,
|
||||
"p95_graphics_clock_mhz": 2422,
|
||||
"avg_memory_clock_mhz": 12481,
|
||||
"p95_memory_clock_mhz": 12481,
|
||||
"avg_usage_pct": 99.9452504790583,
|
||||
"avg_mem_usage_pct": 39.54913769504517,
|
||||
"clock_cv_pct": 0,
|
||||
"power_cv_pct": 1.9968664278288677,
|
||||
"temp_cv_pct": 0.9113538767500047,
|
||||
"clock_drift_pct": 0
|
||||
},
|
||||
"cooldown": {
|
||||
"duration_sec": 300.206414655,
|
||||
"samples": 290,
|
||||
"avg_temp_c": 38.644827586206894,
|
||||
"p95_temp_c": 48,
|
||||
"avg_power_w": 38.240275862069,
|
||||
"p95_power_w": 39.6455,
|
||||
"avg_graphics_clock_mhz": 182.5448275862069,
|
||||
"p95_graphics_clock_mhz": 180,
|
||||
"avg_memory_clock_mhz": 946.3379310344827,
|
||||
"p95_memory_clock_mhz": 405,
|
||||
"avg_usage_pct": 0,
|
||||
"avg_mem_usage_pct": 0,
|
||||
"clock_cv_pct": 17.07777076535198,
|
||||
"power_cv_pct": 9.812483217019517,
|
||||
"temp_cv_pct": 12.52523069358715,
|
||||
"clock_drift_pct": 5.779589459892267
|
||||
},
|
||||
"throttle_counters": {
|
||||
"sw_power_cap_us": 0,
|
||||
"sw_thermal_slowdown_us": 0,
|
||||
"sync_boost_us": 0,
|
||||
"hw_thermal_slowdown_us": 0,
|
||||
"hw_power_brake_slowdown_us": 0
|
||||
},
|
||||
"precision_results": [
|
||||
{
|
||||
"name": "fp16_tensor",
|
||||
"category": "fp16_bf16",
|
||||
"supported": true,
|
||||
"lanes": 16,
|
||||
"m": 11904,
|
||||
"n": 11904,
|
||||
"k": 11904,
|
||||
"iterations": 197648,
|
||||
"teraops_per_sec": 185.22460341141502
|
||||
},
|
||||
{
|
||||
"name": "fp32_tf32",
|
||||
"category": "fp32_tf32",
|
||||
"supported": true,
|
||||
"lanes": 16,
|
||||
"m": 8320,
|
||||
"n": 8320,
|
||||
"k": 8320,
|
||||
"iterations": 197648,
|
||||
"teraops_per_sec": 63.239714096924445
|
||||
},
|
||||
{
|
||||
"name": "fp64",
|
||||
"category": "fp64",
|
||||
"supported": false,
|
||||
"notes": "unsupported"
|
||||
},
|
||||
{
|
||||
"name": "fp8_e4m3",
|
||||
"category": "fp8",
|
||||
"supported": true,
|
||||
"lanes": 16,
|
||||
"m": 13696,
|
||||
"n": 13696,
|
||||
"k": 13696,
|
||||
"iterations": 197648,
|
||||
"teraops_per_sec": 282.09874948179737
|
||||
},
|
||||
{
|
||||
"name": "fp8_e5m2",
|
||||
"category": "fp8",
|
||||
"supported": false,
|
||||
"notes": "unsupported"
|
||||
}
|
||||
],
|
||||
"scores": {
|
||||
"compute_score": 530.5630669901368,
|
||||
"power_sustain_score": 0,
|
||||
"thermal_sustain_score": 100,
|
||||
"stability_score": 96.00626714434226,
|
||||
"interconnect_score": 0,
|
||||
"composite_score": 420.21259928683537
|
||||
},
|
||||
"degradation_reasons": [
|
||||
"normalization_partial"
|
||||
]
|
||||
},
|
||||
{
|
||||
"index": 3,
|
||||
"compute_capability": "12.0",
|
||||
"backend": "cublasLt",
|
||||
"status": "OK",
|
||||
"baseline": {
|
||||
"duration_sec": 30.126177597,
|
||||
"samples": 30,
|
||||
"avg_temp_c": 46.7,
|
||||
"p95_temp_c": 47,
|
||||
"avg_power_w": 98.56633333333333,
|
||||
"p95_power_w": 98.83,
|
||||
"avg_graphics_clock_mhz": 2422,
|
||||
"p95_graphics_clock_mhz": 2422,
|
||||
"avg_memory_clock_mhz": 12481,
|
||||
"p95_memory_clock_mhz": 12481,
|
||||
"avg_usage_pct": 100,
|
||||
"avg_mem_usage_pct": 0,
|
||||
"clock_cv_pct": 0,
|
||||
"power_cv_pct": 0.18649396425550566,
|
||||
"temp_cv_pct": 0.9812795920676312,
|
||||
"clock_drift_pct": 0
|
||||
},
|
||||
"steady": {
|
||||
"duration_sec": 3603.039321222,
|
||||
"samples": 3603,
|
||||
"avg_temp_c": 69.96364140993616,
|
||||
"p95_temp_c": 71,
|
||||
"avg_power_w": 518.9227643630296,
|
||||
"p95_power_w": 523.27,
|
||||
"avg_graphics_clock_mhz": 2422,
|
||||
"p95_graphics_clock_mhz": 2422,
|
||||
"avg_memory_clock_mhz": 12481,
|
||||
"p95_memory_clock_mhz": 12481,
|
||||
"avg_usage_pct": 99.93422148209825,
|
||||
"avg_mem_usage_pct": 39.586455731335,
|
||||
"clock_cv_pct": 0,
|
||||
"power_cv_pct": 2.281713247433057,
|
||||
"temp_cv_pct": 1.1128723340072593,
|
||||
"clock_drift_pct": 0
|
||||
},
|
||||
"cooldown": {
|
||||
"duration_sec": 300.670868947,
|
||||
"samples": 290,
|
||||
"avg_temp_c": 38.148275862068964,
|
||||
"p95_temp_c": 47,
|
||||
"avg_power_w": 38.17251724137949,
|
||||
"p95_power_w": 39.61,
|
||||
"avg_graphics_clock_mhz": 189.0103448275862,
|
||||
"p95_graphics_clock_mhz": 180,
|
||||
"avg_memory_clock_mhz": 946.3379310344827,
|
||||
"p95_memory_clock_mhz": 405,
|
||||
"avg_usage_pct": 0,
|
||||
"avg_mem_usage_pct": 0,
|
||||
"clock_cv_pct": 70.2162030341821,
|
||||
"power_cv_pct": 10.027005094761156,
|
||||
"temp_cv_pct": 12.51736757591107,
|
||||
"clock_drift_pct": 17.23078891803699
|
||||
},
|
||||
"throttle_counters": {
|
||||
"sw_power_cap_us": 0,
|
||||
"sw_thermal_slowdown_us": 0,
|
||||
"sync_boost_us": 0,
|
||||
"hw_thermal_slowdown_us": 0,
|
||||
"hw_power_brake_slowdown_us": 0
|
||||
},
|
||||
"precision_results": [
|
||||
{
|
||||
"name": "fp16_tensor",
|
||||
"category": "fp16_bf16",
|
||||
"supported": true,
|
||||
"lanes": 16,
|
||||
"m": 11904,
|
||||
"n": 11904,
|
||||
"k": 11904,
|
||||
"iterations": 194896,
|
||||
"teraops_per_sec": 182.6455835954381
|
||||
},
|
||||
{
|
||||
"name": "fp32_tf32",
|
||||
"category": "fp32_tf32",
|
||||
"supported": true,
|
||||
"lanes": 16,
|
||||
"m": 8320,
|
||||
"n": 8320,
|
||||
"k": 8320,
|
||||
"iterations": 194896,
|
||||
"teraops_per_sec": 62.359180556515554
|
||||
},
|
||||
{
|
||||
"name": "fp64",
|
||||
"category": "fp64",
|
||||
"supported": false,
|
||||
"notes": "unsupported"
|
||||
},
|
||||
{
|
||||
"name": "fp8_e4m3",
|
||||
"category": "fp8",
|
||||
"supported": true,
|
||||
"lanes": 16,
|
||||
"m": 13696,
|
||||
"n": 13696,
|
||||
"k": 13696,
|
||||
"iterations": 194896,
|
||||
"teraops_per_sec": 278.17087893125347
|
||||
},
|
||||
{
|
||||
"name": "fp8_e5m2",
|
||||
"category": "fp8",
|
||||
"supported": false,
|
||||
"notes": "unsupported"
|
||||
}
|
||||
],
|
||||
"scores": {
|
||||
"compute_score": 523.1756430832071,
|
||||
"power_sustain_score": 0,
|
||||
"thermal_sustain_score": 100,
|
||||
"stability_score": 95.43657350513388,
|
||||
"interconnect_score": 0,
|
||||
"composite_score": 413.76556728433667
|
||||
},
|
||||
"degradation_reasons": [
|
||||
"normalization_partial"
|
||||
]
|
||||
}
|
||||
],
|
||||
"server_power": {
|
||||
"available": true,
|
||||
"idle_w": 936,
|
||||
"loaded_w": 1925.6498918250659,
|
||||
"delta_w": 989.6498918250659,
|
||||
"gpu_reported_sum_w": 2083.626368150697,
|
||||
"reporting_ratio": 0.47496514104081927
|
||||
}
|
||||
}
|
||||
Reference in New Issue
Block a user