诊断项未通过时返回的JSON示例
带宽诊断
带宽诊断不通过时，返回的JSON文件回显如下：
{
"DiagnosisItems": [
{
"group_name": "Hardware",
"group_results": "FAIL",
"sub_items": [
{
"item_info": [
"d2d bandwidth diagnosis failed on device 0 with bandwidth 751.0634765625 / 4999",
"d2h bandwidth diagnosis failed on device 0 with bandwidth 28.201079722538424 / 30",
"h2d bandwidth diagnosis failed on device 0 with bandwidth 25.111515452819699 / 40",
"p2p unidirectional bandwidth diagnosis failed from device 0 to device 1 with bandwidth 26.207678676901633 / 50",
"p2p bidirectional bandwidth diagnosis failed from device 0 to device 1 with bandwidth 50.990615028778471 / 90"
],
"item_info_element": [
{
"device_id": "0",
"threshold_info": [
{
"actual_value": "751.0634765625",
"expected_status": "The value must be greater than 4999",
"test_item": "d2d"
},
{
"actual_value": "28.201079722538424",
"expected_status": "The value must be greater than 30",
"test_item": "d2h"
},
{
"actual_value": "25.111515452819699",
"expected_status": "The value must be greater than 40",
"test_item": "h2d"
},
{
"actual_value": "26.207678676901633",
"detail_info": [
{
"key": "dst_device_id",
"value": "1"
}
],
"expected_status": "The value must be greater than 50",
"test_item": "p2p unidirectional"
},
{
"actual_value": "50.990615028778471",
"detail_info": [
{
"key": "dst_device_id",
"value": "1"
}
],
"expected_status": "The value must be greater than 90",
"test_item": "p2p bidirectional"
}
],
"type": "bandwidth"
}
],
"item_name": "bandwidth",
"item_result": "FAIL"
}
]
}
],
"Summary": {
"Arch": "aarch64",
"Mode": "******",
"Time": "20241104-03:55:27"
}
}
算力诊断
算力诊断不通过时，返回的JSON文件回显如下：
{
"DiagnosisItems": [
{
"group_name": "Hardware",
"group_results": "FAIL",
"sub_items": [
{
"item_info": [
"Check AI flops failed on device 0 with flops 315.199005 / 600",
"Temperature Warned on device 0 with 40 / 10"
],
"item_info_element": [
{
"device_id": "0",
"threshold_info": [
{
"actual_value": "315.199005",
"expected_status": "The value must be greater than 600",
"test_item": "flops"
},
{
"actual_value": "40",
"expected_status": "The value must be greater than 10",
"test_item": "temperature"
}
],
"type": "aiflops"
}
],
"item_name": "aiflops",
"item_result": "FAIL"
}
]
}
],
"Summary": {
"Arch": "aarch64",
"Mode": "******",
"Time": "20241108-04:00:29"
}
}
眼图诊断
眼图诊断不通过时，返回的JSON文件回显如下：
{
"DiagnosisItems": [
{
"group_name": "Hardware",
"group_results": "IMPORTANT_WARN",
"sub_items": [
{
"item_name": "signalQuality",
"item_result": "IMPORTANT_WARN",
"result_array": [
{
"item_info": [
"Hccs signal quality abnormal, srcDevice 0, macro 2, lane: 0, dstDevice: 1, snr: 633378, heh: 386",
"Roce signal quality abnormal, device 0, macro 0, lane: 0, snr: 594869, heh: 382",
"pcie signal quality is abnormal on device 0",
"pcie signal quality is abnormal on device 1"
],
"item_info_element": [
{
"device_id": "0",
"threshold_info": [
{
"actual_value": "633378",
"detail_info": [
{
"key": "macro",
"value": "2"
},
{
"key": "lane",
"value": "0"
},
{
"key": "dst_device_id",
"value": "1"
}
],
"expected_status": "The value must be greater than 800000",
"test_item": "snr"
},
{
"actual_value": "386",
"detail_info": [
{
"key": "macro",
"value": "2"
},
{
"key": "lane",
"value": "0"
},
{
"key": "dst_device_id",
"value": "1"
}
],
"expected_status": "The value must be greater than 750",
"test_item": "heh"
}
],
"type": "signal quality hccs"
},
{
"device_id": "0",
"threshold_info": [
{
"actual_value": "-69",
"detail_info": [
{
"key": "macro",
"value": "9"
},
{
"key": "lane",
"value": "0"
}
],
"expected_status": "The value must be less than 170",
"test_item": "bottom"
},
{
"actual_value": "70",
"detail_info": [
{
"key": "macro",
"value": "9"
},
{
"key": "lane",
"value": "0"
}
],
"expected_status": "The value must be greater than 170",
"test_item": "top"
},
{
"actual_value": "-75",
"detail_info": [
{
"key": "macro",
"value": "9"
},
{
"key": "lane",
"value": "1"
}
],
"expected_status": "The value must be less than 170",
"test_item": "bottom"
},
{
"actual_value": "69",
"detail_info": [
{
"key": "macro",
"value": "9"
},
{
"key": "lane",
"value": "1"
}
],
"expected_status": "The value must be greater than 170",
"test_item": "top"
}
],
"type": "signal quality pcie"
},
{
"device_id": "0",
"threshold_info": [
{
"actual_value": "594869",
"detail_info": [
{
"key": "macro",
"value": "0"
},
{
"key": "lane",
"value": "0"
}
],
"expected_status": "The value must be greater than 800000",
"test_item": "snr"
},
{
"actual_value": "382",
"detail_info": [
{
"key": "macro",
"value": "0"
},
{
"key": "lane",
"value": "0"
}
],
"expected_status": "The value must be greater than 750",
"test_item": "heh"
}
],
"type": "signal quality roce"
}
],
"item_result": "IMPORTANT_WARN"
}
]
}
]
}
],
"Summary": {
"Arch": "aarch64",
"Mode": "******",
"Time": "20241104-06:18:45"
}
}
PRBS码流诊断
PRBS码流诊断不通过时，返回的JSON文件回显如下：
{
"DiagnosisItems": [
{
"group_name": "Hardware",
"group_results": "IMPORTANT_WARN",
"sub_items": [
{
"item_name": "prbs",
"item_result": "IMPORTANT_WARN",
"result_array": [
{
"item_info": [
"lane: 0, error count: 60000000, error rate: 0.0420698359%, alos: 0 on device 0"
],
"item_info_element": [
{
"device_id": "0",
"threshold_info": [
{
"actual_value": "0.0004206984",
"detail_info": [
{
"key": "lane",
"value": "0"
}
],
"expected_status": "The value must be less than 1e-05",
"test_item": "error rate"
}
],
"type": "prbs"
}
],
"item_result": "IMPORTANT_WARN"
}
]
}
]
}
],
"Summary": {
"Arch": "aarch64",
"Mode": "******",
"Time": "20241104-22:35:36"
}
}
NIC诊断
NIC诊断不通过时，返回的JSON文件回显如下：
{
"DiagnosisItems": [
{
"group_name": "Hardware",
"group_results": "GENERAL_WARN",
"sub_items": [
{
"item_name": "nic",
"item_result": "GENERAL_WARN",
"nic_result_array": [
{
"item_info": [
"not connected between device 0 and device 1."
],
"item_result": "GENERAL_WARN"
}
]
}
]
}
],
"Summary": {
"Arch": "aarch64",
"Mode": "******",
"Time": "20250305-17:20:02"
}
}
父主题：参考信息