诊断项未通过时返回的JSON示例
带宽诊断
带宽诊断不通过时,返回的JSON文件回显如下:
{ "DiagnosisItems": [ { "group_name": "Hardware", "group_results": "FAIL", "sub_items": [ { "item_info": [ "d2d bandwidth diagnosis failed on device 0 with bandwidth 751.0634765625 / 4999", "d2h bandwidth diagnosis failed on device 0 with bandwidth 28.201079722538424 / 30", "h2d bandwidth diagnosis failed on device 0 with bandwidth 25.111515452819699 / 40", "p2p unidirectional bandwidth diagnosis failed from device 0 to device 1 with bandwidth 26.207678676901633 / 50", "p2p bidirectional bandwidth diagnosis failed from device 0 to device 1 with bandwidth 50.990615028778471 / 90" ], "item_info_element": [ { "device_id": "0", "threshold_info": [ { "actual_value": "751.0634765625", "expected_status": "The value must be greater than 4999", "test_item": "d2d" }, { "actual_value": "28.201079722538424", "expected_status": "The value must be greater than 30", "test_item": "d2h" }, { "actual_value": "25.111515452819699", "expected_status": "The value must be greater than 40", "test_item": "h2d" }, { "actual_value": "26.207678676901633", "detail_info": [ { "key": "dst_device_id", "value": "1" } ], "expected_status": "The value must be greater than 50", "test_item": "p2p unidirectional" }, { "actual_value": "50.990615028778471", "detail_info": [ { "key": "dst_device_id", "value": "1" } ], "expected_status": "The value must be greater than 90", "test_item": "p2p bidirectional" } ], "type": "bandwidth" } ], "item_name": "bandwidth", "item_result": "FAIL" } ] } ], "Summary": { "Arch": "aarch64", "Mode": "******", "Time": "20241104-03:55:27" } }
算力诊断
算力诊断不通过时,返回的JSON文件回显如下:
{ "DiagnosisItems": [ { "group_name": "Hardware", "group_results": "FAIL", "sub_items": [ { "item_info": [ "Check AI flops failed on device 0 with flops 315.199005 / 600", "Temperature Warned on device 0 with 40 / 10" ], "item_info_element": [ { "device_id": "0", "threshold_info": [ { "actual_value": "315.199005", "expected_status": "The value must be greater than 600", "test_item": "flops" }, { "actual_value": "40", "expected_status": "The value must be greater than 10", "test_item": "temperature" } ], "type": "aiflops" } ], "item_name": "aiflops", "item_result": "FAIL" } ] } ], "Summary": { "Arch": "aarch64", "Mode": "******", "Time": "20241108-04:00:29" } }
眼图诊断
眼图诊断不通过时,返回的JSON文件回显如下:
{ "DiagnosisItems": [ { "group_name": "Hardware", "group_results": "IMPORTANT_WARN", "sub_items": [ { "item_name": "signalQuality", "item_result": "IMPORTANT_WARN", "result_array": [ { "item_info": [ "Hccs signal quality abnormal, srcDevice 0, macro 2, lane: 0, dstDevice: 1, snr: 633378, heh: 386", "Roce signal quality abnormal, device 0, macro 0, lane: 0, snr: 594869, heh: 382", "pcie signal quality is abnormal on device 0", "pcie signal quality is abnormal on device 1" ], "item_info_element": [ { "device_id": "0", "threshold_info": [ { "actual_value": "633378", "detail_info": [ { "key": "macro", "value": "2" }, { "key": "lane", "value": "0" }, { "key": "dst_device_id", "value": "1" } ], "expected_status": "The value must be greater than 800000", "test_item": "snr" }, { "actual_value": "386", "detail_info": [ { "key": "macro", "value": "2" }, { "key": "lane", "value": "0" }, { "key": "dst_device_id", "value": "1" } ], "expected_status": "The value must be greater than 750", "test_item": "heh" } ], "type": "signal quality hccs" }, { "device_id": "0", "threshold_info": [ { "actual_value": "-69", "detail_info": [ { "key": "macro", "value": "9" }, { "key": "lane", "value": "0" } ], "expected_status": "The value must be less than 170", "test_item": "bottom" }, { "actual_value": "70", "detail_info": [ { "key": "macro", "value": "9" }, { "key": "lane", "value": "0" } ], "expected_status": "The value must be greater than 170", "test_item": "top" }, { "actual_value": "-75", "detail_info": [ { "key": "macro", "value": "9" }, { "key": "lane", "value": "1" } ], "expected_status": "The value must be less than 170", "test_item": "bottom" }, { "actual_value": "69", "detail_info": [ { "key": "macro", "value": "9" }, { "key": "lane", "value": "1" } ], "expected_status": "The value must be greater than 170", "test_item": "top" } ], "type": "signal quality pcie" }, { "device_id": "0", "threshold_info": [ { "actual_value": "594869", "detail_info": [ { "key": "macro", "value": "0" }, 
{ "key": "lane", "value": "0" } ], "expected_status": "The value must be greater than 800000", "test_item": "snr" }, { "actual_value": "382", "detail_info": [ { "key": "macro", "value": "0" }, { "key": "lane", "value": "0" } ], "expected_status": "The value must be greater than 750", "test_item": "heh" } ], "type": "signal quality roce" } ], "item_result": "IMPORTANT_WARN" } ] } ] } ], "Summary": { "Arch": "aarch64", "Mode": "******", "Time": "20241104-06:18:45" } }
PRBS码流诊断
PRBS码流诊断不通过时,返回的JSON文件回显如下:
{ "DiagnosisItems": [ { "group_name": "Hardware", "group_results": "IMPORTANT_WARN", "sub_items": [ { "item_name": "prbs", "item_result": "IMPORTANT_WARN", "result_array": [ { "item_info": [ "lane: 0, error count: 60000000, error rate: 0.0420698359%, alos: 0 on device 0" ], "item_info_element": [ { "device_id": "0", "threshold_info": [ { "actual_value": "0.0004206984", "detail_info": [ { "key": "lane", "value": "0" } ], "expected_status": "The value must be less than 1e-05", "test_item": "error rate" } ], "type": "prbs" } ], "item_result": "IMPORTANT_WARN" } ] } ] } ], "Summary": { "Arch": "aarch64", "Mode": "******", "Time": "20241104-22:35:36" } }
NIC诊断
NIC诊断不通过时,返回的JSON文件回显如下:
{ "DiagnosisItems": [ { "group_name": "Hardware", "group_results": "GENERAL_WARN", "sub_items": [ { "item_name": "nic", "item_result": "GENERAL_WARN", "nic_result_array": [ { "item_info": [ "not connected between device 0 and device 1." ], "item_result": "GENERAL_WARN" } ] } ] } ], "Summary": { "Arch": "aarch64", "Mode": "******", "Time": "20250305-17:20:02" } }
父主题: 参考信息