[
  {
    "50.00 percentile latency (ns)": 48120510,
    "90.00 percentile latency (ns)": 68597056,
    "95.00 percentile latency (ns)": 75848626,
    "97.00 percentile latency (ns)": 79450547,
    "99.00 percentile latency (ns)": 84819181,
    "99.90 percentile latency (ns)": 92055737,
    "Completed samples per second": 8070.84,
    "Max latency (ns)": 101756572,
    "Mean latency (ns)": 48988919,
    "Min duration satisfied": "Yes",
    "Min latency (ns)": 16668340,
    "Min queries satisfied": "Yes",
    "Mode": "PerformanceOnly",
    "Performance constraints satisfied": "Yes",
    "Result is": "VALID",
    "SUT name": "LWIS_Server",
    "Scenario": "server",
    "Scheduled samples per second": 8071.37,
    "accelerator_frequency": "",
    "accelerator_host_interconnect": "",
    "accelerator_interconnect": "",
    "accelerator_interconnect_topology": "",
    "accelerator_memory_capacity": "80 GB",
    "accelerator_memory_configuration": "",
    "accelerator_model_name": "NVIDIA A100-SXM-80GB",
    "accelerator_on-chip_memories": "",
    "accelerators_per_node": 8,
    "accuracy_log_probability": 0,
    "accuracy_log_rng_seed": 0,
    "accuracy_log_sampling_target": 0,
    "boot_firmware_version": "",
    "characteristics.mAP": 20.112,
    "characteristics.scheduled_queries_per_second": 8071.37,
    "characteristics.scheduled_queries_per_second.normalized_per_core": 1008.92125,
    "characteristics.scheduled_queries_per_second.normalized_per_processor": 1008.92125,
    "ck_system": "NF5488A5_A100-SXM-80GBx8_TRT",
    "ck_used": false,
    "cooling": "Liquid",
    "dataset": "COCO 2017 (300x300)",
    "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/coco2017.md",
    "dim_x_default": "characteristics.scheduled_queries_per_second",
    "dim_y_default": "characteristics.mAP",
    "dim_y_maximize": true,
    "disk_controllers": "",
    "disk_drives": "",
    "division": "closed",
    "filesystem": "",
    "formal_model": "ssd-mobilenet",
    "formal_model_accuracy": 99.0,
    "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package",
    "framework": "TensorRT 8.0.1, CUDA 11.3",
    "host_memory_capacity": "2 TB",
    "host_memory_configuration": "",
    "host_networking": "",
    "host_networking_topology": "",
    "host_processor_caches": "",
    "host_processor_core_count": 64,
    "host_processor_frequency": "",
    "host_processor_interconnect": "",
    "host_processor_model_name": "AMD EPYC 7742",
    "host_processors_per_node": 2,
    "host_storage_capacity": "11.7 TB + 448GB*2",
    "host_storage_type": "NVMe SSD + M.2",
    "hw_notes": "NVIDIA A100-SXM-80GB-500W",
    "informal_model": "ssd-resnet34",
    "input_data_types": "int8",
    "key.accuracy": "characteristics.mAP",
    "management_firmware_version": "",
    "max_async_queries": 0,
    "max_duration (ms)": 0,
    "max_query_count": 0,
    "min_duration (ms)": 600000,
    "min_query_count": 270336,
    "mlperf_version": 1.1,
    "network_speed_mbit": "",
    "nics_enabled_connected": "",
    "nics_enabled_firmware": "",
    "nics_enabled_os": "",
    "normalize_cores": 8,
    "normalize_processors": 8,
    "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/closed/Inspur/code",
    "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/closed/Inspur/results/NF5488A5_A100-SXM-80GBx8_TRT",
    "number_of_nodes": 1,
    "number_of_type_nics_installed": "",
    "operating_system": "Ubuntu 20.04.2",
    "other_hardware": "",
    "other_software_stack": "TensorRT 8.0.1, CUDA 11.3, cuDNN 8.2.1, Driver 470.57.02, DALI 0.31.0",
    "performance_issue_same": 0,
    "performance_issue_same_index": 0,
    "performance_issue_unique": 0,
    "performance_sample_count": 64,
    "power_management": "",
    "power_supply_details": "",
    "power_supply_quantity_and_rating_watts": "",
    "print_timestamps": 0,
    "problem": false,
    "qsl_rng_seed": 1624344308455410291,
    "retraining": "N",
    "sample_index_rng_seed": 517984244576520566,
    "samples_per_query": 1,
    "schedule_rng_seed": 10051496985653635065,
    "starting_weights_filename": "resnet34-ssd1200.pytorch",
    "status": "available",
    "submitter": "Inspur",
    "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Inspur",
    "sw_notes": "",
    "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/NF5488A5_A100-SXM-80GBx8_TRT",
    "system_name": "NF5488A5 (8x A100-SXM-80GB, TensorRT)",
    "system_type": "datacenter",
    "target_latency (ns)": 100000000,
    "target_qps": 8070,
    "task": "object detection",
    "task2": "object detection",
    "total_cores": 128,
    "uid": "cdaae669f92abde8",
    "use_accelerator": true,
    "weight_data_types": "int8",
    "weight_transformations": "quantization, affine fusion"
  },
  {
    "50.00 percentile latency (ns)": 33060402,
    "90.00 percentile latency (ns)": 58475265,
    "95.00 percentile latency (ns)": 65190296,
    "97.00 percentile latency (ns)": 72027755,
    "99.00 percentile latency (ns)": 81996120,
    "99.90 percentile latency (ns)": 98783869,
    "Completed samples per second": 7764.13,
    "Max latency (ns)": 114247173,
    "Mean latency (ns)": 36789958,
    "Min duration satisfied": "Yes",
    "Min latency (ns)": 16717624,
    "Min queries satisfied": "Yes",
    "Mode": "PerformanceOnly",
    "Performance constraints satisfied": "Yes",
    "Result is": "VALID",
    "SUT name": "LWIS_Server",
    "Scenario": "server",
    "Scheduled samples per second": 7764.69,
    "accelerator_frequency": "",
    "accelerator_host_interconnect": "",
    "accelerator_interconnect": "",
    "accelerator_interconnect_topology": "",
    "accelerator_memory_capacity": "40GB",
    "accelerator_memory_configuration": "HBM2",
    "accelerator_model_name": "NVIDIA A100-SXM4-40GB",
    "accelerator_on-chip_memories": "",
    "accelerators_per_node": 8,
    "accuracy_log_probability": 0,
    "accuracy_log_rng_seed": 0,
    "accuracy_log_sampling_target": 0,
    "characteristics.mAP": 20.111,
    "characteristics.scheduled_queries_per_second": 7764.69,
    "characteristics.scheduled_queries_per_second.normalized_per_core": 970.58625,
    "characteristics.scheduled_queries_per_second.normalized_per_processor": 970.58625,
    "ck_system": "NF5488M6_A100-SXM4-40GBx8_TRT",
    "ck_used": true,
    "cooling": "",
    "dataset": "COCO 2017 (300x300)",
    "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/coco2017.md",
    "dim_x_default": "characteristics.scheduled_queries_per_second",
    "dim_y_default": "characteristics.mAP",
    "dim_y_maximize": true,
    "division": "closed",
    "formal_model": "ssd-mobilenet",
    "formal_model_accuracy": 99.0,
    "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package",
    "framework": "TensorRT 7.2, CUDA 11.2",
    "host_memory_capacity": "1 TB",
    "host_memory_configuration": "",
    "host_networking": "",
    "host_networking_topology": "",
    "host_processor_caches": "",
    "host_processor_core_count": 120,
    "host_processor_frequency": "",
    "host_processor_interconnect": "",
    "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor",
    "host_processors_per_node": 2,
    "host_storage_capacity": "15 TB",
    "host_storage_type": "NVMe SSD",
    "hw_notes": "",
    "informal_model": "ssd-resnet34",
    "input_data_types": "int8",
    "key.accuracy": "characteristics.mAP",
    "max_async_queries": 0,
    "max_duration (ms)": 0,
    "max_query_count": 0,
    "min_duration (ms)": 600000,
    "min_query_count": 270336,
    "mlperf_version": 1.0,
    "normalize_cores": 8,
    "normalize_processors": 8,
    "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/closed/Inspur/code",
    "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/closed/Inspur/results/NF5488M6_A100-SXM4-40GBx8_TRT",
    "number_of_nodes": 1,
    "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)",
    "other_software_stack": "TensorRT 7.2, CUDA 11.2, cuDNN 8.0.2, DALI 0.25.0; GCC 7.5.0; Python 3.7.10",
    "performance_issue_same": 0,
    "performance_issue_same_index": 0,
    "performance_issue_unique": 0,
    "performance_sample_count": 64,
    "print_timestamps": 0,
    "problem": false,
    "qsl_rng_seed": 7322528924094909334,
    "retraining": "N",
    "sample_index_rng_seed": 1570999273408051088,
    "samples_per_query": 1,
    "schedule_rng_seed": 3507442325620259414,
    "starting_weights_filename": "resnet34-ssd1200.pytorch",
    "status": "Preview",
    "submitter": "Inspur",
    "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Inspur",
    "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)",
    "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/NF5488M6_A100-SXM4-40GBx8_TRT",
    "system_name": "Microsoft Corporation 7.0 (Virtual Machine)",
    "system_type": "datacenter",
    "target_latency (ns)": 100000000,
    "target_qps": 7760,
    "task": "object detection",
    "task2": "object detection",
    "total_cores": 240,
    "uid": "baa16a51a26aa227",
    "use_accelerator": true,
    "weight_data_types": "int8",
    "weight_transformations": "quantization, affine fusion"
  },
  {
    "50.00 percentile latency (ns)": 41192459,
    "90.00 percentile latency (ns)": 58031268,
    "95.00 percentile latency (ns)": 63042020,
    "97.00 percentile latency (ns)": 66232690,
    "99.00 percentile latency (ns)": 73872638,
    "99.90 percentile latency (ns)": 83339097,
    "Completed samples per second": 8054.02,
    "Max latency (ns)": 90885032,
    "Mean latency (ns)": 41509429,
    "Min duration satisfied": "Yes",
    "Min latency (ns)": 16566866,
    "Min queries satisfied": "Yes",
    "Mode": "PerformanceOnly",
    "Performance constraints satisfied": "Yes",
    "Result is": "VALID",
    "SUT name": "LWIS_Server",
    "Scenario": "server",
    "Scheduled samples per second": 8054.45,
    "accelerator_frequency": "",
    "accelerator_host_interconnect": "",
    "accelerator_interconnect": "",
    "accelerator_interconnect_topology": "",
    "accelerator_memory_capacity": "80GB",
    "accelerator_memory_configuration": "HBM2",
    "accelerator_model_name": "NVIDIA A100-SXM-80GB",
    "accelerator_on-chip_memories": "",
    "accelerators_per_node": 8,
    "accuracy_log_probability": 0,
    "accuracy_log_rng_seed": 0,
    "accuracy_log_sampling_target": 0,
    "characteristics.mAP": 20.111,
    "characteristics.scheduled_queries_per_second": 8054.45,
    "characteristics.scheduled_queries_per_second.normalized_per_core": 1006.80625,
    "characteristics.scheduled_queries_per_second.normalized_per_processor": 1006.80625,
    "ck_system": "NF5488A5_LIQUID_A100-SXM-80GBx8_TRT",
    "ck_used": false,
    "cooling": "Liquid",
    "dataset": "COCO 2017 (300x300)",
    "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/coco2017.md",
    "dim_x_default": "characteristics.scheduled_queries_per_second",
    "dim_y_default": "characteristics.mAP",
    "dim_y_maximize": true,
    "division": "closed",
    "formal_model": "ssd-mobilenet",
    "formal_model_accuracy": 99.0,
    "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package",
    "framework": "TensorRT 7.2, CUDA 11.2",
    "host_memory_capacity": "1 TB",
    "host_memory_configuration": "",
    "host_networking": "",
    "host_networking_topology": "",
    "host_processor_caches": "",
    "host_processor_core_count": 64,
    "host_processor_frequency": "",
    "host_processor_interconnect": "",
    "host_processor_model_name": "AMD EPYC 7742",
    "host_processors_per_node": 2,
    "host_storage_capacity": "15 TB",
    "host_storage_type": "NVMe SSD",
    "hw_notes": "",
    "informal_model": "ssd-resnet34",
    "input_data_types": "int8",
    "key.accuracy": "characteristics.mAP",
    "max_async_queries": 0,
    "max_duration (ms)": 0,
    "max_query_count": 0,
    "min_duration (ms)": 600000,
    "min_query_count": 270336,
    "mlperf_version": 1.0,
    "normalize_cores": 8,
    "normalize_processors": 8,
    "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/closed/Inspur/code",
    "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/closed/Inspur/results/NF5488A5_LIQUID_A100-SXM-80GBx8_TRT",
    "number_of_nodes": 1,
    "operating_system": "Ubuntu 18.04.2",
    "other_software_stack": "TensorRT 7.2, CUDA 11.2, cuDNN 8.0.2, DALI 0.25.0, Triton 20.09",
    "performance_issue_same": 0,
    "performance_issue_same_index": 0,
    "performance_issue_unique": 0,
    "performance_sample_count": 64,
    "print_timestamps": 0,
    "problem": false,
    "qsl_rng_seed": 7322528924094909334,
    "retraining": "N",
    "sample_index_rng_seed": 1570999273408051088,
    "samples_per_query": 1,
    "schedule_rng_seed": 3507442325620259414,
    "starting_weights_filename": "resnet34-ssd1200.pytorch",
    "status": "Preview",
    "submitter": "Inspur",
    "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Inspur",
    "sw_notes": "",
    "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/NF5488A5_LIQUID_A100-SXM-80GBx8_TRT",
    "system_name": "NF5488A5 (Liquid cooling)",
    "system_type": "datacenter",
    "target_latency (ns)": 100000000,
    "target_qps": 8050,
    "task": "object detection",
    "task2": "object detection",
    "total_cores": 128,
    "uid": "17b34f140c495280",
    "use_accelerator": true,
    "weight_data_types": "int8",
    "weight_transformations": "quantization, affine fusion"
  },
  {
    "50.00 percentile latency (ns)": 35060928,
    "90.00 percentile latency (ns)": 56733440,
    "95.00 percentile latency (ns)": 62876345,
    "97.00 percentile latency (ns)": 66655276,
    "99.00 percentile latency (ns)": 73544980,
    "99.90 percentile latency (ns)": 86065354,
    "Completed samples per second": 6501.0,
    "Max latency (ns)": 97825208,
    "Mean latency (ns)": 38236987,
    "Min duration satisfied": "Yes",
    "Min latency (ns)": 16955325,
    "Min queries satisfied": "Yes",
    "Mode": "PerformanceOnly",
    "Performance constraints satisfied": "Yes",
    "Result is": "VALID",
    "SUT name": "LWIS_Server",
    "Scenario": "server",
    "Scheduled samples per second": 6501.45,
    "accelerator_frequency": "",
    "accelerator_host_interconnect": "",
    "accelerator_interconnect": "",
    "accelerator_interconnect_topology": "",
    "accelerator_memory_capacity": "40GB",
    "accelerator_memory_configuration": "HBM2",
    "accelerator_model_name": "NVIDIA A100-PCIe",
    "accelerator_on-chip_memories": "",
    "accelerators_per_node": 8,
    "accuracy_log_probability": 0,
    "accuracy_log_rng_seed": 0,
    "accuracy_log_sampling_target": 0,
    "characteristics.mAP": 20.111,
    "characteristics.scheduled_queries_per_second": 6501.45,
    "characteristics.scheduled_queries_per_second.normalized_per_core": 812.68125,
    "characteristics.scheduled_queries_per_second.normalized_per_processor": 812.68125,
    "ck_system": "NF5468M6_A100-PCIex8_TRT",
    "ck_used": true,
    "cooling": "",
    "dataset": "COCO 2017 (300x300)",
    "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/coco2017.md",
    "dim_x_default": "characteristics.scheduled_queries_per_second",
    "dim_y_default": "characteristics.mAP",
    "dim_y_maximize": true,
    "division": "closed",
    "formal_model": "ssd-mobilenet",
    "formal_model_accuracy": 99.0,
    "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package",
    "framework": "TensorRT 7.2, CUDA 11.1",
    "host_memory_capacity": "2 TB",
    "host_memory_configuration": "",
    "host_networking": "",
    "host_networking_topology": "",
    "host_processor_caches": "",
    "host_processor_core_count": 120,
    "host_processor_frequency": "",
    "host_processor_interconnect": "",
    "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor",
    "host_processors_per_node": 2,
    "host_storage_capacity": "15 TB",
    "host_storage_type": "NVMe SSD",
    "hw_notes": "",
    "informal_model": "ssd-resnet34",
    "input_data_types": "int8",
    "key.accuracy": "characteristics.mAP",
    "max_async_queries": 0,
    "max_duration (ms)": 0,
    "max_query_count": 0,
    "min_duration (ms)": 600000,
    "min_query_count": 270336,
    "mlperf_version": 1.0,
    "normalize_cores": 8,
    "normalize_processors": 8,
    "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/closed/Inspur/code",
    "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/closed/Inspur/results/NF5468M6_A100-PCIex8_TRT",
    "number_of_nodes": 1,
    "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)",
    "other_software_stack": "TensorRT 7.2, CUDA 11.1, cuDNN 8.0.2, DALI 0.25.0, Triton 20.09; GCC 7.5.0; Python 3.7.10",
    "performance_issue_same": 0,
    "performance_issue_same_index": 0,
    "performance_issue_unique": 0,
    "performance_sample_count": 64,
    "print_timestamps": 0,
    "problem": false,
    "qsl_rng_seed": 7322528924094909334,
    "retraining": "N",
    "sample_index_rng_seed": 1570999273408051088,
    "samples_per_query": 1,
    "schedule_rng_seed": 3507442325620259414,
    "starting_weights_filename": "resnet34-ssd1200.pytorch",
    "status": "Preview",
    "submitter": "Inspur",
    "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Inspur",
    "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)",
    "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/NF5468M6_A100-PCIex8_TRT",
    "system_name": "Microsoft Corporation 7.0 (Virtual Machine)",
    "system_type": "datacenter",
    "target_latency (ns)": 100000000,
    "target_qps": 6500,
    "task": "object detection",
    "task2": "object detection",
    "total_cores": 240,
    "uid": "783a2f4314c88b08",
    "use_accelerator": true,
    "weight_data_types": "int8",
    "weight_transformations": "quantization, affine fusion"
  },
  {
    "50.00 percentile latency (ns)": 50969655,
    "90.00 percentile latency (ns)": 73407854,
    "95.00 percentile latency (ns)": 81200844,
    "97.00 percentile latency (ns)": 87106116,
    "99.00 percentile latency (ns)": 94979773,
    "99.90 percentile latency (ns)": 103436553,
    "Completed samples per second": 7733.98,
    "Max latency (ns)": 110858018,
    "Mean latency (ns)": 51061596,
    "Min duration satisfied": "Yes",
    "Min latency (ns)": 16654703,
    "Min queries satisfied": "Yes",
    "Mode": "PerformanceOnly",
    "Performance constraints satisfied": "Yes",
    "Result is": "VALID",
    "SUT name": "LWIS_Server",
    "Scenario": "server",
    "Scheduled samples per second": 7734.85,
    "accelerator_frequency": "",
    "accelerator_host_interconnect": "",
    "accelerator_interconnect": "",
    "accelerator_interconnect_topology": "",
    "accelerator_memory_capacity": "80GB",
    "accelerator_memory_configuration": "HBM2",
    "accelerator_model_name": "NVIDIA A100-SXM-80GB",
    "accelerator_on-chip_memories": "",
    "accelerators_per_node": 8,
    "accuracy_log_probability": 0,
    "accuracy_log_rng_seed": 0,
    "accuracy_log_sampling_target": 0,
    "characteristics.mAP": 20.111,
    "characteristics.scheduled_queries_per_second": 7734.85,
    "characteristics.scheduled_queries_per_second.normalized_per_core": 966.85625,
    "characteristics.scheduled_queries_per_second.normalized_per_processor": 966.85625,
    "ck_system": "NF5488A5_A100-SXM-80GBx8_TRT",
    "ck_used": false,
    "cooling": "",
    "dataset": "COCO 2017 (300x300)",
    "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/coco2017.md",
    "dim_x_default": "characteristics.scheduled_queries_per_second",
    "dim_y_default": "characteristics.mAP",
    "dim_y_maximize": true,
    "division": "closed",
    "formal_model": "ssd-mobilenet",
    "formal_model_accuracy": 99.0,
    "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package",
    "framework": "TensorRT 7.2, CUDA 11.2",
    "host_memory_capacity": "1 TB",
    "host_memory_configuration": "",
    "host_networking": "",
    "host_networking_topology": "",
    "host_processor_caches": "",
    "host_processor_core_count": 64,
    "host_processor_frequency": "",
    "host_processor_interconnect": "",
    "host_processor_model_name": "AMD EPYC 7742",
    "host_processors_per_node": 2,
    "host_storage_capacity": "12 TB",
    "host_storage_type": "NVMe SSD",
    "hw_notes": "",
    "informal_model": "ssd-resnet34",
    "input_data_types": "int8",
    "key.accuracy": "characteristics.mAP",
    "max_async_queries": 0,
    "max_duration (ms)": 0,
    "max_query_count": 0,
    "min_duration (ms)": 600000,
    "min_query_count": 270336,
    "mlperf_version": 1.0,
    "normalize_cores": 8,
    "normalize_processors": 8,
    "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/closed/Inspur/code",
    "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/closed/Inspur/results/NF5488A5_A100-SXM-80GBx8_TRT",
    "number_of_nodes": 1,
    "operating_system": "Ubuntu 18.04.2",
    "other_software_stack": "TensorRT 7.2, CUDA 11.2, cuDNN 8.0.2, DALI 0.25.0, Triton 20.09",
    "performance_issue_same": 0,
    "performance_issue_same_index": 0,
    "performance_issue_unique": 0,
    "performance_sample_count": 64,
    "print_timestamps": 0,
    "problem": false,
    "qsl_rng_seed": 7322528924094909334,
    "retraining": "N",
    "sample_index_rng_seed": 1570999273408051088,
    "samples_per_query": 1,
    "schedule_rng_seed": 3507442325620259414,
    "starting_weights_filename": "resnet34-ssd1200.pytorch",
    "status": "available",
    "submitter": "Inspur",
    "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Inspur",
    "sw_notes": "",
    "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/NF5488A5_A100-SXM-80GBx8_TRT",
    "system_name": "NF5488A5",
    "system_type": "datacenter",
    "target_latency (ns)": 100000000,
    "target_qps": 7730,
    "task": "object detection",
    "task2": "object detection",
    "total_cores": 128,
    "uid": "9f8fc642498581e9",
    "use_accelerator": true,
    "weight_data_types": "int8",
    "weight_transformations": "quantization, affine fusion"
  },
  {
    "50.00 percentile latency (ns)": 30142783,
    "90.00 percentile latency (ns)": 63920615,
    "95.00 percentile latency (ns)": 71738335,
    "97.00 percentile latency (ns)": 77817616,
    "99.00 percentile latency (ns)": 84880678,
    "99.90 percentile latency (ns)": 92221013,
    "Completed samples per second": 7540.67,
    "Max latency (ns)": 96002142,
    "Mean latency (ns)": 35173416,
    "Min duration satisfied": "Yes",
    "Min latency (ns)": 16801797,
    "Min queries satisfied": "Yes",
    "Mode": "Performance",
    "Performance constraints satisfied": "Yes",
    "Result is": "VALID",
    "SUT name": "LWIS_Server",
    "Scenario": "server",
    "Scheduled samples per second": 7546.07,
    "accelerator_frequency": "1410MHz",
    "accelerator_host_interconnect": "PCIe Gen4 64 GB/s",
    "accelerator_interconnect": "NVLink 600 GB/s",
    "accelerator_interconnect_topology": "Mesh",
    "accelerator_memory_capacity": "40GB",
    "accelerator_memory_configuration": "HBM2",
    "accelerator_model_name": "NVIDIA A100-SXM4",
    "accelerator_on-chip_memories": "L1: 108x192KB, L2: 40MB per chip",
    "accelerators_per_node": 8,
    "accuracy_log_probability": 0,
    "accuracy_log_rng_seed": 0,
    "accuracy_log_sampling_target": 0,
    "characteristics.mAP": 20.111,
    "characteristics.scheduled_queries_per_second": 7546.07,
    "characteristics.scheduled_queries_per_second.normalized_per_core": 943.25875,
    "characteristics.scheduled_queries_per_second.normalized_per_processor": 943.25875,
    "ck_system": "DGX-A100_A100-SXM4x8_TRT",
    "ck_used": false,
    "cooling": "Air-cooled",
    "dataset": "COCO 2017 (300x300)",
    "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/coco2017.md",
    "dim_x_default": "characteristics.scheduled_queries_per_second",
    "dim_y_default": "characteristics.mAP",
    "dim_y_maximize": true,
    "division": "closed",
    "formal_model": "ssd-mobilenet",
    "formal_model_accuracy": 99.0,
    "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package",
    "framework": "TensorRT 7.2, CUDA 11.0.221",
    "host_memory_capacity": "1 TB",
    "host_memory_configuration": "16 x 64GB DDR4 2933 MT/s",
    "host_networking": "",
    "host_networking_topology": "",
    "host_processor_caches": "L1: 32KB I + 32KB D per core, L2: 512KB per core, L3: 256MB per chip",
    "host_processor_core_count": 64,
    "host_processor_frequency": "2.25GHz",
    "host_processor_interconnect": "4x 16GT/s xGMI",
    "host_processor_model_name": "AMD EPYC 7742",
    "host_processors_per_node": 2,
    "host_storage_capacity": "11.7TB + 445.7GB",
    "host_storage_type": "SSD",
    "hw_notes": "",
    "informal_model": "ssd-resnet34",
    "input_data_types": "int8",
    "key.accuracy": "characteristics.mAP",
    "max_async_queries": 0,
    "max_duration (ms)": 0,
    "max_query_count": 0,
    "min_duration (ms)": 60000,
    "min_query_count": 270336,
    "mlperf_version": 0.7,
    "normalize_cores": 8,
    "normalize_processors": 8,
    "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/closed/Inspur/code",
    "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/closed/Inspur/results/DGX-A100_A100-SXM4x8_TRT",
    "number_of_nodes": 1,
    "operating_system": "Ubuntu 18.04.4",
    "other_software_stack": "TensorRT 7.2, CUDA 11.0.221, cuDNN 8.0.2",
    "performance_issue_same": true,
    "performance_issue_same_index": 0,
    "performance_issue_unique": true,
    "performance_sample_count": 64,
    "print_timestamps": true,
    "problem": false,
    "qsl_rng_seed": 12786827339337101903,
    "retraining": "N",
    "sample_index_rng_seed": 12640797754436136668,
    "samples_per_query": 1,
    "schedule_rng_seed": 3135815929913719677,
    "starting_weights_filename": "resnet34-ssd1200.pytorch",
    "status": "on-premise",
    "submitter": "Inspur",
    "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Inspur",
    "sw_notes": "",
    "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/DGX-A100_A100-SXM4x8_TRT",
    "system_name": "NF5488A5",
    "system_type": "datacenter",
    "target_latency (ns)": 100000000,
    "target_qps": 7550,
    "task": "object detection",
    "task2": "object detection",
    "total_cores": 128,
    "uid": "4097a6dc546e595a",
    "use_accelerator": true,
    "weight_data_types": "int8,fp16",
    "weight_transformations": "quantization, affine fusion"
  },
  {
    "50.00 percentile latency (ns)": 40591790,
    "90.00 percentile latency (ns)": 65787169,
    "95.00 percentile latency (ns)": 74761718,
    "97.00 percentile latency (ns)": 81195890,
    "99.00 percentile latency (ns)": 92910521,
    "99.90 percentile latency (ns)": 110105958,
    "Completed samples per second": 1048.93,
    "Max latency (ns)": 123270263,
    "Mean latency (ns)": 44561894,
    "Min duration satisfied": "Yes",
    "Min latency (ns)": 22090564,
    "Min queries satisfied": "Yes",
    "Mode": "Performance",
    "Performance constraints satisfied": "Yes",
    "Result is": "VALID",
    "SUT name": "LWIS_Server",
    "Scenario": "server",
    "Scheduled samples per second": 1049.06,
    "accelerator_frequency": "1590MHz",
    "accelerator_host_interconnect": "PCIE",
    "accelerator_interconnect": "PCIE",
    "accelerator_interconnect_topology": "",
    "accelerator_memory_capacity": "16 GB",
    "accelerator_memory_configuration": "GDDR6",
    "accelerator_model_name": "NVIDIA T4",
    "accelerator_on-chip_memories": "",
    "accelerators_per_node": 8,
    "accuracy_log_probability": 0,
    "accuracy_log_rng_seed": 0,
    "accuracy_log_sampling_target": 0,
    "characteristics.mAP": 20.111,
    "characteristics.scheduled_queries_per_second": 1049.06,
    "characteristics.scheduled_queries_per_second.normalized_per_core": 131.1325,
    "characteristics.scheduled_queries_per_second.normalized_per_processor": 131.1325,
    "ck_system": "T4x8_TRT",
    "ck_used": false,
    "cooling": "Air-cooled",
    "dataset": "COCO 2017 (300x300)",
    "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/coco2017.md",
    "dim_x_default": "characteristics.scheduled_queries_per_second",
    "dim_y_default": "characteristics.mAP",
    "dim_y_maximize": true,
    "division": "closed",
    "formal_model": "ssd-mobilenet",
    "formal_model_accuracy": 99.0,
    "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package",
    "framework": "TensorRT 7.2, CUDA V11.0.221",
    "host_memory_capacity": "1.5T",
    "host_memory_configuration": "",
    "host_networking": "",
    "host_networking_topology": "",
    "host_processor_caches": "L1d cache: 32K, L1i cache: 32K, L2 cache: 1024K, L3 cache: 36608K",
    "host_processor_core_count": 24,
    "host_processor_frequency": "2.90GHz",
    "host_processor_interconnect": "",
    "host_processor_model_name": "Intel(R) Xeon(R) Platinum 8268 CPU @ 2.90GHz",
    "host_processors_per_node": 2,
    "host_storage_capacity": "2.9 TB",
    "host_storage_type": "SSD",
    "hw_notes": "ECC off",
    "informal_model": "ssd-resnet34",
    "input_data_types": "int8",
    "key.accuracy": "characteristics.mAP",
    "max_async_queries": 0,
    "max_duration (ms)": 0,
    "max_query_count": 0,
    "min_duration (ms)": 60000,
    "min_query_count": 270336,
    "mlperf_version": 0.7,
    "normalize_cores": 8,
    "normalize_processors": 8,
    "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/closed/Inspur/code",
    "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/closed/Inspur/results/T4x8_TRT",
    "number_of_nodes": 1,
    "operating_system": "Ubuntu 18.04.4",
    "other_software_stack": "TensorRT 7.2, CUDA V11.0.221, cuDNN 8.0.2, DALI 0.25.0",
    "performance_issue_same": true,
    "performance_issue_same_index": 0,
    "performance_issue_unique": true,
    "performance_sample_count": 64,
    "print_timestamps": true,
    "problem": false,
    "qsl_rng_seed": 12786827339337101903,
    "retraining": "N",
    "sample_index_rng_seed": 12640797754436136668,
    "samples_per_query": 1,
    "schedule_rng_seed": 3135815929913719677,
    "starting_weights_filename": "resnet34-ssd1200.pytorch",
    "status": "available",
    "submitter": "Inspur",
    "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Inspur",
    "sw_notes": "",
    "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/T4x8_TRT",
    "system_name": "NF5468M5",
    "system_type": "datacenter",
    "target_latency (ns)": 100000000,
    "target_qps": 1050,
    "task": "object detection",
    "task2": "object detection",
    "total_cores": 48,
    "uid": "f9e659e89b48c498",
    "use_accelerator": true,
    "weight_data_types": "int8,fp16",
    "weight_transformations": "quantization, affine fusion"
  }
]