[ { "50.00 percentile latency (ns)": 1352226, "90.00 percentile latency (ns)": 1490246, "90th percentile latency (ns)": 1490246, "95.00 percentile latency (ns)": 1613261, "97.00 percentile latency (ns)": 1972829, "99.00 percentile latency (ns)": 2908395, "99.90 percentile latency (ns)": 21150298, "Max latency (ns)": 74481020, "Mean latency (ns)": 1462121, "Min duration satisfied": "Yes", "Min latency (ns)": 1166743, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 682.05, "QPS w/o loadgen overhead": 683.94, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 1.490246, "characteristics.90th_percentile_latency_ns": 1490246.0, "characteristics.90th_percentile_latency_s": 0.001490246, "characteristics.90th_percentile_latency_us": 1490.246, "characteristics.accuracy": 44.116, "characteristics.good": 22058, "characteristics.power": 0.031754423776451386, "characteristics.power.normalized_per_core": 0.00026462019813709486, "characteristics.power.normalized_per_processor": 0.031754423776451386, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.25-128-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-0.25-128-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.25_128.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 500, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "894c87afaa46c7e0", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 1797659, "90.00 percentile latency (ns)": 1980312, "90th percentile latency (ns)": 1980312, "95.00 percentile latency (ns)": 2217748, "97.00 percentile latency (ns)": 2738703, "99.00 percentile latency (ns)": 3926381, "99.90 percentile latency (ns)": 24750498, "Max latency (ns)": 79677783, "Mean latency (ns)": 1946044, "Min duration satisfied": "Yes", "Min latency (ns)": 1534979, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 512.4, "QPS w/o loadgen overhead": 513.86, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 1.980312, "characteristics.90th_percentile_latency_ns": 1980312.0, "characteristics.90th_percentile_latency_s": 0.001980312, "characteristics.90th_percentile_latency_us": 1980.312, "characteristics.accuracy": 47.808, "characteristics.good": 23904, "characteristics.power": 0.04418067430524521, "characteristics.power.normalized_per_core": 0.0003681722858770434, "characteristics.power.normalized_per_processor": 0.04418067430524521, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.25-160-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-0.25-160-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.25_160.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 500, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "ae2c542b89f67a57", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 1793200, "90.00 percentile latency (ns)": 2078708, "90th percentile latency (ns)": 2078708, "95.00 percentile latency (ns)": 2604874, "97.00 percentile latency (ns)": 3208292, "99.00 percentile latency (ns)": 5023074, "99.90 percentile latency (ns)": 25801481, "Max latency (ns)": 99697130, "Mean latency (ns)": 1999008, "Min duration satisfied": "Yes", "Min latency (ns)": 1538143, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 498.19, "QPS w/o loadgen overhead": 500.25, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 2.078708, "characteristics.90th_percentile_latency_ns": 2078708.0, "characteristics.90th_percentile_latency_s": 0.002078708, "characteristics.90th_percentile_latency_us": 2078.708, "characteristics.accuracy": 52.446, "characteristics.good": 26223, "characteristics.power": 0.04598345892028677, "characteristics.power.normalized_per_core": 0.00038319549100238975, "characteristics.power.normalized_per_processor": 0.04598345892028677, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-96-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-0.5-96-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.5_96.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "dd5afad93e4dcdba", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 1961159, "90.00 percentile latency (ns)": 2230709, "90th percentile latency (ns)": 2230709, "95.00 percentile latency (ns)": 2512715, "97.00 percentile latency (ns)": 3075935, "99.00 percentile latency (ns)": 4424100, "99.90 percentile latency (ns)": 25260456, "Max latency (ns)": 79646906, "Mean latency (ns)": 2142206, "Min duration satisfied": "Yes", "Min latency (ns)": 1749051, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 465.05, "QPS w/o loadgen overhead": 466.81, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 2.230709, "characteristics.90th_percentile_latency_ns": 2230709.0, "characteristics.90th_percentile_latency_s": 0.002230709, "characteristics.90th_percentile_latency_us": 2230.709, "characteristics.accuracy": 57.918, "characteristics.good": 28959, "characteristics.power": 0.052892413002186195, "characteristics.power.normalized_per_core": 0.00044077010835155163, "characteristics.power.normalized_per_processor": 0.052892413002186195, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.5-128-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-0.5-128-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.5_128.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 500, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "cf74602bfdfc48c2", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 2312751, "90.00 percentile latency (ns)": 2690979, "90th percentile latency (ns)": 2690979, "95.00 percentile latency (ns)": 3341601, "97.00 percentile latency (ns)": 4109281, "99.00 percentile latency (ns)": 6640792, "99.90 percentile latency (ns)": 27254171, "Max latency (ns)": 135076480, "Mean latency (ns)": 2559402, "Min duration satisfied": "Yes", "Min latency (ns)": 1979805, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 388.89, "QPS w/o loadgen overhead": 390.72, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 2.690979, "characteristics.90th_percentile_latency_ns": 2690979.0, "characteristics.90th_percentile_latency_s": 0.002690979, "characteristics.90th_percentile_latency_us": 2690.979, "characteristics.accuracy": 58.402, "characteristics.good": 29201, "characteristics.power": 0.059463551778375, "characteristics.power.normalized_per_core": 0.000495529598153125, "characteristics.power.normalized_per_processor": 0.059463551778375, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-128-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-0.5-128-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.5_128.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "268f3245a4789b1d", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 2700409, "90.00 percentile latency (ns)": 3094475, "90th percentile latency (ns)": 3094475, "95.00 percentile latency (ns)": 3756230, "97.00 percentile latency (ns)": 4688530, "99.00 percentile latency (ns)": 7412361, "99.90 percentile latency (ns)": 31629666, "Max latency (ns)": 129703256, "Mean latency (ns)": 2986152, "Min duration satisfied": "Yes", "Min latency (ns)": 2375146, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 333.41, "QPS w/o loadgen overhead": 334.88, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 3.094475, "characteristics.90th_percentile_latency_ns": 3094475.0, "characteristics.90th_percentile_latency_s": 0.003094475, "characteristics.90th_percentile_latency_us": 3094.475, "characteristics.accuracy": 59.822, "characteristics.good": 29911, "characteristics.power": 0.06978711151901237, "characteristics.power.normalized_per_core": 0.0005815592626584365, "characteristics.power.normalized_per_processor": 0.06978711151901237, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-96-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-0.75-96-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.75_96.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "1b89af5c5d598997", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 2825661, "90.00 percentile latency (ns)": 3094634, "90th percentile latency (ns)": 3094634, "95.00 percentile latency (ns)": 3338741, "97.00 percentile latency (ns)": 4025266, "99.00 percentile latency (ns)": 6713771, "99.90 percentile latency (ns)": 30102933, "Max latency (ns)": 88748386, "Mean latency (ns)": 3032182, "Min duration satisfied": "Yes", "Min latency (ns)": 2574322, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 328.37, "QPS w/o loadgen overhead": 329.8, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 3.094634, "characteristics.90th_percentile_latency_ns": 3094634.0, "characteristics.90th_percentile_latency_s": 0.003094634, "characteristics.90th_percentile_latency_us": 3094.634, "characteristics.accuracy": 60.842, "characteristics.good": 30421, "characteristics.power": 0.07566949172328459, "characteristics.power.normalized_per_core": 0.0006305790976940382, "characteristics.power.normalized_per_processor": 0.07566949172328459, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.5-160-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-0.5-160-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.5_160.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 200, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "a47328cde011d0dd", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 3073165, "90.00 percentile latency (ns)": 3740908, "90th percentile latency (ns)": 3740908, "95.00 percentile latency (ns)": 4767984, "97.00 percentile latency (ns)": 5522192, "99.00 percentile latency (ns)": 8243549, "99.90 percentile latency (ns)": 39900496, "Max latency (ns)": 80866685, "Mean latency (ns)": 3405683, "Min duration satisfied": "Yes", "Min latency (ns)": 2764482, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 292.48, "QPS w/o loadgen overhead": 293.63, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 3.740908, "characteristics.90th_percentile_latency_ns": 3740908.0, "characteristics.90th_percentile_latency_s": 0.003740908, "characteristics.90th_percentile_latency_us": 3740.908, "characteristics.accuracy": 63.716, "characteristics.good": 31858, "characteristics.power": 0.08846718431420815, "characteristics.power.normalized_per_core": 0.0007372265359517346, "characteristics.power.normalized_per_processor": 0.08846718431420815, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.75-128-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-0.75-128-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.75_128.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 200, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "3519eedc512975fe", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 4190750, "90.00 percentile latency (ns)": 4911710, "90th percentile latency (ns)": 4911710, "95.00 percentile latency (ns)": 5879947, "97.00 percentile latency (ns)": 7038303, "99.00 percentile latency (ns)": 10796201, "99.90 percentile latency (ns)": 48957002, "Max latency (ns)": 115493842, "Mean latency (ns)": 4571596, "Min duration satisfied": "Yes", "Min latency (ns)": 3687015, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 217.88, "QPS w/o loadgen overhead": 218.74, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 4.91171, "characteristics.90th_percentile_latency_ns": 4911710.0, "characteristics.90th_percentile_latency_s": 0.00491171, "characteristics.90th_percentile_latency_us": 4911.71, "characteristics.accuracy": 66.216, "characteristics.good": 33108, "characteristics.power": 0.10671707552149078, "characteristics.power.normalized_per_core": 0.0008893089626790898, "characteristics.power.normalized_per_processor": 0.10671707552149078, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-small_224_0.75_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v3-small_224_0.75_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-small_224_0.75_float.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 166.667, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "f074e9ba8f508a41", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 4619376, "90.00 percentile latency (ns)": 5305251, "90th percentile latency (ns)": 5305251, "95.00 percentile latency (ns)": 6239929, "97.00 percentile latency (ns)": 7514482, "99.00 percentile latency (ns)": 11782674, "99.90 percentile latency (ns)": 52385660, "Max latency (ns)": 114098887, "Mean latency (ns)": 5022017, "Min duration satisfied": "Yes", "Min latency (ns)": 4153645, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 198.35, "QPS w/o loadgen overhead": 199.12, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 5.305251, "characteristics.90th_percentile_latency_ns": 5305251.0, "characteristics.90th_percentile_latency_s": 0.005305251, "characteristics.90th_percentile_latency_us": 5305.251, "characteristics.accuracy": 68.336, "characteristics.good": 34168, "characteristics.power": 0.11993390404743177, "characteristics.power.normalized_per_core": 0.0009994492003952647, "characteristics.power.normalized_per_processor": 0.11993390404743177, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-small_224_1.0_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v3-small_224_1.0_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-small_224_1.0_float.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 166.667, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "a38a7744dc38f27e", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 4726689, "90.00 percentile latency (ns)": 6070641, "90th percentile latency (ns)": 6070641, "95.00 percentile latency (ns)": 7117619, "97.00 percentile latency (ns)": 8207291, "99.00 percentile latency (ns)": 11350114, "99.90 percentile latency (ns)": 27219152, "Max latency (ns)": 122064324, "Mean latency (ns)": 5174687, "Min duration satisfied": "Yes", "Min latency (ns)": 4133674, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 192.67, "QPS w/o loadgen overhead": 193.25, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 6.070641, "characteristics.90th_percentile_latency_ns": 6070641.0, "characteristics.90th_percentile_latency_s": 0.006070641, "characteristics.90th_percentile_latency_us": 6070.641, "characteristics.accuracy": 68.336, "characteristics.good": 34168, "characteristics.power": 0.12228502325195159, "characteristics.power.normalized_per_core": 0.015285627906493949, "characteristics.power.normalized_per_processor": 0.12228502325195159, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-small_224_1.0_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v3-small_224_1.0_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-small_224_1.0_float.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 142.857, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "08af2a22a14371a6", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 5749243, "90.00 percentile latency (ns)": 6680630, "90th percentile latency (ns)": 6680630, "95.00 percentile latency (ns)": 7778289, "97.00 percentile latency (ns)": 9178566, "99.00 percentile latency (ns)": 13542223, "99.90 percentile latency (ns)": 67815831, "Max latency (ns)": 129020392, "Mean latency (ns)": 6237201, "Min duration satisfied": "Yes", "Min latency (ns)": 5069019, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 159.86, "QPS w/o loadgen overhead": 160.33, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 6.68063, "characteristics.90th_percentile_latency_ns": 6680630.0, "characteristics.90th_percentile_latency_s": 0.00668063, "characteristics.90th_percentile_latency_us": 6680.63, "characteristics.accuracy": 69.016, "characteristics.good": 34508, "characteristics.power": 0.1592659201801576, "characteristics.power.normalized_per_core": 0.0013272160015013132, "characteristics.power.normalized_per_processor": 0.1592659201801576, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-160-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-1.0-160-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_1.0_160.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "f384e48d498ab40b", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 6883796, "90.00 percentile latency (ns)": 8377014, "90th percentile latency (ns)": 8377014, "95.00 percentile latency (ns)": 10224424, "97.00 percentile latency (ns)": 12021752, "99.00 percentile latency (ns)": 16800749, "99.90 percentile latency (ns)": 65809241, "Max latency (ns)": 85384163, "Mean latency (ns)": 7544478, "Min duration satisfied": "Yes", "Min latency (ns)": 6297145, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 132.24, "QPS w/o loadgen overhead": 132.55, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 8.377014, "characteristics.90th_percentile_latency_ns": 8377014.0, "characteristics.90th_percentile_latency_s": 0.008377014, "characteristics.90th_percentile_latency_us": 8377.014, "characteristics.accuracy": 69.106, "characteristics.good": 34553, "characteristics.power": 0.19748860691852427, "characteristics.power.normalized_per_core": 0.0016457383909877022, "characteristics.power.normalized_per_processor": 0.19748860691852427, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-1.0-160-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-1.0-160-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_1.0_160.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 200, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "06f9bb8477fb082b", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 7446929, "90.00 percentile latency (ns)": 9102716, "90th percentile latency (ns)": 9102716, "95.00 percentile latency (ns)": 11797846, "97.00 percentile latency (ns)": 13773039, "99.00 percentile latency (ns)": 18643532, "99.90 percentile latency (ns)": 78123440, "Max latency (ns)": 124748973, "Mean latency (ns)": 8213634, "Min duration satisfied": "Yes", "Min latency (ns)": 6851446, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 121.43, "QPS w/o loadgen overhead": 121.75, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 9.102716, "characteristics.90th_percentile_latency_ns": 9102716.0, "characteristics.90th_percentile_latency_s": 0.009102716, "characteristics.90th_percentile_latency_us": 9102.716, "characteristics.accuracy": 72.678, "characteristics.good": 36339, "characteristics.power": 0.2078457289839437, "characteristics.power.normalized_per_core": 0.0017320477415328642, "characteristics.power.normalized_per_processor": 0.2078457289839437, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-large-minimalistic_224_1.0_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v3-large-minimalistic_224_1.0_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-large-minimalistic_224_1.0_float.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 166.667, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "f5ad4433413444fd", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 7663810, "90.00 percentile latency (ns)": 9368466, "90th percentile latency (ns)": 9368466, "95.00 percentile latency (ns)": 11834601, "97.00 percentile latency (ns)": 13890645, "99.00 percentile latency (ns)": 19110465, "99.90 percentile latency (ns)": 79740440, "Max latency (ns)": 125161946, "Mean latency (ns)": 8408980, "Min duration satisfied": "Yes", "Min latency (ns)": 7076032, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 118.68, "QPS w/o loadgen overhead": 118.92, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 9.368466, "characteristics.90th_percentile_latency_ns": 9368466.0, "characteristics.90th_percentile_latency_s": 0.009368466, "characteristics.90th_percentile_latency_us": 9368.466, "characteristics.accuracy": 73.724, "characteristics.good": 36862, "characteristics.power": 0.20973861826638668, "characteristics.power.normalized_per_core": 0.0017478218188865557, "characteristics.power.normalized_per_processor": 0.20973861826638668, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-large_224_0.75_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v3-large_224_0.75_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-large_224_0.75_float.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 166.667, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "0a0453d8af8a9b45", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 8329839, "90.00 percentile latency (ns)": 10870741, "90th percentile latency (ns)": 10870741, "95.00 percentile latency (ns)": 13082354, "97.00 percentile latency (ns)": 14579438, "99.00 percentile latency (ns)": 17455318, "99.90 percentile latency (ns)": 35811343, "Max latency (ns)": 116077835, "Mean latency (ns)": 9040099, "Min duration satisfied": "Yes", "Min latency (ns)": 7282705, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 110.41, "QPS w/o loadgen overhead": 110.62, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 10.870741, "characteristics.90th_percentile_latency_ns": 10870741.0, "characteristics.90th_percentile_latency_s": 0.010870741, "characteristics.90th_percentile_latency_us": 10870.741, "characteristics.accuracy": 73.724, "characteristics.good": 36862, "characteristics.power": 0.22525088761683926, "characteristics.power.normalized_per_core": 0.028156360952104907, "characteristics.power.normalized_per_processor": 0.22525088761683926, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-large_224_0.75_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v3-large_224_0.75_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-large_224_0.75_float.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 83.3333, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "3941858e66b2e472", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 9259048, "90.00 percentile latency (ns)": 11655958, "90th percentile latency (ns)": 11655958, "95.00 percentile latency (ns)": 14440246, "97.00 percentile latency (ns)": 16079392, "99.00 percentile latency (ns)": 24294201, "99.90 percentile latency (ns)": 84365622, "Max latency (ns)": 123385970, "Mean latency (ns)": 10177933, "Min duration satisfied": "Yes", "Min latency (ns)": 8653804, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 98.09, "QPS w/o loadgen overhead": 98.25, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 11.655958, "characteristics.90th_percentile_latency_ns": 11655958.0, "characteristics.90th_percentile_latency_s": 0.011655958, "characteristics.90th_percentile_latency_us": 11655.958, "characteristics.accuracy": 75.76, "characteristics.good": 37880, "characteristics.power": 0.2562544326195942, "characteristics.power.normalized_per_core": 0.0021354536051632848, "characteristics.power.normalized_per_processor": 0.2562544326195942, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-large_224_1.0_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v3-large_224_1.0_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-large_224_1.0_float.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 166.667, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "b478bb49d131fcc6", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 10797839, "90.00 percentile latency (ns)": 15940268, "90th percentile latency (ns)": 15940268, "95.00 percentile latency (ns)": 17383854, "97.00 percentile latency (ns)": 18298840, "99.00 percentile latency (ns)": 22575078, "99.90 percentile latency (ns)": 40797362, "Max latency (ns)": 142581766, "Mean latency (ns)": 11984913, "Min duration satisfied": "Yes", "Min latency (ns)": 8960269, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 83.32, "QPS w/o loadgen overhead": 83.44, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 15.940268, "characteristics.90th_percentile_latency_ns": 15940268.0, "characteristics.90th_percentile_latency_s": 0.015940268, "characteristics.90th_percentile_latency_us": 15940.268, "characteristics.accuracy": 75.76, "characteristics.good": 37880, "characteristics.power": 0.30112926675676444, "characteristics.power.normalized_per_core": 0.037641158344595554, "characteristics.power.normalized_per_processor": 0.30112926675676444, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-large_224_1.0_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v3-large_224_1.0_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-large_224_1.0_float.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 76.9231, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "14f6b900d0244ebc", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 16788660, "90.00 percentile latency (ns)": 21488871, "90th percentile latency (ns)": 21488871, "95.00 percentile latency (ns)": 23942219, "97.00 percentile latency (ns)": 24711608, "99.00 percentile latency (ns)": 33368065, "99.90 percentile latency (ns)": 83772813, "Max latency (ns)": 129348687, "Mean latency (ns)": 17594625, "Min duration satisfied": "Yes", "Min latency (ns)": 14104111, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 56.77, "QPS w/o loadgen overhead": 56.84, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 21.488871, "characteristics.90th_percentile_latency_ns": 21488871.0, "characteristics.90th_percentile_latency_s": 0.021488871, "characteristics.90th_percentile_latency_us": 21488.871, "characteristics.accuracy": 76.642, "characteristics.good": 38321, "characteristics.power": 0.4705830893862166, "characteristics.power.normalized_per_core": 0.003921525744885138, "characteristics.power.normalized_per_processor": 0.4705830893862166, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite1-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "efficientnet-lite1-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite1.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 50, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "5f8a4ad99a7b1c38", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 19622143, "90.00 percentile latency (ns)": 26600140, "90th percentile latency (ns)": 26600140, "95.00 percentile latency (ns)": 28258624, "97.00 percentile latency (ns)": 29684798, "99.00 percentile latency (ns)": 35725489, "99.90 percentile latency (ns)": 62252058, "Max latency (ns)": 166883444, "Mean latency (ns)": 21095843, "Min duration satisfied": "Yes", "Min latency (ns)": 14512555, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 47.36, "QPS w/o loadgen overhead": 47.4, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 26.60014, "characteristics.90th_percentile_latency_ns": 26600140.0, "characteristics.90th_percentile_latency_s": 0.02660014, "characteristics.90th_percentile_latency_us": 26600.14, "characteristics.accuracy": 76.642, "characteristics.good": 38321, "characteristics.power": 0.5576905886567809, "characteristics.power.normalized_per_core": 0.06971132358209761, "characteristics.power.normalized_per_processor": 0.5576905886567809, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite1-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "efficientnet-lite1-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite1.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 50, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "953f4e89b4a6da04", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 23427399, "90.00 percentile latency (ns)": 26739832, "90th percentile latency (ns)": 26739832, "95.00 percentile latency (ns)": 28830304, "97.00 percentile latency (ns)": 31265283, "99.00 percentile latency (ns)": 34962493, "99.90 percentile latency (ns)": 40453465, "Max latency (ns)": 46891204, "Mean latency (ns)": 22150857, "Min duration satisfied": "Yes", "Min latency (ns)": 14406313, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 45.11, "QPS w/o loadgen overhead": 45.14, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 26.739832, "characteristics.90th_percentile_latency_ns": 26739832.0, "characteristics.90th_percentile_latency_s": 0.026739832, "characteristics.90th_percentile_latency_us": 26739.832, "characteristics.accuracy": 76.642, "characteristics.good": 38321, "characteristics.power": 0.38791699366981014, "characteristics.power.normalized_per_core": 0.0032326416139150846, "characteristics.power.normalized_per_processor": 0.38791699366981014, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite1-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "efficientnet-lite1-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite1.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 66.6667, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "6c8910ed44661b44", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 20342460, "90.00 percentile latency (ns)": 27726474, "90th percentile latency (ns)": 27726474, "95.00 percentile latency (ns)": 29065095, "97.00 percentile latency (ns)": 30234588, "99.00 percentile latency (ns)": 39332282, "99.90 percentile latency (ns)": 86504020, "Max latency (ns)": 118384094, "Mean latency (ns)": 22009131, "Min duration satisfied": "Yes", "Min latency (ns)": 19306924, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 45.39, "QPS w/o loadgen overhead": 45.44, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 27.726474, "characteristics.90th_percentile_latency_ns": 27726474.0, "characteristics.90th_percentile_latency_s": 0.027726474, "characteristics.90th_percentile_latency_us": 27726.474, "characteristics.accuracy": 77.542, "characteristics.good": 38771, "characteristics.power": 0.6037751021712061, "characteristics.power.normalized_per_core": 0.005031459184760051, "characteristics.power.normalized_per_processor": 0.6037751021712061, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite2-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "efficientnet-lite2-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite2.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 50, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "ef9ba73c5cff8dd1", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 23141503, "90.00 percentile latency (ns)": 31213763, "90th percentile latency (ns)": 31213763, "95.00 percentile latency (ns)": 33347777, "97.00 percentile latency (ns)": 34967082, "99.00 percentile latency (ns)": 40400819, "99.90 percentile latency (ns)": 65093580, "Max latency (ns)": 159535848, "Mean latency (ns)": 24855275, "Min duration satisfied": "Yes", "Min latency (ns)": 19252331, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 40.2, "QPS w/o loadgen overhead": 40.23, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 31.213763, "characteristics.90th_percentile_latency_ns": 31213763.0, "characteristics.90th_percentile_latency_s": 0.031213763, "characteristics.90th_percentile_latency_us": 31213.763, "characteristics.accuracy": 77.542, "characteristics.good": 38771, "characteristics.power": 0.666459757385989, "characteristics.power.normalized_per_core": 0.08330746967324862, "characteristics.power.normalized_per_processor": 0.666459757385989, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite2-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "efficientnet-lite2-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite2.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 40, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "842f898b904795bf", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 30682885, "90.00 percentile latency (ns)": 34792199, "90th percentile latency (ns)": 34792199, "95.00 percentile latency (ns)": 37222849, "97.00 percentile latency (ns)": 39734486, "99.00 percentile latency (ns)": 43286468, "99.90 percentile latency (ns)": 48818565, "Max latency (ns)": 65067644, "Mean latency (ns)": 28829886, "Min duration satisfied": "Yes", "Min latency (ns)": 18089721, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 34.67, "QPS w/o loadgen overhead": 34.69, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 34.792199, "characteristics.90th_percentile_latency_ns": 34792199.0, "characteristics.90th_percentile_latency_s": 0.034792199, "characteristics.90th_percentile_latency_us": 34792.199, "characteristics.accuracy": 77.542, "characteristics.good": 38771, "characteristics.power": 0.516139686898728, "characteristics.power.normalized_per_core": 0.0043011640574894, "characteristics.power.normalized_per_processor": 0.516139686898728, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite2-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "efficientnet-lite2-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite2.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 66.6667, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "d83ed0145c7a6a48", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 31470866, "90.00 percentile latency (ns)": 42720272, "90th percentile latency (ns)": 42720272, "95.00 percentile latency (ns)": 46836714, "97.00 percentile latency (ns)": 48511990, "99.00 percentile latency (ns)": 56649510, "99.90 percentile latency (ns)": 102651561, "Max latency (ns)": 147487515, "Mean latency (ns)": 34598096, "Min duration satisfied": "Yes", "Min latency (ns)": 28584271, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 28.89, "QPS w/o loadgen overhead": 28.9, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 42.720272, "characteristics.90th_percentile_latency_ns": 42720272.0, "characteristics.90th_percentile_latency_s": 0.042720272, "characteristics.90th_percentile_latency_us": 42720.272, "characteristics.accuracy": 79.268, "characteristics.good": 39634, "characteristics.power": 0.958766485155427, "characteristics.power.normalized_per_core": 0.007989720709628558, "characteristics.power.normalized_per_processor": 0.958766485155427, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite3-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "efficientnet-lite3-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite3.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 50, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "90c448fbab575c79", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 37212736, "90.00 percentile latency (ns)": 47939220, "90th percentile latency (ns)": 47939220, "95.00 percentile latency (ns)": 50026309, "97.00 percentile latency (ns)": 51663493, "99.00 percentile latency (ns)": 59581559, "99.90 percentile latency (ns)": 112591195, "Max latency (ns)": 180817905, "Mean latency (ns)": 39322589, "Min duration satisfied": "Yes", "Min latency (ns)": 29585939, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 25.42, "QPS w/o loadgen overhead": 25.43, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 47.93922, "characteristics.90th_percentile_latency_ns": 47939220.0, "characteristics.90th_percentile_latency_s": 0.04793922, "characteristics.90th_percentile_latency_us": 47939.22, "characteristics.accuracy": 79.268, "characteristics.good": 39634, "characteristics.power": 1.0711029627764492, "characteristics.power.normalized_per_core": 0.13388787034705615, "characteristics.power.normalized_per_processor": 1.0711029627764492, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite3-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "efficientnet-lite3-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite3.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 28.5714, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "d1d4ca0b9474c930", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 27083021, "90.00 percentile latency (ns)": 49307993, "90th percentile latency (ns)": 49307993, "95.00 percentile latency (ns)": 51988858, "97.00 percentile latency (ns)": 54509321, "99.00 percentile latency (ns)": 59493648, "99.90 percentile latency (ns)": 66443721, "Max latency (ns)": 84040221, "Mean latency (ns)": 34796353, "Min duration satisfied": "Yes", "Min latency (ns)": 25253254, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 28.72, "QPS w/o loadgen overhead": 28.74, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 49.307993, "characteristics.90th_percentile_latency_ns": 49307993.0, "characteristics.90th_percentile_latency_s": 0.049307993, "characteristics.90th_percentile_latency_us": 49307.993, "characteristics.accuracy": 79.268, "characteristics.good": 39634, "characteristics.power": 0.6955684443717224, "characteristics.power.normalized_per_core": 0.005796403703097686, "characteristics.power.normalized_per_processor": 0.6955684443717224, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite3-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "efficientnet-lite3-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite3.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 66.6667, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "eebf44121a23747c", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 52390715, "90.00 percentile latency (ns)": 67754253, "90th percentile latency (ns)": 67754253, "95.00 percentile latency (ns)": 70348269, "97.00 percentile latency (ns)": 73303283, "99.00 percentile latency (ns)": 82868245, "99.90 percentile latency (ns)": 135484751, "Max latency (ns)": 168887474, "Mean latency (ns)": 56749943, "Min duration satisfied": "Yes", "Min latency (ns)": 48470052, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 17.62, "QPS w/o loadgen overhead": 17.62, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 67.754253, "characteristics.90th_percentile_latency_ns": 67754253.0, "characteristics.90th_percentile_latency_s": 0.067754253, "characteristics.90th_percentile_latency_us": 67754.253, "characteristics.accuracy": 80.676, "characteristics.good": 40338, "characteristics.power": 1.5957546841665073, "characteristics.power.normalized_per_core": 0.013297955701387561, "characteristics.power.normalized_per_processor": 1.5957546841665073, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite4-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "efficientnet-lite4-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite4.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 50, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "2874bef9b97dfa09", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 63751339, "90.00 percentile latency (ns)": 76286615, "90th percentile latency (ns)": 76286615, "95.00 percentile latency (ns)": 80711803, "97.00 percentile latency (ns)": 83761760, "99.00 percentile latency (ns)": 91016661, "99.90 percentile latency (ns)": 171047730, "Max latency (ns)": 201351097, "Mean latency (ns)": 64052072, "Min duration satisfied": "Yes", "Min latency (ns)": 48646093, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 15.61, "QPS w/o loadgen overhead": 15.61, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 76.286615, "characteristics.90th_percentile_latency_ns": 76286615.0, "characteristics.90th_percentile_latency_s": 0.076286615, "characteristics.90th_percentile_latency_us": 76286.615, "characteristics.accuracy": 80.676, "characteristics.good": 40338, "characteristics.power": 1.7779469701414228, "characteristics.power.normalized_per_core": 0.22224337126767785, "characteristics.power.normalized_per_processor": 1.7779469701414228, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite4-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "efficientnet-lite4-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite4.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 15.625, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "4cc28837a2cf0f40", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 42843911, "90.00 percentile latency (ns)": 77314084, "90th percentile latency (ns)": 77314084, "95.00 percentile latency (ns)": 81061939, "97.00 percentile latency (ns)": 83912242, "99.00 percentile latency (ns)": 91711307, "99.90 percentile latency (ns)": 99747516, "Max latency (ns)": 105543697, "Mean latency (ns)": 50065569, "Min duration satisfied": "Yes", "Min latency (ns)": 40976028, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 19.97, "QPS w/o loadgen overhead": 19.97, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 77.314084, "characteristics.90th_percentile_latency_ns": 77314084.0, "characteristics.90th_percentile_latency_s": 0.077314084, "characteristics.90th_percentile_latency_us": 77314.084, "characteristics.accuracy": 80.676, "characteristics.good": 40338, "characteristics.power": 1.105265486356313, "characteristics.power.normalized_per_core": 0.009210545719635942, "characteristics.power.normalized_per_processor": 1.105265486356313, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite4-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "efficientnet-lite4-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite4.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 66.6667, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "784baeb0e09e933b", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 264639122, "90.00 percentile latency (ns)": 285170420, "90th percentile latency (ns)": 285170420, "95.00 percentile latency (ns)": 299276097, "97.00 percentile latency (ns)": 353649016, "99.00 percentile latency (ns)": 418448499, "99.90 percentile latency (ns)": 423447616, "Max latency (ns)": 430766958, "Mean latency (ns)": 274857246, "Min duration satisfied": "Yes", "Min latency (ns)": 261124786, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 3.64, "QPS w/o loadgen overhead": 3.64, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 285.17042, "characteristics.90th_percentile_latency_ns": 285170420.0, "characteristics.90th_percentile_latency_s": 0.28517042, "characteristics.90th_percentile_latency_us": 285170.42, "characteristics.accuracy": 80.676, "characteristics.good": 40338, "characteristics.power": 1.8938073692910153, "characteristics.power.normalized_per_core": 0.015781728077425127, "characteristics.power.normalized_per_processor": 1.8938073692910153, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite4-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "efficientnet-lite4-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite4.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 3.62319, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "f830a9b1ca8aac37", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 330079270, "90.00 percentile latency (ns)": 350427079, "90th percentile latency (ns)": 350427079, "95.00 percentile latency (ns)": 353426040, "97.00 percentile latency (ns)": 357431632, "99.00 percentile latency (ns)": 429357518, "99.90 percentile latency (ns)": 474229017, "Max latency (ns)": 482662101, "Mean latency (ns)": 336223383, "Min duration satisfied": "Yes", "Min latency (ns)": 326448781, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 2.97, "QPS w/o loadgen overhead": 2.97, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 350.427079, "characteristics.90th_percentile_latency_ns": 350427079.0, "characteristics.90th_percentile_latency_s": 0.350427079, "characteristics.90th_percentile_latency_us": 350427.079, "characteristics.accuracy": 80.676, "characteristics.good": 40338, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite4-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "efficientnet-lite4-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite4.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 2.92398, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "d84c1cf52925237c", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 333924933, "90.00 percentile latency (ns)": 352801253, "90th percentile latency (ns)": 352801253, "95.00 percentile latency (ns)": 362539452, "97.00 percentile latency (ns)": 365196629, "99.00 percentile latency (ns)": 374068175, "99.90 percentile latency (ns)": 496080162, "Max latency (ns)": 505116722, "Mean latency (ns)": 341057531, "Min duration satisfied": "Yes", "Min latency (ns)": 328901548, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 2.93, "QPS w/o loadgen overhead": 2.93, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 352.801253, "characteristics.90th_percentile_latency_ns": 352801253.0, "characteristics.90th_percentile_latency_s": 0.352801253, "characteristics.90th_percentile_latency_us": 352801.253, "characteristics.accuracy": 80.676, "characteristics.good": 40338, "characteristics.power": 2.440523948083906, "characteristics.power.normalized_per_core": 0.02033769956736588, "characteristics.power.normalized_per_processor": 2.440523948083906, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite4-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "efficientnet-lite4-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite4.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 2.92398, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "586ad300f50124fd", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 361745630, "90.00 percentile latency (ns)": 362824084, "90th percentile latency (ns)": 362824084, "95.00 percentile latency (ns)": 363577611, "97.00 percentile latency (ns)": 364416736, "99.00 percentile latency (ns)": 365534448, "99.90 percentile latency (ns)": 453861036, "Max latency (ns)": 516532787, "Mean latency (ns)": 362145779, "Min duration satisfied": "Yes", "Min latency (ns)": 360074226, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 2.76, "QPS w/o loadgen overhead": 2.76, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 362.824084, "characteristics.90th_percentile_latency_ns": 362824084.0, "characteristics.90th_percentile_latency_s": 0.362824084, "characteristics.90th_percentile_latency_us": 362824.084, "characteristics.accuracy": 80.676, "characteristics.good": 40338, "characteristics.total": 50000, "ck_system": "firefly-armnn-v21.02-neon", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite4-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "efficientnet-lite4-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite4.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 2.76243, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "a8634abeee3401e7", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 479143617, "90.00 percentile latency (ns)": 481495572, "90th percentile latency (ns)": 481495572, "95.00 percentile latency (ns)": 482713587, "97.00 percentile latency (ns)": 484626298, "99.00 percentile latency (ns)": 489298256, "99.90 percentile latency (ns)": 505017013, "Max latency (ns)": 507408394, "Mean latency (ns)": 479205108, "Min duration satisfied": "Yes", "Min latency (ns)": 463269958, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 2.09, "QPS w/o loadgen overhead": 2.09, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "800 MHz", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "4 GiB (shared with host)", "accelerator_memory_configuration": "-", "accelerator_model_name": "Arm Mali-T860 MP4", "accelerator_on-chip_memories": "-", "accelerators_per_node": 1, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 481.495572, "characteristics.90th_percentile_latency_ns": 481495572.0, "characteristics.90th_percentile_latency_s": 0.481495572, "characteristics.90th_percentile_latency_us": 481495.572, "characteristics.accuracy": 80.676, "characteristics.good": 40338, "characteristics.total": 50000, "ck_system": "firefly-armnn-v21.02-opencl", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite4-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (OpenCL)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "efficientnet-lite4-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 1, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-armnn-v21.02-opencl", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite4.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-armnn-v21.02-opencl", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 2.079, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "ff45c3a080c5f913", "use_accelerator": true, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 493166225, "90.00 percentile latency (ns)": 545062465, "90th percentile latency (ns)": 545062465, "95.00 percentile latency (ns)": 558331316, "97.00 percentile latency (ns)": 563402405, "99.00 percentile latency (ns)": 578899309, "99.90 percentile latency (ns)": 603919584, "Max latency (ns)": 606813127, "Mean latency (ns)": 486407759, "Min duration satisfied": "Yes", "Min latency (ns)": 317799355, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 2.06, "QPS w/o loadgen overhead": 2.06, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 545.062465, "characteristics.90th_percentile_latency_ns": 545062465.0, "characteristics.90th_percentile_latency_s": 0.545062465, "characteristics.90th_percentile_latency_us": 545062.465, "characteristics.accuracy": 80.676, "characteristics.good": 40338, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite4-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "efficientnet-lite4-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite4.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 2.04082, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "237952b68714db67", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 503220677, "90.00 percentile latency (ns)": 554081097, "90th percentile latency (ns)": 554081097, "95.00 percentile latency (ns)": 564939845, "97.00 percentile latency (ns)": 570244085, "99.00 percentile latency (ns)": 581902871, "99.90 percentile latency (ns)": 593908142, "Max latency (ns)": 600536536, "Mean latency (ns)": 497972933, "Min duration satisfied": "Yes", "Min latency (ns)": 318925265, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 2.01, "QPS w/o loadgen overhead": 2.01, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 554.081097, "characteristics.90th_percentile_latency_ns": 554081097.0, "characteristics.90th_percentile_latency_s": 0.554081097, "characteristics.90th_percentile_latency_us": 554081.097, "characteristics.accuracy": 80.676, "characteristics.good": 40338, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite4-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "efficientnet-lite4-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite4.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 2.04082, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "02880a45438743e0", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" } ]