[ { "50.00 percentile latency (ns)": 148086860, "90.00 percentile latency (ns)": 165668909, "90th percentile latency (ns)": 165668909, "95.00 percentile latency (ns)": 173868346, "97.00 percentile latency (ns)": 178224314, "99.00 percentile latency (ns)": 190472178, "99.90 percentile latency (ns)": 206563153, "Max latency (ns)": 221780726, "Mean latency (ns)": 152230093, "Min duration satisfied": "Yes", "Min latency (ns)": 140674572, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 6.57, "QPS w/o loadgen overhead": 6.57, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 165.668909, "characteristics.90th_percentile_latency_ns": 165668909.0, "characteristics.90th_percentile_latency_s": 0.165668909, "characteristics.90th_percentile_latency_us": 165668.909, "characteristics.accuracy": 78.504, "characteristics.good": 39252, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.3.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite4-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.3.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "efficientnet-lite4-quantized", "input_data_types": "uint8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.3.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite4.tar.gz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.3.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 50, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "7484d9692212b533", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 20222343, "90.00 percentile latency (ns)": 24951905, "90th percentile latency (ns)": 24951905, "95.00 percentile latency (ns)": 28925945, "97.00 percentile latency (ns)": 31787068, "99.00 percentile latency (ns)": 39087438, "99.90 percentile latency (ns)": 78464745, "Max latency (ns)": 95929584, "Mean latency (ns)": 21788420, "Min duration satisfied": "Yes", "Min latency (ns)": 19585033, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 45.86, "QPS w/o loadgen overhead": 45.9, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 24.951905, "characteristics.90th_percentile_latency_ns": 24951905.0, "characteristics.90th_percentile_latency_s": 0.024951905, "characteristics.90th_percentile_latency_us": 24951.905, "characteristics.accuracy": 75.068, "characteristics.good": 37534, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.3.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite0-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.3.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "efficientnet-lite0-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.3.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite0.tar.gz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.3.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 50, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "dc83b4cb1b5b3e5e", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 41632101, "90.00 percentile latency (ns)": 58106367, "90th percentile latency (ns)": 58106367, "95.00 percentile latency (ns)": 64013712, "97.00 percentile latency (ns)": 66899061, "99.00 percentile latency (ns)": 77086444, "99.90 percentile latency (ns)": 107417416, "Max latency (ns)": 181683730, "Mean latency (ns)": 45859621, "Min duration satisfied": "Yes", "Min latency (ns)": 39408575, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 21.8, "QPS w/o loadgen overhead": 21.81, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 58.106367, "characteristics.90th_percentile_latency_ns": 58106367.0, "characteristics.90th_percentile_latency_s": 0.058106367, "characteristics.90th_percentile_latency_us": 58106.367, "characteristics.accuracy": 74.022, "characteristics.good": 37011, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.3.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite1-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.3.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "efficientnet-lite1-quantized", "input_data_types": "uint8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.3.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite1.tar.gz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.3.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 50, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "4a99a4443aadc0a1", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 35847680, "90.00 percentile latency (ns)": 45196617, "90th percentile latency (ns)": 45196617, "95.00 percentile latency (ns)": 48908869, "97.00 percentile latency (ns)": 51001596, "99.00 percentile latency (ns)": 58522712, "99.90 percentile latency (ns)": 67820318, "Max latency (ns)": 76415110, "Mean latency (ns)": 38225948, "Min duration satisfied": "Yes", "Min latency (ns)": 34282367, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 26.15, "QPS w/o loadgen overhead": 26.16, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 45.196617, "characteristics.90th_percentile_latency_ns": 45196617.0, "characteristics.90th_percentile_latency_s": 0.045196617, "characteristics.90th_percentile_latency_us": 45196.617, "characteristics.accuracy": 72.9, "characteristics.good": 36450, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.3.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-large_224_1.0_uint8", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.3.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v3-large_224_1.0_uint8", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.3.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-large_224_1.0_uint8.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.3.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 125, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "d43e0a64bc38e91c", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 58978532, "90.00 percentile latency (ns)": 72326317, "90th percentile latency (ns)": 72326317, "95.00 percentile latency (ns)": 76539503, "97.00 percentile latency (ns)": 80146997, "99.00 percentile latency (ns)": 87796408, "99.90 percentile latency (ns)": 95102505, "Max latency (ns)": 105485800, "Mean latency (ns)": 61573907, "Min duration satisfied": "Yes", "Min latency (ns)": 54907593, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 16.24, "QPS w/o loadgen overhead": 16.24, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 72.326317, "characteristics.90th_percentile_latency_ns": 72326317.0, "characteristics.90th_percentile_latency_s": 0.072326317, "characteristics.90th_percentile_latency_us": 72326.317, "characteristics.accuracy": 74.068, "characteristics.good": 37034, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.3.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite2-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.3.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "efficientnet-lite2-quantized", "input_data_types": "uint8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.3.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite2.tar.gz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.3.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 50, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "4226bab02d432e1f", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 29539286, "90.00 percentile latency (ns)": 35360771, "90th percentile latency (ns)": 35360771, "95.00 percentile latency (ns)": 39617160, "97.00 percentile latency (ns)": 44002995, "99.00 percentile latency (ns)": 50493630, "99.90 percentile latency (ns)": 63975438, "Max latency (ns)": 164315790, "Mean latency (ns)": 31183859, "Min duration satisfied": "Yes", "Min latency (ns)": 28357151, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 32.05, "QPS w/o loadgen overhead": 32.07, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 35.360771, "characteristics.90th_percentile_latency_ns": 35360771.0, "characteristics.90th_percentile_latency_s": 0.035360771, "characteristics.90th_percentile_latency_us": 35360.771, "characteristics.accuracy": 76.642, "characteristics.good": 38321, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.3.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite1-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.3.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "efficientnet-lite1-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.3.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite1.tar.gz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.3.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 50, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "b0549cbb80aed739", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 6327466, "90.00 percentile latency (ns)": 7908844, "90th percentile latency (ns)": 7908844, "95.00 percentile latency (ns)": 9372586, "97.00 percentile latency (ns)": 11300346, "99.00 percentile latency (ns)": 15070585, "99.90 percentile latency (ns)": 35135107, "Max latency (ns)": 78783884, "Mean latency (ns)": 6873879, "Min duration satisfied": "Yes", "Min latency (ns)": 5757778, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 145.08, "QPS w/o loadgen overhead": 145.48, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 7.908844, "characteristics.90th_percentile_latency_ns": 7908844.0, "characteristics.90th_percentile_latency_s": 0.007908844, "characteristics.90th_percentile_latency_us": 7908.844, "characteristics.accuracy": 63.33, "characteristics.good": 31665, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.3.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-small-minimalistic_224_1.0_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.3.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v3-small-minimalistic_224_1.0_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.3.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-small-minimalistic_224_1.0_float.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.3.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 125, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "0f41cf495fb79400", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 97506718, "90.00 percentile latency (ns)": 113259554, "90th percentile latency (ns)": 113259554, "95.00 percentile latency (ns)": 122721896, "97.00 percentile latency (ns)": 127113205, "99.00 percentile latency (ns)": 141496133, "99.90 percentile latency (ns)": 180276888, "Max latency (ns)": 255672625, "Mean latency (ns)": 102362712, "Min duration satisfied": "Yes", "Min latency (ns)": 94462620, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 9.77, "QPS w/o loadgen overhead": 9.77, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 113.259554, "characteristics.90th_percentile_latency_ns": 113259554.0, "characteristics.90th_percentile_latency_s": 0.113259554, "characteristics.90th_percentile_latency_us": 113259.554, "characteristics.accuracy": 80.676, "characteristics.good": 40338, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.3.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite4-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.3.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "efficientnet-lite4-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.3.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite4.tar.gz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.3.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 50, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "5ad98d0b43a1aef9", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 17502143, "90.00 percentile latency (ns)": 23585086, "90th percentile latency (ns)": 23585086, "95.00 percentile latency (ns)": 25470573, "97.00 percentile latency (ns)": 28040825, "99.00 percentile latency (ns)": 33824684, "99.90 percentile latency (ns)": 47010165, "Max latency (ns)": 65150799, "Mean latency (ns)": 18988429, "Min duration satisfied": "Yes", "Min latency (ns)": 16001952, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 52.63, "QPS w/o loadgen overhead": 52.66, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 23.585086, "characteristics.90th_percentile_latency_ns": 23585086.0, "characteristics.90th_percentile_latency_s": 0.023585086, "characteristics.90th_percentile_latency_us": 23585.086, "characteristics.accuracy": 70.338, "characteristics.good": 35169, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.3.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-large-minimalistic_224_1.0_uint8", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.3.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v3-large-minimalistic_224_1.0_uint8", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.3.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-large-minimalistic_224_1.0_uint8.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.3.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 125, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "50b6422116f1433a", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 16338158, "90.00 percentile latency (ns)": 21253340, "90th percentile latency (ns)": 21253340, "95.00 percentile latency (ns)": 23423031, "97.00 percentile latency (ns)": 25413163, "99.00 percentile latency (ns)": 33539680, "99.90 percentile latency (ns)": 52412312, "Max latency (ns)": 84448153, "Mean latency (ns)": 17639123, "Min duration satisfied": "Yes", "Min latency (ns)": 15678163, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 56.65, "QPS w/o loadgen overhead": 56.69, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 21.25334, "characteristics.90th_percentile_latency_ns": 21253340.0, "characteristics.90th_percentile_latency_s": 0.02125334, "characteristics.90th_percentile_latency_us": 21253.34, "characteristics.accuracy": 64.418, "characteristics.good": 32209, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.3.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-small_224_1.0_uint8", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.3.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v3-small_224_1.0_uint8", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.3.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-small_224_1.0_uint8.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.3.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 125, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "467a9b026e0c1f1f", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 40957059, "90.00 percentile latency (ns)": 49340966, "90th percentile latency (ns)": 49340966, "95.00 percentile latency (ns)": 56008890, "97.00 percentile latency (ns)": 58485452, "99.00 percentile latency (ns)": 66515422, "99.90 percentile latency (ns)": 77211469, "Max latency (ns)": 78658959, "Mean latency (ns)": 43344965, "Min duration satisfied": "Yes", "Min latency (ns)": 39655463, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 23.06, "QPS w/o loadgen overhead": 23.07, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 49.340966, "characteristics.90th_percentile_latency_ns": 49340966.0, "characteristics.90th_percentile_latency_s": 0.049340966, "characteristics.90th_percentile_latency_us": 49340.966, "characteristics.accuracy": 77.542, "characteristics.good": 38771, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.3.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite2-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.3.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "efficientnet-lite2-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.3.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite2.tar.gz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.3.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 50, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "b4707463a85f8fa5", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 23600511, "90.00 percentile latency (ns)": 28984129, "90th percentile latency (ns)": 28984129, "95.00 percentile latency (ns)": 31835065, "97.00 percentile latency (ns)": 37067956, "99.00 percentile latency (ns)": 44921342, "99.90 percentile latency (ns)": 58894185, "Max latency (ns)": 128687035, "Mean latency (ns)": 25131132, "Min duration satisfied": "Yes", "Min latency (ns)": 22895585, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 39.76, "QPS w/o loadgen overhead": 39.79, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 28.984129, "characteristics.90th_percentile_latency_ns": 28984129.0, "characteristics.90th_percentile_latency_s": 0.028984129, "characteristics.90th_percentile_latency_us": 28984.129, "characteristics.accuracy": 73.724, "characteristics.good": 36862, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.3.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-large_224_0.75_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.3.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v3-large_224_0.75_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.3.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-large_224_0.75_float.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.3.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 125, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "1f4c4b874a4b69f6", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 14655463, "90.00 percentile latency (ns)": 17205362, "90th percentile latency (ns)": 17205362, "95.00 percentile latency (ns)": 20220721, "97.00 percentile latency (ns)": 22246694, "99.00 percentile latency (ns)": 30490368, "99.90 percentile latency (ns)": 54279527, "Max latency (ns)": 66375971, "Mean latency (ns)": 15537731, "Min duration satisfied": "Yes", "Min latency (ns)": 13895943, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 64.26, "QPS w/o loadgen overhead": 64.36, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 17.205362, "characteristics.90th_percentile_latency_ns": 17205362.0, "characteristics.90th_percentile_latency_s": 0.017205362, "characteristics.90th_percentile_latency_us": 17205.362, "characteristics.accuracy": 68.336, "characteristics.good": 34168, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.3.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-small_224_1.0_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.3.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v3-small_224_1.0_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.3.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-small_224_1.0_float.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.3.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 125, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "b07b877921844a2f", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 27611100, "90.00 percentile latency (ns)": 38541909, "90th percentile latency (ns)": 38541909, "95.00 percentile latency (ns)": 42010037, "97.00 percentile latency (ns)": 44896443, "99.00 percentile latency (ns)": 50427706, "99.90 percentile latency (ns)": 59976756, "Max latency (ns)": 63085667, "Mean latency (ns)": 30446814, "Min duration satisfied": "Yes", "Min latency (ns)": 26191642, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 32.83, "QPS w/o loadgen overhead": 32.84, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 38.541909, "characteristics.90th_percentile_latency_ns": 38541909.0, "characteristics.90th_percentile_latency_s": 0.038541909, "characteristics.90th_percentile_latency_us": 38541.909, "characteristics.accuracy": 71.21, "characteristics.good": 35605, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.3.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite0-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.3.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "efficientnet-lite0-quantized", "input_data_types": "uint8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.3.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite0.tar.gz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.3.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 50, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "6229042e9aadeb5d", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 57922422, "90.00 percentile latency (ns)": 68535552, "90th percentile latency (ns)": 68535552, "95.00 percentile latency (ns)": 74074880, "97.00 percentile latency (ns)": 77838894, "99.00 percentile latency (ns)": 82354431, "99.90 percentile latency (ns)": 148132703, "Max latency (ns)": 225386769, "Mean latency (ns)": 60603657, "Min duration satisfied": "Yes", "Min latency (ns)": 56209670, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 16.49, "QPS w/o loadgen overhead": 16.5, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 68.535552, "characteristics.90th_percentile_latency_ns": 68535552.0, "characteristics.90th_percentile_latency_s": 0.068535552, "characteristics.90th_percentile_latency_us": 68535.552, "characteristics.accuracy": 79.268, "characteristics.good": 39634, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.3.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite3-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.3.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "efficientnet-lite3-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.3.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite3.tar.gz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.3.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 50, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "20a593701dc4feda", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 13647549, "90.00 percentile latency (ns)": 16904901, "90th percentile latency (ns)": 16904901, "95.00 percentile latency (ns)": 19688474, "97.00 percentile latency (ns)": 21209498, "99.00 percentile latency (ns)": 31082745, "99.90 percentile latency (ns)": 48630265, "Max latency (ns)": 91770123, "Mean latency (ns)": 14650017, "Min duration satisfied": "Yes", "Min latency (ns)": 12880445, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 68.19, "QPS w/o loadgen overhead": 68.26, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 16.904901, "characteristics.90th_percentile_latency_ns": 16904901.0, "characteristics.90th_percentile_latency_s": 0.016904901, "characteristics.90th_percentile_latency_us": 16904.901, "characteristics.accuracy": 66.216, "characteristics.good": 33108, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.3.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-small_224_0.75_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.3.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v3-small_224_0.75_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.3.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-small_224_0.75_float.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.3.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 125, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "ff7b844f885e3e4d", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 87100987, "90.00 percentile latency (ns)": 99125926, "90th percentile latency (ns)": 99125926, "95.00 percentile latency (ns)": 106335860, "97.00 percentile latency (ns)": 111894036, "99.00 percentile latency (ns)": 119242568, "99.90 percentile latency (ns)": 131003976, "Max latency (ns)": 152704628, "Mean latency (ns)": 90096365, "Min duration satisfied": "Yes", "Min latency (ns)": 81356850, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 11.1, "QPS w/o loadgen overhead": 11.1, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 99.125926, "characteristics.90th_percentile_latency_ns": 99125926.0, "characteristics.90th_percentile_latency_s": 0.099125926, "characteristics.90th_percentile_latency_us": 99125.926, "characteristics.accuracy": 76.374, "characteristics.good": 38187, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.3.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite3-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.3.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "efficientnet-lite3-quantized", "input_data_types": "uint8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.3.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite3.tar.gz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.3.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 50, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "eca1d102b3fa5df0", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 27903572, "90.00 percentile latency (ns)": 33678534, "90th percentile latency (ns)": 33678534, "95.00 percentile latency (ns)": 37825108, "97.00 percentile latency (ns)": 41344776, "99.00 percentile latency (ns)": 48382191, "99.90 percentile latency (ns)": 56350366, "Max latency (ns)": 80168517, "Mean latency (ns)": 29540299, "Min duration satisfied": "Yes", "Min latency (ns)": 27011407, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 33.83, "QPS w/o loadgen overhead": 33.85, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 33.678534, "characteristics.90th_percentile_latency_ns": 33678534.0, "characteristics.90th_percentile_latency_s": 0.033678534, "characteristics.90th_percentile_latency_us": 33678.534, "characteristics.accuracy": 75.76, "characteristics.good": 37880, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.3.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-large_224_1.0_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.3.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v3-large_224_1.0_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.3.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-large_224_1.0_float.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.3.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 125, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "a668180985bce458", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 14591428, "90.00 percentile latency (ns)": 18125722, "90th percentile latency (ns)": 18125722, "95.00 percentile latency (ns)": 21509575, "97.00 percentile latency (ns)": 23979215, "99.00 percentile latency (ns)": 33027051, "99.90 percentile latency (ns)": 58677536, "Max latency (ns)": 119616928, "Mean latency (ns)": 15641153, "Min duration satisfied": "Yes", "Min latency (ns)": 13537592, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 63.86, "QPS w/o loadgen overhead": 63.93, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 18.125722, "characteristics.90th_percentile_latency_ns": 18125722.0, "characteristics.90th_percentile_latency_s": 0.018125722, "characteristics.90th_percentile_latency_us": 18125.722, "characteristics.accuracy": 72.678, "characteristics.good": 36339, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.3.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-large-minimalistic_224_1.0_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.3.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v3-large-minimalistic_224_1.0_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.3.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-large-minimalistic_224_1.0_float.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.3.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 125, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "3c7db85641d494df", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 83210447, "90.00 percentile latency (ns)": 100684968, "90th percentile latency (ns)": 100684968, "95.00 percentile latency (ns)": 103251409, "97.00 percentile latency (ns)": 106101658, "99.00 percentile latency (ns)": 110610036, "99.90 percentile latency (ns)": 115629050, "Max latency (ns)": 115837452, "Mean latency (ns)": 88086049, "Min duration satisfied": "Yes", "Min latency (ns)": 81735204, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 11.34, "QPS w/o loadgen overhead": 11.35, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 100.684968, "characteristics.90th_percentile_latency_ns": 100684968.0, "characteristics.90th_percentile_latency_s": 0.100684968, "characteristics.90th_percentile_latency_us": 100684.968, "characteristics.accuracy": 75.068, "characteristics.good": 37534, "characteristics.total": 50000, "ck_system": "rpi4-armnn-v20.08-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite0-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v20.08 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "https://www.raspberrypi.org/products/raspberry-pi-4-model-b/specifications/", "informal_model": "efficientnet-lite0-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/rpi4-armnn-v20.08-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite0.tar.gz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4-armnn-v20.08-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 20, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "e4a40826bab49d9a", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 215607422, "90.00 percentile latency (ns)": 239934122, "90th percentile latency (ns)": 239934122, "95.00 percentile latency (ns)": 248015010, "97.00 percentile latency (ns)": 254770264, "99.00 percentile latency (ns)": 268426290, "99.90 percentile latency (ns)": 322095703, "Max latency (ns)": 346056983, "Mean latency (ns)": 217388048, "Min duration satisfied": "Yes", "Min latency (ns)": 197405888, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 4.6, "QPS w/o loadgen overhead": 4.6, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 239.934122, "characteristics.90th_percentile_latency_ns": 239934122.0, "characteristics.90th_percentile_latency_s": 0.239934122, "characteristics.90th_percentile_latency_us": 239934.122, "characteristics.accuracy": 60.162, "characteristics.good": 30081, "characteristics.total": 50000, "ck_system": "rpi4-armnn-v20.08-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-large_224_1.0_uint8", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v20.08 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "https://www.raspberrypi.org/products/raspberry-pi-4-model-b/specifications/", "informal_model": "mobilenet-v3-large_224_1.0_uint8", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/rpi4-armnn-v20.08-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-large_224_1.0_uint8.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4-armnn-v20.08-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 20, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "ae63dae45d5904ac", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 24470867, "90.00 percentile latency (ns)": 29284568, "90th percentile latency (ns)": 29284568, "95.00 percentile latency (ns)": 31740122, "97.00 percentile latency (ns)": 33511877, "99.00 percentile latency (ns)": 37203344, "99.90 percentile latency (ns)": 43105872, "Max latency (ns)": 44473359, "Mean latency (ns)": 24643219, "Min duration satisfied": "Yes", "Min latency (ns)": 21498530, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 40.51, "QPS w/o loadgen overhead": 40.58, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 29.284568, "characteristics.90th_percentile_latency_ns": 29284568.0, "characteristics.90th_percentile_latency_s": 0.029284568, "characteristics.90th_percentile_latency_us": 29284.568, "characteristics.accuracy": 63.33, "characteristics.good": 31665, "characteristics.total": 50000, "ck_system": "rpi4-armnn-v20.08-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-small-minimalistic_224_1.0_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v20.08 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "https://www.raspberrypi.org/products/raspberry-pi-4-model-b/specifications/", "informal_model": "mobilenet-v3-small-minimalistic_224_1.0_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/rpi4-armnn-v20.08-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-small-minimalistic_224_1.0_float.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4-armnn-v20.08-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 40, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "c24a39724ca5bdd3", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 208693373, "90.00 percentile latency (ns)": 234464160, "90th percentile latency (ns)": 234464160, "95.00 percentile latency (ns)": 244618324, "97.00 percentile latency (ns)": 250338403, "99.00 percentile latency (ns)": 262426043, "99.90 percentile latency (ns)": 297178802, "Max latency (ns)": 320288023, "Mean latency (ns)": 210498890, "Min duration satisfied": "Yes", "Min latency (ns)": 190552185, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 4.75, "QPS w/o loadgen overhead": 4.75, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 234.46416, "characteristics.90th_percentile_latency_ns": 234464160.0, "characteristics.90th_percentile_latency_s": 0.23446416, "characteristics.90th_percentile_latency_us": 234464.16, "characteristics.accuracy": 68.734, "characteristics.good": 34367, "characteristics.total": 50000, "ck_system": "rpi4-armnn-v20.08-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-large-minimalistic_224_1.0_uint8", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v20.08 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "https://www.raspberrypi.org/products/raspberry-pi-4-model-b/specifications/", "informal_model": "mobilenet-v3-large-minimalistic_224_1.0_uint8", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/rpi4-armnn-v20.08-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-large-minimalistic_224_1.0_uint8.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4-armnn-v20.08-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 20, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "581d9c00bf028bda", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 68251476, "90.00 percentile latency (ns)": 94042308, "90th percentile latency (ns)": 94042308, "95.00 percentile latency (ns)": 100997409, "97.00 percentile latency (ns)": 105042805, "99.00 percentile latency (ns)": 112865143, "99.90 percentile latency (ns)": 119409905, "Max latency (ns)": 121411540, "Mean latency (ns)": 75333991, "Min duration satisfied": "Yes", "Min latency (ns)": 67014490, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 13.26, "QPS w/o loadgen overhead": 13.27, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 94.042308, "characteristics.90th_percentile_latency_ns": 94042308.0, "characteristics.90th_percentile_latency_s": 0.094042308, "characteristics.90th_percentile_latency_us": 94042.308, "characteristics.accuracy": 54.864, "characteristics.good": 27432, "characteristics.total": 50000, "ck_system": "rpi4-armnn-v20.08-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-small_224_1.0_uint8", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v20.08 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "https://www.raspberrypi.org/products/raspberry-pi-4-model-b/specifications/", "informal_model": "mobilenet-v3-small_224_1.0_uint8", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/rpi4-armnn-v20.08-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-small_224_1.0_uint8.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4-armnn-v20.08-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 20, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "92cdd497445f8553", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 54162521, "90.00 percentile latency (ns)": 68933853, "90th percentile latency (ns)": 68933853, "95.00 percentile latency (ns)": 73259911, "97.00 percentile latency (ns)": 75958675, "99.00 percentile latency (ns)": 80600817, "99.90 percentile latency (ns)": 84071155, "Max latency (ns)": 95665493, "Mean latency (ns)": 58127112, "Min duration satisfied": "Yes", "Min latency (ns)": 53008181, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 17.18, "QPS w/o loadgen overhead": 17.2, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 68.933853, "characteristics.90th_percentile_latency_ns": 68933853.0, "characteristics.90th_percentile_latency_s": 0.068933853, "characteristics.90th_percentile_latency_us": 68933.853, "characteristics.accuracy": 73.724, "characteristics.good": 36862, "characteristics.total": 50000, "ck_system": "rpi4-armnn-v20.08-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-large_224_0.75_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v20.08 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "https://www.raspberrypi.org/products/raspberry-pi-4-model-b/specifications/", "informal_model": "mobilenet-v3-large_224_0.75_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/rpi4-armnn-v20.08-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-large_224_0.75_float.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4-armnn-v20.08-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 20, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "44b74b7be062e66a", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 29936963, "90.00 percentile latency (ns)": 36092621, "90th percentile latency (ns)": 36092621, "95.00 percentile latency (ns)": 39281818, "97.00 percentile latency (ns)": 41210567, "99.00 percentile latency (ns)": 44275525, "99.90 percentile latency (ns)": 50293409, "Max latency (ns)": 51929703, "Mean latency (ns)": 29968781, "Min duration satisfied": "Yes", "Min latency (ns)": 25321135, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 33.31, "QPS w/o loadgen overhead": 33.37, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 36.092621, "characteristics.90th_percentile_latency_ns": 36092621.0, "characteristics.90th_percentile_latency_s": 0.036092621, "characteristics.90th_percentile_latency_us": 36092.621, "characteristics.accuracy": 68.336, "characteristics.good": 34168, "characteristics.total": 50000, "ck_system": "rpi4-armnn-v20.08-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-small_224_1.0_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v20.08 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "https://www.raspberrypi.org/products/raspberry-pi-4-model-b/specifications/", "informal_model": "mobilenet-v3-small_224_1.0_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/rpi4-armnn-v20.08-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-small_224_1.0_float.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4-armnn-v20.08-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 20, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "40452bafc3a4bbc7", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 429017040, "90.00 percentile latency (ns)": 458605090, "90th percentile latency (ns)": 458605090, "95.00 percentile latency (ns)": 471661954, "97.00 percentile latency (ns)": 478566175, "99.00 percentile latency (ns)": 498463100, "99.90 percentile latency (ns)": 546615963, "Max latency (ns)": 554997038, "Mean latency (ns)": 431263477, "Min duration satisfied": "Yes", "Min latency (ns)": 392388788, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 2.32, "QPS w/o loadgen overhead": 2.32, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 458.60509, "characteristics.90th_percentile_latency_ns": 458605090.0, "characteristics.90th_percentile_latency_s": 0.45860509, "characteristics.90th_percentile_latency_us": 458605.09, "characteristics.accuracy": 70.724, "characteristics.good": 35362, "characteristics.total": 50000, "ck_system": "rpi4-armnn-v20.08-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite0-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v20.08 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "https://www.raspberrypi.org/products/raspberry-pi-4-model-b/specifications/", "informal_model": "efficientnet-lite0-quantized", "input_data_types": "uint8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/rpi4-armnn-v20.08-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite0.tar.gz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4-armnn-v20.08-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 20, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "443ba79d8c48ab26", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 27284671, "90.00 percentile latency (ns)": 32812338, "90th percentile latency (ns)": 32812338, "95.00 percentile latency (ns)": 36139159, "97.00 percentile latency (ns)": 37746189, "99.00 percentile latency (ns)": 40924796, "99.90 percentile latency (ns)": 47332623, "Max latency (ns)": 50216178, "Mean latency (ns)": 27436967, "Min duration satisfied": "Yes", "Min latency (ns)": 23022264, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 36.38, "QPS w/o loadgen overhead": 36.45, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 32.812338, "characteristics.90th_percentile_latency_ns": 32812338.0, "characteristics.90th_percentile_latency_s": 0.032812338, "characteristics.90th_percentile_latency_us": 32812.338, "characteristics.accuracy": 66.216, "characteristics.good": 33108, "characteristics.total": 50000, "ck_system": "rpi4-armnn-v20.08-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-small_224_0.75_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v20.08 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "https://www.raspberrypi.org/products/raspberry-pi-4-model-b/specifications/", "informal_model": "mobilenet-v3-small_224_0.75_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/rpi4-armnn-v20.08-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-small_224_0.75_float.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4-armnn-v20.08-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 20, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "c0762d3414f0090d", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 62696275, "90.00 percentile latency (ns)": 79807655, "90th percentile latency (ns)": 79807655, "95.00 percentile latency (ns)": 83630722, "97.00 percentile latency (ns)": 85573698, "99.00 percentile latency (ns)": 91936149, "99.90 percentile latency (ns)": 102672669, "Max latency (ns)": 109456921, "Mean latency (ns)": 67158415, "Min duration satisfied": "Yes", "Min latency (ns)": 61527260, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 14.88, "QPS w/o loadgen overhead": 14.89, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 79.807655, "characteristics.90th_percentile_latency_ns": 79807655.0, "characteristics.90th_percentile_latency_s": 0.079807655, "characteristics.90th_percentile_latency_us": 79807.655, "characteristics.accuracy": 75.76, "characteristics.good": 37880, "characteristics.total": 50000, "ck_system": "rpi4-armnn-v20.08-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-large_224_1.0_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v20.08 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "https://www.raspberrypi.org/products/raspberry-pi-4-model-b/specifications/", "informal_model": "mobilenet-v3-large_224_1.0_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/rpi4-armnn-v20.08-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-large_224_1.0_float.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4-armnn-v20.08-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 20, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "d6428f87468eb747", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 55186478, "90.00 percentile latency (ns)": 69144998, "90th percentile latency (ns)": 69144998, "95.00 percentile latency (ns)": 72334083, "97.00 percentile latency (ns)": 74251812, "99.00 percentile latency (ns)": 78824827, "99.90 percentile latency (ns)": 85604379, "Max latency (ns)": 87197801, "Mean latency (ns)": 58639268, "Min duration satisfied": "Yes", "Min latency (ns)": 54139153, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 17.04, "QPS w/o loadgen overhead": 17.05, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 69.144998, "characteristics.90th_percentile_latency_ns": 69144998.0, "characteristics.90th_percentile_latency_s": 0.069144998, "characteristics.90th_percentile_latency_us": 69144.998, "characteristics.accuracy": 72.678, "characteristics.good": 36339, "characteristics.total": 50000, "ck_system": "rpi4-armnn-v20.08-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-large-minimalistic_224_1.0_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v20.08 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "https://www.raspberrypi.org/products/raspberry-pi-4-model-b/specifications/", "informal_model": "mobilenet-v3-large-minimalistic_224_1.0_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/rpi4-armnn-v20.08-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-large-minimalistic_224_1.0_float.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4-armnn-v20.08-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 20, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "1aa490b8cd97a021", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 6319313, "90.00 percentile latency (ns)": 8599557, "90th percentile latency (ns)": 8599557, "95.00 percentile latency (ns)": 10511823, "97.00 percentile latency (ns)": 11830532, "99.00 percentile latency (ns)": 17841703, "99.90 percentile latency (ns)": 46011130, "Max latency (ns)": 80249201, "Mean latency (ns)": 7078489, "Min duration satisfied": "Yes", "Min latency (ns)": 5882431, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 140.89, "QPS w/o loadgen overhead": 141.27, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 8.599557, "characteristics.90th_percentile_latency_ns": 8599557.0, "characteristics.90th_percentile_latency_s": 0.008599557, "characteristics.90th_percentile_latency_us": 8599.557, "characteristics.accuracy": 68.242, "characteristics.good": 34121, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.75-192-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.75-192-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.75_192.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "4d37bf604c6d14b6", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 7803050, "90.00 percentile latency (ns)": 11625340, "90th percentile latency (ns)": 11625340, "95.00 percentile latency (ns)": 13860884, "97.00 percentile latency (ns)": 14961391, "99.00 percentile latency (ns)": 20246187, "99.90 percentile latency (ns)": 44565848, "Max latency (ns)": 120869450, "Mean latency (ns)": 8808229, "Min duration satisfied": "Yes", "Min latency (ns)": 6941753, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 113.27, "QPS w/o loadgen overhead": 113.53, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 11.62534, "characteristics.90th_percentile_latency_ns": 11625340.0, "characteristics.90th_percentile_latency_s": 0.01162534, "characteristics.90th_percentile_latency_us": 11625.34, "characteristics.accuracy": 70.738, "characteristics.good": 35369, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-192-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-1.0-192-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_1.0_192.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "a45415689687f124", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 76534871, "90.00 percentile latency (ns)": 91953171, "90th percentile latency (ns)": 91953171, "95.00 percentile latency (ns)": 96283215, "97.00 percentile latency (ns)": 100198712, "99.00 percentile latency (ns)": 108694121, "99.90 percentile latency (ns)": 129791035, "Max latency (ns)": 164958288, "Mean latency (ns)": 79512302, "Min duration satisfied": "Yes", "Min latency (ns)": 69339039, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 12.57, "QPS w/o loadgen overhead": 12.58, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 91.953171, "characteristics.90th_percentile_latency_ns": 91953171.0, "characteristics.90th_percentile_latency_s": 0.091953171, "characteristics.90th_percentile_latency_us": 91953.171, "characteristics.accuracy": 78.504, "characteristics.good": 39252, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite4-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "efficientnet-lite4-quantized", "input_data_types": "uint8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite4.tar.gz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 50, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "a42ae8311da18a6d", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 7116718, "90.00 percentile latency (ns)": 11651171, "90th percentile latency (ns)": 11651171, "95.00 percentile latency (ns)": 13608762, "97.00 percentile latency (ns)": 14613457, "99.00 percentile latency (ns)": 18858979, "99.90 percentile latency (ns)": 37740200, "Max latency (ns)": 109602132, "Mean latency (ns)": 8247080, "Min duration satisfied": "Yes", "Min latency (ns)": 6182423, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 121.13, "QPS w/o loadgen overhead": 121.26, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 11.651171, "characteristics.90th_percentile_latency_ns": 11651171.0, "characteristics.90th_percentile_latency_s": 0.011651171, "characteristics.90th_percentile_latency_us": 11651.171, "characteristics.accuracy": 63.654, "characteristics.good": 31827, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-224-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.5-224-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_224_50.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "18964eeba058bfec", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 2519631, "90.00 percentile latency (ns)": 3614495, "90th percentile latency (ns)": 3614495, "95.00 percentile latency (ns)": 4683342, "97.00 percentile latency (ns)": 5650649, "99.00 percentile latency (ns)": 8124934, "99.90 percentile latency (ns)": 22748970, "Max latency (ns)": 105268348, "Mean latency (ns)": 2861830, "Min duration satisfied": "Yes", "Min latency (ns)": 2073275, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 348.23, "QPS w/o loadgen overhead": 349.43, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 3.614495, "characteristics.90th_percentile_latency_ns": 3614495.0, "characteristics.90th_percentile_latency_s": 0.003614495, "characteristics.90th_percentile_latency_us": 3614.495, "characteristics.accuracy": 52.172, "characteristics.good": 26086, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-128-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.35-128-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.35_128.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "273844a38af0a1e2", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 2688182, "90.00 percentile latency (ns)": 3896044, "90th percentile latency (ns)": 3896044, "95.00 percentile latency (ns)": 5191461, "97.00 percentile latency (ns)": 6308406, "99.00 percentile latency (ns)": 8949227, "99.90 percentile latency (ns)": 23312100, "Max latency (ns)": 133456990, "Mean latency (ns)": 3049344, "Min duration satisfied": "Yes", "Min latency (ns)": 2162239, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 326.52, "QPS w/o loadgen overhead": 327.94, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 3.896044, "characteristics.90th_percentile_latency_ns": 3896044.0, "characteristics.90th_percentile_latency_s": 0.003896044, "characteristics.90th_percentile_latency_us": 3896.044, "characteristics.accuracy": 58.402, "characteristics.good": 29201, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-128-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.5-128-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.5_128.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "208a2122ef41944a", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 4622217, "90.00 percentile latency (ns)": 6247279, "90th percentile latency (ns)": 6247279, "95.00 percentile latency (ns)": 7666702, "97.00 percentile latency (ns)": 8842112, "99.00 percentile latency (ns)": 12040811, "99.90 percentile latency (ns)": 28743522, "Max latency (ns)": 114768287, "Mean latency (ns)": 5128324, "Min duration satisfied": "Yes", "Min latency (ns)": 4046960, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 194.37, "QPS w/o loadgen overhead": 195.0, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 6.247279, "characteristics.90th_percentile_latency_ns": 6247279.0, "characteristics.90th_percentile_latency_s": 0.006247279, "characteristics.90th_percentile_latency_us": 6247.279, "characteristics.accuracy": 60.976, "characteristics.good": 30488, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.35-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.35_224.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "ba77614c97f4de2a", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 2677858, "90.00 percentile latency (ns)": 3870332, "90th percentile latency (ns)": 3870332, "95.00 percentile latency (ns)": 4929743, "97.00 percentile latency (ns)": 5819707, "99.00 percentile latency (ns)": 8151627, "99.90 percentile latency (ns)": 21764994, "Max latency (ns)": 36036625, "Mean latency (ns)": 3046175, "Min duration satisfied": "Yes", "Min latency (ns)": 2243309, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 327.79, "QPS w/o loadgen overhead": 328.28, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 3.870332, "characteristics.90th_percentile_latency_ns": 3870332.0, "characteristics.90th_percentile_latency_s": 0.003870332, "characteristics.90th_percentile_latency_us": 3870.332, "characteristics.accuracy": 48.11, "characteristics.good": 24055, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.25-192-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.25-192-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.25_192_quant.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "85a424bbf0712e28", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 11309707, "90.00 percentile latency (ns)": 16076890, "90th percentile latency (ns)": 16076890, "95.00 percentile latency (ns)": 18406751, "97.00 percentile latency (ns)": 19380937, "99.00 percentile latency (ns)": 26650788, "99.90 percentile latency (ns)": 39948742, "Max latency (ns)": 46635911, "Mean latency (ns)": 12460711, "Min duration satisfied": "Yes", "Min latency (ns)": 10483719, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 80.09, "QPS w/o loadgen overhead": 80.25, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 16.07689, "characteristics.90th_percentile_latency_ns": 16076890.0, "characteristics.90th_percentile_latency_s": 0.01607689, "characteristics.90th_percentile_latency_us": 16076.89, "characteristics.accuracy": 75.068, "characteristics.good": 37534, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite0-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "efficientnet-lite0-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite0.tar.gz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 50, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "8ca412998c1e99bc", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 3233530, "90.00 percentile latency (ns)": 4640029, "90th percentile latency (ns)": 4640029, "95.00 percentile latency (ns)": 5769234, "97.00 percentile latency (ns)": 6742272, "99.00 percentile latency (ns)": 9293241, "99.90 percentile latency (ns)": 23914704, "Max latency (ns)": 53173117, "Mean latency (ns)": 3599549, "Min duration satisfied": "Yes", "Min latency (ns)": 2653982, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 277.3, "QPS w/o loadgen overhead": 277.81, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 4.640029, "characteristics.90th_percentile_latency_ns": 4640029.0, "characteristics.90th_percentile_latency_s": 0.004640029, "characteristics.90th_percentile_latency_us": 4640.029, "characteristics.accuracy": 50.24, "characteristics.good": 25120, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.25-224-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.25-224-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.25_224_quant.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "4ec4851a0d52f77d", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 3131213, "90.00 percentile latency (ns)": 4273707, "90th percentile latency (ns)": 4273707, "95.00 percentile latency (ns)": 5382467, "97.00 percentile latency (ns)": 6294587, "99.00 percentile latency (ns)": 9048586, "99.90 percentile latency (ns)": 23794108, "Max latency (ns)": 65892522, "Mean latency (ns)": 3502845, "Min duration satisfied": "Yes", "Min latency (ns)": 2841864, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 284.37, "QPS w/o loadgen overhead": 285.48, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 4.273707, "characteristics.90th_percentile_latency_ns": 4273707.0, "characteristics.90th_percentile_latency_s": 0.004273707, "characteristics.90th_percentile_latency_us": 4273.707, "characteristics.accuracy": 60.842, "characteristics.good": 30421, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.5-160-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.5-160-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.5_160.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "c3dd21415d8b02cd", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 5764510, "90.00 percentile latency (ns)": 8897577, "90th percentile latency (ns)": 8897577, "95.00 percentile latency (ns)": 10930466, "97.00 percentile latency (ns)": 12369410, "99.00 percentile latency (ns)": 14737707, "99.90 percentile latency (ns)": 35751819, "Max latency (ns)": 122493251, "Mean latency (ns)": 6644058, "Min duration satisfied": "Yes", "Min latency (ns)": 5365453, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 150.13, "QPS w/o loadgen overhead": 150.51, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 8.897577, "characteristics.90th_percentile_latency_ns": 8897577.0, "characteristics.90th_percentile_latency_s": 0.008897577, "characteristics.90th_percentile_latency_us": 8897.577, "characteristics.accuracy": 69.016, "characteristics.good": 34508, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-160-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-1.0-160-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_1.0_160.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "f5376b324639a528", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 22496816, "90.00 percentile latency (ns)": 32303291, "90th percentile latency (ns)": 32303291, "95.00 percentile latency (ns)": 34802663, "97.00 percentile latency (ns)": 37249905, "99.00 percentile latency (ns)": 44876125, "99.90 percentile latency (ns)": 56138949, "Max latency (ns)": 68694886, "Mean latency (ns)": 25530847, "Min duration satisfied": "Yes", "Min latency (ns)": 19484014, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 39.14, "QPS w/o loadgen overhead": 39.17, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 32.303291, "characteristics.90th_percentile_latency_ns": 32303291.0, "characteristics.90th_percentile_latency_s": 0.032303291, "characteristics.90th_percentile_latency_us": 32303.291, "characteristics.accuracy": 74.022, "characteristics.good": 37011, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite1-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "efficientnet-lite1-quantized", "input_data_types": "uint8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite1.tar.gz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 50, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "da33a85e4d7d33c1", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 5572061, "90.00 percentile latency (ns)": 9445243, "90th percentile latency (ns)": 9445243, "95.00 percentile latency (ns)": 10905206, "97.00 percentile latency (ns)": 12093465, "99.00 percentile latency (ns)": 14004118, "99.90 percentile latency (ns)": 33483280, "Max latency (ns)": 118307407, "Mean latency (ns)": 6555298, "Min duration satisfied": "Yes", "Min latency (ns)": 4862191, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 152.38, "QPS w/o loadgen overhead": 152.55, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 9.445243, "characteristics.90th_percentile_latency_ns": 9445243.0, "characteristics.90th_percentile_latency_s": 0.009445243, "characteristics.90th_percentile_latency_us": 9445.243, "characteristics.accuracy": 61.906, "characteristics.good": 30953, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-192-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.5-192-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_192_50.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "dfa1449d904de3b1", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 5783955, "90.00 percentile latency (ns)": 9376075, "90th percentile latency (ns)": 9376075, "95.00 percentile latency (ns)": 10935500, "97.00 percentile latency (ns)": 11983129, "99.00 percentile latency (ns)": 13917354, "99.90 percentile latency (ns)": 33448226, "Max latency (ns)": 71429760, "Mean latency (ns)": 6783730, "Min duration satisfied": "Yes", "Min latency (ns)": 5055348, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 147.22, "QPS w/o loadgen overhead": 147.41, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 9.376075, "characteristics.90th_percentile_latency_ns": 9376075.0, "characteristics.90th_percentile_latency_s": 0.009376075, "characteristics.90th_percentile_latency_us": 9376.075, "characteristics.accuracy": 62.27, "characteristics.good": 31135, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.5-224-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.5-224-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.5_224_quant.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "144f2ab6e83f5bd6", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 2827229, "90.00 percentile latency (ns)": 4201465, "90th percentile latency (ns)": 4201465, "95.00 percentile latency (ns)": 5330923, "97.00 percentile latency (ns)": 6233010, "99.00 percentile latency (ns)": 8864102, "99.90 percentile latency (ns)": 23702069, "Max latency (ns)": 99642855, "Mean latency (ns)": 3247582, "Min duration satisfied": "Yes", "Min latency (ns)": 2567825, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 307.43, "QPS w/o loadgen overhead": 307.92, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 4.201465, "characteristics.90th_percentile_latency_ns": 4201465.0, "characteristics.90th_percentile_latency_s": 0.004201465, "characteristics.90th_percentile_latency_us": 4201.465, "characteristics.accuracy": 49.216, "characteristics.good": 24608, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-128-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.35-128-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_128_35.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "01a3b44802993032", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 21575323, "90.00 percentile latency (ns)": 29254159, "90th percentile latency (ns)": 29254159, "95.00 percentile latency (ns)": 31454193, "97.00 percentile latency (ns)": 33310690, "99.00 percentile latency (ns)": 41318789, "99.90 percentile latency (ns)": 85139834, "Max latency (ns)": 131233234, "Mean latency (ns)": 23561193, "Min duration satisfied": "Yes", "Min latency (ns)": 19565858, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 42.42, "QPS w/o loadgen overhead": 42.44, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 29.254159, "characteristics.90th_percentile_latency_ns": 29254159.0, "characteristics.90th_percentile_latency_s": 0.029254159, "characteristics.90th_percentile_latency_us": 29254.159, "characteristics.accuracy": 73.508, "characteristics.good": 36754, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.4-224-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-1.4-224-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_224_140.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "b72a6861a5147ed9", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 15366679, "90.00 percentile latency (ns)": 20376978, "90th percentile latency (ns)": 20376978, "95.00 percentile latency (ns)": 21759508, "97.00 percentile latency (ns)": 23140521, "99.00 percentile latency (ns)": 31410185, "99.90 percentile latency (ns)": 68464635, "Max latency (ns)": 81959516, "Mean latency (ns)": 16514718, "Min duration satisfied": "Yes", "Min latency (ns)": 14112529, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 60.5, "QPS w/o loadgen overhead": 60.55, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 20.376978, "characteristics.90th_percentile_latency_ns": 20376978.0, "characteristics.90th_percentile_latency_s": 0.020376978, "characteristics.90th_percentile_latency_us": 20376.978, "characteristics.accuracy": 70.762, "characteristics.good": 35381, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-1.0-224-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-1.0-224-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_1.0_224_quant.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "f2c5de6479b45d2a", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 1893146, "90.00 percentile latency (ns)": 2517880, "90th percentile latency (ns)": 2517880, "95.00 percentile latency (ns)": 3307453, "97.00 percentile latency (ns)": 3924730, "99.00 percentile latency (ns)": 5674093, "99.90 percentile latency (ns)": 19700326, "Max latency (ns)": 30438849, "Mean latency (ns)": 2123025, "Min duration satisfied": "Yes", "Min latency (ns)": 1653934, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 469.71, "QPS w/o loadgen overhead": 471.03, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 2.51788, "characteristics.90th_percentile_latency_ns": 2517880.0, "characteristics.90th_percentile_latency_s": 0.00251788, "characteristics.90th_percentile_latency_us": 2517.88, "characteristics.accuracy": 47.808, "characteristics.good": 23904, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.25-160-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.25-160-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.25_160.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "55964119841ced31", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 3716622, "90.00 percentile latency (ns)": 5373742, "90th percentile latency (ns)": 5373742, "95.00 percentile latency (ns)": 6821031, "97.00 percentile latency (ns)": 8236729, "99.00 percentile latency (ns)": 11200933, "99.90 percentile latency (ns)": 26222162, "Max latency (ns)": 122692633, "Mean latency (ns)": 4253025, "Min duration satisfied": "Yes", "Min latency (ns)": 3273226, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 234.15, "QPS w/o loadgen overhead": 235.13, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 5.373742, "characteristics.90th_percentile_latency_ns": 5373742.0, "characteristics.90th_percentile_latency_s": 0.005373742, "characteristics.90th_percentile_latency_us": 5373.742, "characteristics.accuracy": 64.038, "characteristics.good": 32019, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-128-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.75-128-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.75_128.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "4900aba52c6f11ac", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 3187511, "90.00 percentile latency (ns)": 4148805, "90th percentile latency (ns)": 4148805, "95.00 percentile latency (ns)": 5198680, "97.00 percentile latency (ns)": 6027167, "99.00 percentile latency (ns)": 8309899, "99.90 percentile latency (ns)": 21227186, "Max latency (ns)": 63319268, "Mean latency (ns)": 3509267, "Min duration satisfied": "Yes", "Min latency (ns)": 2818246, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 284.17, "QPS w/o loadgen overhead": 284.96, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 4.148805, "characteristics.90th_percentile_latency_ns": 4148805.0, "characteristics.90th_percentile_latency_s": 0.004148805, "characteristics.90th_percentile_latency_us": 4148.805, "characteristics.accuracy": 51.848, "characteristics.good": 25924, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.25-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.25-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.25_224.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "93c4ed644c388ec2", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 4472900, "90.00 percentile latency (ns)": 6935440, "90th percentile latency (ns)": 6935440, "95.00 percentile latency (ns)": 8647707, "97.00 percentile latency (ns)": 9831150, "99.00 percentile latency (ns)": 12186038, "99.90 percentile latency (ns)": 27060994, "Max latency (ns)": 114483803, "Mean latency (ns)": 5142500, "Min duration satisfied": "Yes", "Min latency (ns)": 3800455, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 194.19, "QPS w/o loadgen overhead": 194.46, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 6.93544, "characteristics.90th_percentile_latency_ns": 6935440.0, "characteristics.90th_percentile_latency_s": 0.00693544, "characteristics.90th_percentile_latency_us": 6935.44, "characteristics.accuracy": 59.186, "characteristics.good": 29593, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-160-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.5-160-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_160_50.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "0198ce4a6580c621", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 9037553, "90.00 percentile latency (ns)": 12112325, "90th percentile latency (ns)": 12112325, "95.00 percentile latency (ns)": 14283257, "97.00 percentile latency (ns)": 15346943, "99.00 percentile latency (ns)": 20586777, "99.90 percentile latency (ns)": 35114632, "Max latency (ns)": 68979298, "Mean latency (ns)": 9888541, "Min duration satisfied": "Yes", "Min latency (ns)": 8590658, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 101.02, "QPS w/o loadgen overhead": 101.13, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 12.112325, "characteristics.90th_percentile_latency_ns": 12112325.0, "characteristics.90th_percentile_latency_s": 0.012112325, "characteristics.90th_percentile_latency_us": 12112.325, "characteristics.accuracy": 68.2, "characteristics.good": 34100, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-1.0-160-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-1.0-160-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_1.0_160_quant.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "44bc8522bb392997", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 4110606, "90.00 percentile latency (ns)": 7091436, "90th percentile latency (ns)": 7091436, "95.00 percentile latency (ns)": 8489736, "97.00 percentile latency (ns)": 9636248, "99.00 percentile latency (ns)": 11994941, "99.90 percentile latency (ns)": 31306318, "Max latency (ns)": 99122440, "Mean latency (ns)": 4936553, "Min duration satisfied": "Yes", "Min latency (ns)": 3777503, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 202.27, "QPS w/o loadgen overhead": 202.57, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 7.091436, "characteristics.90th_percentile_latency_ns": 7091436.0, "characteristics.90th_percentile_latency_s": 0.007091436, "characteristics.90th_percentile_latency_us": 7091.436, "characteristics.accuracy": 59.13, "characteristics.good": 29565, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-96-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-1.0-96-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_96_100.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "7d2ae49838182919", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 4470135, "90.00 percentile latency (ns)": 6331537, "90th percentile latency (ns)": 6331537, "95.00 percentile latency (ns)": 7829273, "97.00 percentile latency (ns)": 8915661, "99.00 percentile latency (ns)": 11433605, "99.90 percentile latency (ns)": 25646001, "Max latency (ns)": 56610686, "Mean latency (ns)": 4987947, "Min duration satisfied": "Yes", "Min latency (ns)": 4076932, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 200.2, "QPS w/o loadgen overhead": 200.48, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 6.331537, "characteristics.90th_percentile_latency_ns": 6331537.0, "characteristics.90th_percentile_latency_s": 0.006331537, "characteristics.90th_percentile_latency_us": 6331.537, "characteristics.accuracy": 58.39, "characteristics.good": 29195, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.75-128-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.75-128-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.75_128_quant.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "340a583761541bb4", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 12359306, "90.00 percentile latency (ns)": 18156845, "90th percentile latency (ns)": 18156845, "95.00 percentile latency (ns)": 19880867, "97.00 percentile latency (ns)": 22736050, "99.00 percentile latency (ns)": 29132499, "99.90 percentile latency (ns)": 40846620, "Max latency (ns)": 59852948, "Mean latency (ns)": 13788862, "Min duration satisfied": "Yes", "Min latency (ns)": 11220625, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 72.44, "QPS w/o loadgen overhead": 72.52, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 18.156845, "characteristics.90th_percentile_latency_ns": 18156845.0, "characteristics.90th_percentile_latency_s": 0.018156845, "characteristics.90th_percentile_latency_us": 18156.845, "characteristics.accuracy": 72.9, "characteristics.good": 36450, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-large_224_1.0_uint8", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v3-large_224_1.0_uint8", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/mobilenet-v3/checkpoints/v3-large_224_1.0_uint8.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 166.667, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "37d3d5434b7ea9d1", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 13305588, "90.00 percentile latency (ns)": 19969889, "90th percentile latency (ns)": 19969889, "95.00 percentile latency (ns)": 21741210, "97.00 percentile latency (ns)": 24222880, "99.00 percentile latency (ns)": 31182303, "99.90 percentile latency (ns)": 54510055, "Max latency (ns)": 115854555, "Mean latency (ns)": 14940898, "Min duration satisfied": "Yes", "Min latency (ns)": 11571716, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 66.88, "QPS w/o loadgen overhead": 66.93, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 19.969889, "characteristics.90th_percentile_latency_ns": 19969889.0, "characteristics.90th_percentile_latency_s": 0.019969889, "characteristics.90th_percentile_latency_us": 19969.889, "characteristics.accuracy": 70.616, "characteristics.good": 35308, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-224-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-1.0-224-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_224_100.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "9d509664ae5bfaaa", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 4606155, "90.00 percentile latency (ns)": 6791786, "90th percentile latency (ns)": 6791786, "95.00 percentile latency (ns)": 8718175, "97.00 percentile latency (ns)": 10034457, "99.00 percentile latency (ns)": 12665709, "99.90 percentile latency (ns)": 31054580, "Max latency (ns)": 108865970, "Mean latency (ns)": 5269563, "Min duration satisfied": "Yes", "Min latency (ns)": 4208377, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 189.55, "QPS w/o loadgen overhead": 189.77, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 6.791786, "characteristics.90th_percentile_latency_ns": 6791786.0, "characteristics.90th_percentile_latency_s": 0.006791786, "characteristics.90th_percentile_latency_us": 6791.786, "characteristics.accuracy": 56.52, "characteristics.good": 28260, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-192-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.35-192-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_192_35.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "4ee9405889a31c34", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 7876157, "90.00 percentile latency (ns)": 13103363, "90th percentile latency (ns)": 13103363, "95.00 percentile latency (ns)": 14944916, "97.00 percentile latency (ns)": 15675541, "99.00 percentile latency (ns)": 19504670, "99.90 percentile latency (ns)": 34734464, "Max latency (ns)": 120611252, "Mean latency (ns)": 9138975, "Min duration satisfied": "Yes", "Min latency (ns)": 6858639, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 109.3, "QPS w/o loadgen overhead": 109.42, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 13.103363, "characteristics.90th_percentile_latency_ns": 13103363.0, "characteristics.90th_percentile_latency_s": 0.013103363, "characteristics.90th_percentile_latency_us": 13103.363, "characteristics.accuracy": 67.71, "characteristics.good": 33855, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-160-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-1.0-160-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_160_100.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "f70a317b0f14d9aa", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 1476220, "90.00 percentile latency (ns)": 1996424, "90th percentile latency (ns)": 1996424, "95.00 percentile latency (ns)": 2660948, "97.00 percentile latency (ns)": 3279232, "99.00 percentile latency (ns)": 4735099, "99.90 percentile latency (ns)": 20120640, "Max latency (ns)": 58347527, "Mean latency (ns)": 1683990, "Min duration satisfied": "Yes", "Min latency (ns)": 1338328, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 591.95, "QPS w/o loadgen overhead": 593.83, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 1.996424, "characteristics.90th_percentile_latency_ns": 1996424.0, "characteristics.90th_percentile_latency_s": 0.001996424, "characteristics.90th_percentile_latency_us": 1996.424, "characteristics.accuracy": 44.116, "characteristics.good": 22058, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.25-128-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.25-128-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.25_128.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "b58c0a0a971457eb", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 1954016, "90.00 percentile latency (ns)": 3229593, "90th percentile latency (ns)": 3229593, "95.00 percentile latency (ns)": 4168869, "97.00 percentile latency (ns)": 4971211, "99.00 percentile latency (ns)": 6910439, "99.90 percentile latency (ns)": 21085745, "Max latency (ns)": 53692397, "Mean latency (ns)": 2336765, "Min duration satisfied": "Yes", "Min latency (ns)": 1729298, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 427.0, "QPS w/o loadgen overhead": 427.94, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 3.229593, "characteristics.90th_percentile_latency_ns": 3229593.0, "characteristics.90th_percentile_latency_s": 0.003229593, "characteristics.90th_percentile_latency_us": 3229.593, "characteristics.accuracy": 45.454, "characteristics.good": 22727, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.25-160-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.25-160-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.25_160_quant.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "81e75499b34684a5", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 8899321, "90.00 percentile latency (ns)": 11511577, "90th percentile latency (ns)": 11511577, "95.00 percentile latency (ns)": 13454073, "97.00 percentile latency (ns)": 14744697, "99.00 percentile latency (ns)": 19501416, "99.90 percentile latency (ns)": 30861620, "Max latency (ns)": 53537947, "Mean latency (ns)": 9634645, "Min duration satisfied": "Yes", "Min latency (ns)": 8355295, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 103.58, "QPS w/o loadgen overhead": 103.79, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 11.511577, "characteristics.90th_percentile_latency_ns": 11511577.0, "characteristics.90th_percentile_latency_s": 0.011511577, "characteristics.90th_percentile_latency_us": 11511.577, "characteristics.accuracy": 70.626, "characteristics.good": 35313, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-1.0-192-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-1.0-192-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_1.0_192.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "0c4fb9aa2a02c577", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 6019059, "90.00 percentile latency (ns)": 9896324, "90th percentile latency (ns)": 9896324, "95.00 percentile latency (ns)": 11624083, "97.00 percentile latency (ns)": 12788136, "99.00 percentile latency (ns)": 14925929, "99.90 percentile latency (ns)": 28639772, "Max latency (ns)": 38771656, "Mean latency (ns)": 6952048, "Min duration satisfied": "Yes", "Min latency (ns)": 5274353, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 143.7, "QPS w/o loadgen overhead": 143.84, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 9.896324, "characteristics.90th_percentile_latency_ns": 9896324.0, "characteristics.90th_percentile_latency_s": 0.009896324, "characteristics.90th_percentile_latency_us": 9896.324, "characteristics.accuracy": 63.44, "characteristics.good": 31720, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-128-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-1.0-128-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_128_100.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "07a8ec7142e4cbb6", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 11739905, "90.00 percentile latency (ns)": 16014770, "90th percentile latency (ns)": 16014770, "95.00 percentile latency (ns)": 17668131, "97.00 percentile latency (ns)": 18584337, "99.00 percentile latency (ns)": 26289998, "99.90 percentile latency (ns)": 38803667, "Max latency (ns)": 76836617, "Mean latency (ns)": 12794292, "Min duration satisfied": "Yes", "Min latency (ns)": 10703628, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 78.08, "QPS w/o loadgen overhead": 78.16, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 16.01477, "characteristics.90th_percentile_latency_ns": 16014770.0, "characteristics.90th_percentile_latency_s": 0.01601477, "characteristics.90th_percentile_latency_us": 16014.77, "characteristics.accuracy": 70.016, "characteristics.good": 35008, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-1.0-192-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-1.0-192-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_1.0_192_quant.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "f14647a0d4b20ba8", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 29080590, "90.00 percentile latency (ns)": 40187217, "90th percentile latency (ns)": 40187217, "95.00 percentile latency (ns)": 43505089, "97.00 percentile latency (ns)": 49266555, "99.00 percentile latency (ns)": 55577164, "99.90 percentile latency (ns)": 69799062, "Max latency (ns)": 81442704, "Mean latency (ns)": 32489960, "Min duration satisfied": "Yes", "Min latency (ns)": 26651781, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 30.76, "QPS w/o loadgen overhead": 30.78, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 40.187217, "characteristics.90th_percentile_latency_ns": 40187217.0, "characteristics.90th_percentile_latency_s": 0.040187217, "characteristics.90th_percentile_latency_us": 40187.217, "characteristics.accuracy": 74.068, "characteristics.good": 37034, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite2-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "efficientnet-lite2-quantized", "input_data_types": "uint8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite2.tar.gz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 50, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "bc26729dcbd046db", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 3488734, "90.00 percentile latency (ns)": 5621787, "90th percentile latency (ns)": 5621787, "95.00 percentile latency (ns)": 6954237, "97.00 percentile latency (ns)": 7928154, "99.00 percentile latency (ns)": 10166009, "99.90 percentile latency (ns)": 26821073, "Max latency (ns)": 63135039, "Mean latency (ns)": 4112765, "Min duration satisfied": "Yes", "Min latency (ns)": 3122422, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 242.76, "QPS w/o loadgen overhead": 243.15, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 5.621787, "characteristics.90th_percentile_latency_ns": 5621787.0, "characteristics.90th_percentile_latency_s": 0.005621787, "characteristics.90th_percentile_latency_us": 5621.787, "characteristics.accuracy": 59.422, "characteristics.good": 29711, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.5-160-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.5-160-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.5_160_quant.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "ad2e284f345e3869", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 4455248, "90.00 percentile latency (ns)": 7241188, "90th percentile latency (ns)": 7241188, "95.00 percentile latency (ns)": 8905148, "97.00 percentile latency (ns)": 10105600, "99.00 percentile latency (ns)": 12138273, "99.90 percentile latency (ns)": 30359803, "Max latency (ns)": 64183906, "Mean latency (ns)": 5226593, "Min duration satisfied": "Yes", "Min latency (ns)": 4039521, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 191.1, "QPS w/o loadgen overhead": 191.33, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 7.241188, "characteristics.90th_percentile_latency_ns": 7241188.0, "characteristics.90th_percentile_latency_s": 0.007241188, "characteristics.90th_percentile_latency_us": 7241.188, "characteristics.accuracy": 61.462, "characteristics.good": 30731, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.5-192-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.5-192-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.5_192_quant.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "35567e0437c99c9f", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 5742618, "90.00 percentile latency (ns)": 9361528, "90th percentile latency (ns)": 9361528, "95.00 percentile latency (ns)": 10960926, "97.00 percentile latency (ns)": 12306809, "99.00 percentile latency (ns)": 14560347, "99.90 percentile latency (ns)": 38417130, "Max latency (ns)": 104191933, "Mean latency (ns)": 6697713, "Min duration satisfied": "Yes", "Min latency (ns)": 5137568, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 149.12, "QPS w/o loadgen overhead": 149.3, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 9.361528, "characteristics.90th_percentile_latency_ns": 9361528.0, "characteristics.90th_percentile_latency_s": 0.009361528, "characteristics.90th_percentile_latency_us": 9361.528, "characteristics.accuracy": 58.51, "characteristics.good": 29255, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-224-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.35-224-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_224_35.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "93237056204d3cb9", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 4227362, "90.00 percentile latency (ns)": 6151514, "90th percentile latency (ns)": 6151514, "95.00 percentile latency (ns)": 7677599, "97.00 percentile latency (ns)": 9052862, "99.00 percentile latency (ns)": 11870528, "99.90 percentile latency (ns)": 30810945, "Max latency (ns)": 109356690, "Mean latency (ns)": 4811570, "Min duration satisfied": "Yes", "Min latency (ns)": 3845008, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 207.17, "QPS w/o loadgen overhead": 207.83, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 6.151514, "characteristics.90th_percentile_latency_ns": 6151514.0, "characteristics.90th_percentile_latency_s": 0.006151514, "characteristics.90th_percentile_latency_us": 6151.514, "characteristics.accuracy": 66.036, "characteristics.good": 33018, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-128-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-1.0-128-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_1.0_128.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "49bea74826885eba", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 15880113, "90.00 percentile latency (ns)": 23006950, "90th percentile latency (ns)": 23006950, "95.00 percentile latency (ns)": 25921285, "97.00 percentile latency (ns)": 27670929, "99.00 percentile latency (ns)": 34621696, "99.90 percentile latency (ns)": 44322372, "Max latency (ns)": 79610432, "Mean latency (ns)": 17879075, "Min duration satisfied": "Yes", "Min latency (ns)": 14882406, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 55.86, "QPS w/o loadgen overhead": 55.93, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 23.00695, "characteristics.90th_percentile_latency_ns": 23006950.0, "characteristics.90th_percentile_latency_s": 0.02300695, "characteristics.90th_percentile_latency_us": 23006.95, "characteristics.accuracy": 76.642, "characteristics.good": 38321, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite1-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "efficientnet-lite1-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite1.tar.gz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 50, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "a59fd5724f489d36", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 10124379, "90.00 percentile latency (ns)": 16534358, "90th percentile latency (ns)": 16534358, "95.00 percentile latency (ns)": 17887740, "97.00 percentile latency (ns)": 18980921, "99.00 percentile latency (ns)": 25210985, "99.90 percentile latency (ns)": 41784823, "Max latency (ns)": 110347361, "Mean latency (ns)": 11779488, "Min duration satisfied": "Yes", "Min latency (ns)": 8933467, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 84.81, "QPS w/o loadgen overhead": 84.89, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 16.534358, "characteristics.90th_percentile_latency_ns": 16534358.0, "characteristics.90th_percentile_latency_s": 0.016534358, "characteristics.90th_percentile_latency_us": 16534.358, "characteristics.accuracy": 69.582, "characteristics.good": 34791, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-192-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-1.0-192-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_192_100.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "198d5b09478e992d", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 8618782, "90.00 percentile latency (ns)": 12443801, "90th percentile latency (ns)": 12443801, "95.00 percentile latency (ns)": 14236512, "97.00 percentile latency (ns)": 15268009, "99.00 percentile latency (ns)": 20254166, "99.90 percentile latency (ns)": 33781051, "Max latency (ns)": 70173976, "Mean latency (ns)": 9562568, "Min duration satisfied": "Yes", "Min latency (ns)": 8020774, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 104.35, "QPS w/o loadgen overhead": 104.57, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 12.443801, "characteristics.90th_percentile_latency_ns": 12443801.0, "characteristics.90th_percentile_latency_s": 0.012443801, "characteristics.90th_percentile_latency_us": 12443.801, "characteristics.accuracy": 69.262, "characteristics.good": 34631, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.75-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.75-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.75_224.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "7f4a84bb357fba04", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 10840342, "90.00 percentile latency (ns)": 17488599, "90th percentile latency (ns)": 17488599, "95.00 percentile latency (ns)": 18887955, "97.00 percentile latency (ns)": 20888104, "99.00 percentile latency (ns)": 26100490, "99.90 percentile latency (ns)": 44562413, "Max latency (ns)": 94069515, "Mean latency (ns)": 12602974, "Min duration satisfied": "Yes", "Min latency (ns)": 9603744, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 79.27, "QPS w/o loadgen overhead": 79.35, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 17.488599, "characteristics.90th_percentile_latency_ns": 17488599.0, "characteristics.90th_percentile_latency_s": 0.017488599, "characteristics.90th_percentile_latency_us": 17488.599, "characteristics.accuracy": 68.666, "characteristics.good": 34333, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-224-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.75-224-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_224_75.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "b5b3bff7b9d2e646", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 4005608, "90.00 percentile latency (ns)": 5684381, "90th percentile latency (ns)": 5684381, "95.00 percentile latency (ns)": 6987774, "97.00 percentile latency (ns)": 8086004, "99.00 percentile latency (ns)": 10757530, "99.90 percentile latency (ns)": 26228448, "Max latency (ns)": 51784511, "Mean latency (ns)": 4488548, "Min duration satisfied": "Yes", "Min latency (ns)": 3437580, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 221.96, "QPS w/o loadgen overhead": 222.79, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 5.684381, "characteristics.90th_percentile_latency_ns": 5684381.0, "characteristics.90th_percentile_latency_s": 0.005684381, "characteristics.90th_percentile_latency_us": 5684.381, "characteristics.accuracy": 63.33, "characteristics.good": 31665, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-small-minimalistic_224_1.0_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v3-small-minimalistic_224_1.0_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/mobilenet-v3/checkpoints/v3-small-minimalistic_224_1.0_float.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 166.667, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "9b98655fdbc422ea", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 2318287, "90.00 percentile latency (ns)": 2909419, "90th percentile latency (ns)": 2909419, "95.00 percentile latency (ns)": 3876825, "97.00 percentile latency (ns)": 4601500, "99.00 percentile latency (ns)": 7063987, "99.90 percentile latency (ns)": 20438995, "Max latency (ns)": 54979398, "Mean latency (ns)": 2582301, "Min duration satisfied": "Yes", "Min latency (ns)": 1970591, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 385.55, "QPS w/o loadgen overhead": 387.25, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 2.909419, "characteristics.90th_percentile_latency_ns": 2909419.0, "characteristics.90th_percentile_latency_s": 0.002909419, "characteristics.90th_percentile_latency_us": 2909.419, "characteristics.accuracy": 57.918, "characteristics.good": 28959, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.5-128-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.5-128-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.5_128.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "d12b56872fc43459", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 12109362, "90.00 percentile latency (ns)": 15441413, "90th percentile latency (ns)": 15441413, "95.00 percentile latency (ns)": 17265889, "97.00 percentile latency (ns)": 18513497, "99.00 percentile latency (ns)": 27124464, "99.90 percentile latency (ns)": 39782271, "Max latency (ns)": 77717283, "Mean latency (ns)": 13053336, "Min duration satisfied": "Yes", "Min latency (ns)": 11344257, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 76.45, "QPS w/o loadgen overhead": 76.61, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 15.441413, "characteristics.90th_percentile_latency_ns": 15441413.0, "characteristics.90th_percentile_latency_s": 0.015441413, "characteristics.90th_percentile_latency_us": 15441.413, "characteristics.accuracy": 71.676, "characteristics.good": 35838, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-1.0-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-1.0-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_1.0_224.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "a29e53be6dac43ad", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 2038138, "90.00 percentile latency (ns)": 3126667, "90th percentile latency (ns)": 3126667, "95.00 percentile latency (ns)": 4072564, "97.00 percentile latency (ns)": 4760179, "99.00 percentile latency (ns)": 6613221, "99.90 percentile latency (ns)": 21223083, "Max latency (ns)": 100902704, "Mean latency (ns)": 2374152, "Min duration satisfied": "Yes", "Min latency (ns)": 1845010, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 420.46, "QPS w/o loadgen overhead": 421.2, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 3.126667, "characteristics.90th_percentile_latency_ns": 3126667.0, "characteristics.90th_percentile_latency_s": 0.003126667, "characteristics.90th_percentile_latency_us": 3126.667, "characteristics.accuracy": 43.548, "characteristics.good": 21774, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-96-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.35-96-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_96_35.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "773e4495ebb7d89c", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 51659808, "90.00 percentile latency (ns)": 66791119, "90th percentile latency (ns)": 66791119, "95.00 percentile latency (ns)": 69789362, "97.00 percentile latency (ns)": 73545652, "99.00 percentile latency (ns)": 83659562, "99.90 percentile latency (ns)": 95937694, "Max latency (ns)": 96031939, "Mean latency (ns)": 55595999, "Min duration satisfied": "Yes", "Min latency (ns)": 49652713, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 17.98, "QPS w/o loadgen overhead": 17.99, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 66.791119, "characteristics.90th_percentile_latency_ns": 66791119.0, "characteristics.90th_percentile_latency_s": 0.066791119, "characteristics.90th_percentile_latency_us": 66791.119, "characteristics.accuracy": 80.676, "characteristics.good": 40338, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite4-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "efficientnet-lite4-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite4.tar.gz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 50, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "f4ce8842d54343e6", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 10511502, "90.00 percentile latency (ns)": 16316656, "90th percentile latency (ns)": 16316656, "95.00 percentile latency (ns)": 17707702, "97.00 percentile latency (ns)": 18415417, "99.00 percentile latency (ns)": 24977250, "99.90 percentile latency (ns)": 38489542, "Max latency (ns)": 87004577, "Mean latency (ns)": 12015050, "Min duration satisfied": "Yes", "Min latency (ns)": 9222221, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 83.15, "QPS w/o loadgen overhead": 83.23, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 16.316656, "characteristics.90th_percentile_latency_ns": 16316656.0, "characteristics.90th_percentile_latency_s": 0.016316656, "characteristics.90th_percentile_latency_us": 16316.656, "characteristics.accuracy": 70.338, "characteristics.good": 35169, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-large-minimalistic_224_1.0_uint8", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v3-large-minimalistic_224_1.0_uint8", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/mobilenet-v3/checkpoints/v3-large-minimalistic_224_1.0_uint8.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 166.667, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "3b42779fb4ee4daf", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 8280278, "90.00 percentile latency (ns)": 13949141, "90th percentile latency (ns)": 13949141, "95.00 percentile latency (ns)": 15720742, "97.00 percentile latency (ns)": 16677041, "99.00 percentile latency (ns)": 21386502, "99.90 percentile latency (ns)": 37879631, "Max latency (ns)": 121418604, "Mean latency (ns)": 9806528, "Min duration satisfied": "Yes", "Min latency (ns)": 7434480, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 101.86, "QPS w/o loadgen overhead": 101.97, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 13.949141, "characteristics.90th_percentile_latency_ns": 13949141.0, "characteristics.90th_percentile_latency_s": 0.013949141, "characteristics.90th_percentile_latency_us": 13949.141, "characteristics.accuracy": 67.394, "characteristics.good": 33697, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-192-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.75-192-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_192_75.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "66cb94e01d48f3e2", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 8399144, "90.00 percentile latency (ns)": 11595456, "90th percentile latency (ns)": 11595456, "95.00 percentile latency (ns)": 13454121, "97.00 percentile latency (ns)": 14593398, "99.00 percentile latency (ns)": 18989668, "99.90 percentile latency (ns)": 37492362, "Max latency (ns)": 72093307, "Mean latency (ns)": 9227129, "Min duration satisfied": "Yes", "Min latency (ns)": 7519011, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 108.27, "QPS w/o loadgen overhead": 108.38, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 11.595456, "characteristics.90th_percentile_latency_ns": 11595456.0, "characteristics.90th_percentile_latency_s": 0.011595456, "characteristics.90th_percentile_latency_us": 11595.456, "characteristics.accuracy": 67.206, "characteristics.good": 33603, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.75-192-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.75-192-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.75_192_quant.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "c556444a7970a8d8", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 5025811, "90.00 percentile latency (ns)": 6934659, "90th percentile latency (ns)": 6934659, "95.00 percentile latency (ns)": 8571111, "97.00 percentile latency (ns)": 9785433, "99.00 percentile latency (ns)": 12650033, "99.90 percentile latency (ns)": 28357764, "Max latency (ns)": 92339673, "Mean latency (ns)": 5579657, "Min duration satisfied": "Yes", "Min latency (ns)": 4488572, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 178.67, "QPS w/o loadgen overhead": 179.22, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 6.934659, "characteristics.90th_percentile_latency_ns": 6934659.0, "characteristics.90th_percentile_latency_s": 0.006934659, "characteristics.90th_percentile_latency_us": 6934.659, "characteristics.accuracy": 64.348, "characteristics.good": 32174, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.5-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.5-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.5_224.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "6431e906fe0d905d", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 3993943, "90.00 percentile latency (ns)": 5304029, "90th percentile latency (ns)": 5304029, "95.00 percentile latency (ns)": 6612483, "97.00 percentile latency (ns)": 7693997, "99.00 percentile latency (ns)": 10951014, "99.90 percentile latency (ns)": 26531194, "Max latency (ns)": 72346159, "Mean latency (ns)": 4474837, "Min duration satisfied": "Yes", "Min latency (ns)": 3613934, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 222.67, "QPS w/o loadgen overhead": 223.47, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 5.304029, "characteristics.90th_percentile_latency_ns": 5304029.0, "characteristics.90th_percentile_latency_s": 0.005304029, "characteristics.90th_percentile_latency_us": 5304.029, "characteristics.accuracy": 63.246, "characteristics.good": 31623, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.5-192-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.5-192-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.5_192.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "e59b6fa7297b11ac", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 3559387, "90.00 percentile latency (ns)": 5435181, "90th percentile latency (ns)": 5435181, "95.00 percentile latency (ns)": 6736615, "97.00 percentile latency (ns)": 7986077, "99.00 percentile latency (ns)": 10894076, "99.90 percentile latency (ns)": 30217225, "Max latency (ns)": 114173698, "Mean latency (ns)": 4149859, "Min duration satisfied": "Yes", "Min latency (ns)": 3132680, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 240.09, "QPS w/o loadgen overhead": 240.97, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 5.435181, "characteristics.90th_percentile_latency_ns": 5435181.0, "characteristics.90th_percentile_latency_s": 0.005435181, "characteristics.90th_percentile_latency_us": 5435.181, "characteristics.accuracy": 61.668, "characteristics.good": 30834, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-160-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.5-160-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.5_160.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "ec529f9db6ec4bb2", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 5108554, "90.00 percentile latency (ns)": 7357345, "90th percentile latency (ns)": 7357345, "95.00 percentile latency (ns)": 9233035, "97.00 percentile latency (ns)": 10547617, "99.00 percentile latency (ns)": 13208616, "99.90 percentile latency (ns)": 27549607, "Max latency (ns)": 64658279, "Mean latency (ns)": 5800765, "Min duration satisfied": "Yes", "Min latency (ns)": 4621848, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 171.81, "QPS w/o loadgen overhead": 172.39, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 7.357345, "characteristics.90th_percentile_latency_ns": 7357345.0, "characteristics.90th_percentile_latency_s": 0.007357345, "characteristics.90th_percentile_latency_us": 7357.345, "characteristics.accuracy": 66.384, "characteristics.good": 33192, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.75-160-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.75-160-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.75_160.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "7a4f2a87f853019c", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 2506962, "90.00 percentile latency (ns)": 4009494, "90th percentile latency (ns)": 4009494, "95.00 percentile latency (ns)": 5208396, "97.00 percentile latency (ns)": 6072083, "99.00 percentile latency (ns)": 8527202, "99.90 percentile latency (ns)": 22439672, "Max latency (ns)": 76744592, "Mean latency (ns)": 2942585, "Min duration satisfied": "Yes", "Min latency (ns)": 2318089, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 339.25, "QPS w/o loadgen overhead": 339.84, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 4.009494, "characteristics.90th_percentile_latency_ns": 4009494.0, "characteristics.90th_percentile_latency_s": 0.004009494, "characteristics.90th_percentile_latency_us": 4009.494, "characteristics.accuracy": 49.36, "characteristics.good": 24680, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-96-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.5-96-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_96_50.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "5895d068c60607aa", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 4959061, "90.00 percentile latency (ns)": 8142972, "90th percentile latency (ns)": 8142972, "95.00 percentile latency (ns)": 10051223, "97.00 percentile latency (ns)": 11332630, "99.00 percentile latency (ns)": 13323492, "99.90 percentile latency (ns)": 32219556, "Max latency (ns)": 124273742, "Mean latency (ns)": 5833856, "Min duration satisfied": "Yes", "Min latency (ns)": 4535677, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 171.2, "QPS w/o loadgen overhead": 171.41, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 8.142972, "characteristics.90th_percentile_latency_ns": 8142972.0, "characteristics.90th_percentile_latency_s": 0.008142972, "characteristics.90th_percentile_latency_us": 8142.972, "characteristics.accuracy": 61.982, "characteristics.good": 30991, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-128-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.75-128-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_128_75.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "8671348669970487", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 3190151, "90.00 percentile latency (ns)": 5107063, "90th percentile latency (ns)": 5107063, "95.00 percentile latency (ns)": 6558164, "97.00 percentile latency (ns)": 7674754, "99.00 percentile latency (ns)": 10647295, "99.90 percentile latency (ns)": 28116831, "Max latency (ns)": 40141659, "Mean latency (ns)": 3745890, "Min duration satisfied": "Yes", "Min latency (ns)": 2788981, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 265.77, "QPS w/o loadgen overhead": 266.96, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 5.107063, "characteristics.90th_percentile_latency_ns": 5107063.0, "characteristics.90th_percentile_latency_s": 0.005107063, "characteristics.90th_percentile_latency_us": 5107.063, "characteristics.accuracy": 61.224, "characteristics.good": 30612, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-96-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-1.0-96-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_1.0_96.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "e828b35b5c046585", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 1591396, "90.00 percentile latency (ns)": 2396821, "90th percentile latency (ns)": 2396821, "95.00 percentile latency (ns)": 3185795, "97.00 percentile latency (ns)": 3752624, "99.00 percentile latency (ns)": 5456919, "99.90 percentile latency (ns)": 20983748, "Max latency (ns)": 55156248, "Mean latency (ns)": 1843523, "Min duration satisfied": "Yes", "Min latency (ns)": 1295102, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 541.21, "QPS w/o loadgen overhead": 542.44, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 2.396821, "characteristics.90th_percentile_latency_ns": 2396821.0, "characteristics.90th_percentile_latency_s": 0.002396821, "characteristics.90th_percentile_latency_us": 2396.821, "characteristics.accuracy": 42.344, "characteristics.good": 21172, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.25-128-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.25-128-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.25_128_quant.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "494627af1aaae8dc", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 13570809, "90.00 percentile latency (ns)": 19984117, "90th percentile latency (ns)": 19984117, "95.00 percentile latency (ns)": 21302576, "97.00 percentile latency (ns)": 22204728, "99.00 percentile latency (ns)": 30900664, "99.90 percentile latency (ns)": 68514394, "Max latency (ns)": 128615776, "Mean latency (ns)": 15198843, "Min duration satisfied": "Yes", "Min latency (ns)": 12668305, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 65.67, "QPS w/o loadgen overhead": 65.79, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 19.984117, "characteristics.90th_percentile_latency_ns": 19984117.0, "characteristics.90th_percentile_latency_s": 0.019984117, "characteristics.90th_percentile_latency_us": 19984.117, "characteristics.accuracy": 75.012, "characteristics.good": 37506, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.3-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-1.3-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_1.3_224.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "442994729341699d", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 4801520, "90.00 percentile latency (ns)": 6983741, "90th percentile latency (ns)": 6983741, "95.00 percentile latency (ns)": 8912254, "97.00 percentile latency (ns)": 10247489, "99.00 percentile latency (ns)": 12489329, "99.90 percentile latency (ns)": 27458206, "Max latency (ns)": 37717599, "Mean latency (ns)": 5461380, "Min duration satisfied": "Yes", "Min latency (ns)": 4492769, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 182.84, "QPS w/o loadgen overhead": 183.1, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 6.983741, "characteristics.90th_percentile_latency_ns": 6983741.0, "characteristics.90th_percentile_latency_s": 0.006983741, "characteristics.90th_percentile_latency_us": 6983.741, "characteristics.accuracy": 64.418, "characteristics.good": 32209, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-small_224_1.0_uint8", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v3-small_224_1.0_uint8", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/mobilenet-v3/checkpoints/v3-small_224_1.0_uint8.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 166.667, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "8c4f848ee32a2155", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 21205849, "90.00 percentile latency (ns)": 28491733, "90th percentile latency (ns)": 28491733, "95.00 percentile latency (ns)": 31140808, "97.00 percentile latency (ns)": 33566705, "99.00 percentile latency (ns)": 40379512, "99.90 percentile latency (ns)": 55318657, "Max latency (ns)": 60898867, "Mean latency (ns)": 23053920, "Min duration satisfied": "Yes", "Min latency (ns)": 19848990, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 43.33, "QPS w/o loadgen overhead": 43.38, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 28.491733, "characteristics.90th_percentile_latency_ns": 28491733.0, "characteristics.90th_percentile_latency_s": 0.028491733, "characteristics.90th_percentile_latency_us": 28491.733, "characteristics.accuracy": 77.542, "characteristics.good": 38771, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite2-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "efficientnet-lite2-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite2.tar.gz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 50, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "5a91a1041528b36b", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 2705505, "90.00 percentile latency (ns)": 3829911, "90th percentile latency (ns)": 3829911, "95.00 percentile latency (ns)": 4993550, "97.00 percentile latency (ns)": 5878104, "99.00 percentile latency (ns)": 8294988, "99.90 percentile latency (ns)": 21465314, "Max latency (ns)": 34418029, "Mean latency (ns)": 3063155, "Min duration satisfied": "Yes", "Min latency (ns)": 2278445, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 325.93, "QPS w/o loadgen overhead": 326.46, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 3.829911, "characteristics.90th_percentile_latency_ns": 3829911.0, "characteristics.90th_percentile_latency_s": 0.003829911, "characteristics.90th_percentile_latency_us": 3829.911, "characteristics.accuracy": 56.738, "characteristics.good": 28369, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.5-128-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.5-128-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.5_128_quant.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "d3b480399570bb61", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 3472945, "90.00 percentile latency (ns)": 5717154, "90th percentile latency (ns)": 5717154, "95.00 percentile latency (ns)": 7195917, "97.00 percentile latency (ns)": 8165524, "99.00 percentile latency (ns)": 10776865, "99.90 percentile latency (ns)": 24271955, "Max latency (ns)": 45045690, "Mean latency (ns)": 4082551, "Min duration satisfied": "Yes", "Min latency (ns)": 3243368, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 244.63, "QPS w/o loadgen overhead": 244.94, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 5.717154, "characteristics.90th_percentile_latency_ns": 5717154.0, "characteristics.90th_percentile_latency_s": 0.005717154, "characteristics.90th_percentile_latency_us": 5717.154, "characteristics.accuracy": 57.044, "characteristics.good": 28522, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-96-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.75-96-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_96_75.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "4225a27370222561", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 14897556, "90.00 percentile latency (ns)": 21268333, "90th percentile latency (ns)": 21268333, "95.00 percentile latency (ns)": 22916310, "97.00 percentile latency (ns)": 24663428, "99.00 percentile latency (ns)": 32392761, "99.90 percentile latency (ns)": 56227513, "Max latency (ns)": 132096246, "Mean latency (ns)": 16446367, "Min duration satisfied": "Yes", "Min latency (ns)": 13775138, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 60.71, "QPS w/o loadgen overhead": 60.8, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 21.268333, "characteristics.90th_percentile_latency_ns": 21268333.0, "characteristics.90th_percentile_latency_s": 0.021268333, "characteristics.90th_percentile_latency_us": 21268.333, "characteristics.accuracy": 75.69, "characteristics.good": 37845, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.4-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-1.4-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_1.4_224.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "2e4b178e2ba3a15a", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 2110559, "90.00 percentile latency (ns)": 3750090, "90th percentile latency (ns)": 3750090, "95.00 percentile latency (ns)": 4759032, "97.00 percentile latency (ns)": 5643936, "99.00 percentile latency (ns)": 8028428, "99.90 percentile latency (ns)": 22896367, "Max latency (ns)": 67397358, "Mean latency (ns)": 2570345, "Min duration satisfied": "Yes", "Min latency (ns)": 1814674, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 387.03, "QPS w/o loadgen overhead": 389.05, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 3.75009, "characteristics.90th_percentile_latency_ns": 3750090.0, "characteristics.90th_percentile_latency_s": 0.00375009, "characteristics.90th_percentile_latency_us": 3750.09, "characteristics.accuracy": 52.446, "characteristics.good": 26223, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-96-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.5-96-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.5_96.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "6243d51713a4f58b", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 8112086, "90.00 percentile latency (ns)": 12402317, "90th percentile latency (ns)": 12402317, "95.00 percentile latency (ns)": 14326093, "97.00 percentile latency (ns)": 15410819, "99.00 percentile latency (ns)": 18444538, "99.90 percentile latency (ns)": 35852002, "Max latency (ns)": 91423324, "Mean latency (ns)": 9190896, "Min duration satisfied": "Yes", "Min latency (ns)": 7444117, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 108.58, "QPS w/o loadgen overhead": 108.8, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 12.402317, "characteristics.90th_percentile_latency_ns": 12402317.0, "characteristics.90th_percentile_latency_s": 0.012402317, "characteristics.90th_percentile_latency_us": 12402.317, "characteristics.accuracy": 73.724, "characteristics.good": 36862, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-large_224_0.75_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v3-large_224_0.75_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/mobilenet-v3/checkpoints/v3-large_224_0.75_float.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 166.667, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "927451ebb9af4cdf", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 4694242, "90.00 percentile latency (ns)": 6117692, "90th percentile latency (ns)": 6117692, "95.00 percentile latency (ns)": 7467539, "97.00 percentile latency (ns)": 8688998, "99.00 percentile latency (ns)": 11693122, "99.90 percentile latency (ns)": 30068279, "Max latency (ns)": 67193497, "Mean latency (ns)": 5181263, "Min duration satisfied": "Yes", "Min latency (ns)": 4319346, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 192.27, "QPS w/o loadgen overhead": 193.0, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 6.117692, "characteristics.90th_percentile_latency_ns": 6117692.0, "characteristics.90th_percentile_latency_s": 0.006117692, "characteristics.90th_percentile_latency_us": 6117.692, "characteristics.accuracy": 66.604, "characteristics.good": 33302, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-1.0-128-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-1.0-128-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_1.0_128.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "de975b3148cc8bbd", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 6929562, "90.00 percentile latency (ns)": 9142153, "90th percentile latency (ns)": 9142153, "95.00 percentile latency (ns)": 11048722, "97.00 percentile latency (ns)": 12337281, "99.00 percentile latency (ns)": 15326310, "99.90 percentile latency (ns)": 34760851, "Max latency (ns)": 79872726, "Mean latency (ns)": 7616493, "Min duration satisfied": "Yes", "Min latency (ns)": 6512623, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 130.95, "QPS w/o loadgen overhead": 131.29, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 9.142153, "characteristics.90th_percentile_latency_ns": 9142153.0, "characteristics.90th_percentile_latency_s": 0.009142153, "characteristics.90th_percentile_latency_us": 9142.153, "characteristics.accuracy": 69.106, "characteristics.good": 34553, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-1.0-160-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-1.0-160-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_1.0_160.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "54886a9fd8ee882b", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 2825887, "90.00 percentile latency (ns)": 4547982, "90th percentile latency (ns)": 4547982, "95.00 percentile latency (ns)": 5654272, "97.00 percentile latency (ns)": 6549864, "99.00 percentile latency (ns)": 9137500, "99.90 percentile latency (ns)": 25101644, "Max latency (ns)": 78271276, "Mean latency (ns)": 3303112, "Min duration satisfied": "Yes", "Min latency (ns)": 2411021, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 301.47, "QPS w/o loadgen overhead": 302.74, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 4.547982, "characteristics.90th_percentile_latency_ns": 4547982.0, "characteristics.90th_percentile_latency_s": 0.004547982, "characteristics.90th_percentile_latency_us": 4547.982, "characteristics.accuracy": 59.822, "characteristics.good": 29911, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-96-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.75-96-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.75_96.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "e78c90229e57b4d9", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 4911861, "90.00 percentile latency (ns)": 6644460, "90th percentile latency (ns)": 6644460, "95.00 percentile latency (ns)": 8404260, "97.00 percentile latency (ns)": 9723878, "99.00 percentile latency (ns)": 12628696, "99.90 percentile latency (ns)": 29728974, "Max latency (ns)": 50145804, "Mean latency (ns)": 5449559, "Min duration satisfied": "Yes", "Min latency (ns)": 4431582, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 182.93, "QPS w/o loadgen overhead": 183.5, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 6.64446, "characteristics.90th_percentile_latency_ns": 6644460.0, "characteristics.90th_percentile_latency_s": 0.00664446, "characteristics.90th_percentile_latency_us": 6644.46, "characteristics.accuracy": 68.336, "characteristics.good": 34168, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-small_224_1.0_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v3-small_224_1.0_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/mobilenet-v3/checkpoints/v3-small_224_1.0_float.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 166.667, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "f4382572274fbca6", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 6332926, "90.00 percentile latency (ns)": 10220590, "90th percentile latency (ns)": 10220590, "95.00 percentile latency (ns)": 11958524, "97.00 percentile latency (ns)": 12961546, "99.00 percentile latency (ns)": 15393528, "99.90 percentile latency (ns)": 32383321, "Max latency (ns)": 65328075, "Mean latency (ns)": 7311425, "Min duration satisfied": "Yes", "Min latency (ns)": 5787974, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 136.44, "QPS w/o loadgen overhead": 136.77, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 10.22059, "characteristics.90th_percentile_latency_ns": 10220590.0, "characteristics.90th_percentile_latency_s": 0.01022059, "characteristics.90th_percentile_latency_us": 10220.59, "characteristics.accuracy": 68.834, "characteristics.good": 34417, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-192-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.75-192-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.75_192.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "7142848066531d70", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 15647016, "90.00 percentile latency (ns)": 22155169, "90th percentile latency (ns)": 22155169, "95.00 percentile latency (ns)": 24195035, "97.00 percentile latency (ns)": 27357508, "99.00 percentile latency (ns)": 34161962, "99.90 percentile latency (ns)": 46351932, "Max latency (ns)": 60826320, "Mean latency (ns)": 17475894, "Min duration satisfied": "Yes", "Min latency (ns)": 12892336, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 57.16, "QPS w/o loadgen overhead": 57.22, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 22.155169, "characteristics.90th_percentile_latency_ns": 22155169.0, "characteristics.90th_percentile_latency_s": 0.022155169, "characteristics.90th_percentile_latency_us": 22155.169, "characteristics.accuracy": 71.23, "characteristics.good": 35615, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite0-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "efficientnet-lite0-quantized", "input_data_types": "uint8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite0.tar.gz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 50, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "28e50b11d48f5b5d", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 31983467, "90.00 percentile latency (ns)": 41380131, "90th percentile latency (ns)": 41380131, "95.00 percentile latency (ns)": 45465492, "97.00 percentile latency (ns)": 48418452, "99.00 percentile latency (ns)": 55658382, "99.90 percentile latency (ns)": 79705121, "Max latency (ns)": 119179089, "Mean latency (ns)": 33971103, "Min duration satisfied": "Yes", "Min latency (ns)": 29749674, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 29.42, "QPS w/o loadgen overhead": 29.44, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 41.380131, "characteristics.90th_percentile_latency_ns": 41380131.0, "characteristics.90th_percentile_latency_s": 0.041380131, "characteristics.90th_percentile_latency_us": 41380.131, "characteristics.accuracy": 79.268, "characteristics.good": 39634, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite3-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "efficientnet-lite3-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite3.tar.gz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 50, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "f84186b64284a32e", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 4607270, "90.00 percentile latency (ns)": 7092963, "90th percentile latency (ns)": 7092963, "95.00 percentile latency (ns)": 8553164, "97.00 percentile latency (ns)": 9833900, "99.00 percentile latency (ns)": 12338954, "99.90 percentile latency (ns)": 25309715, "Max latency (ns)": 39768198, "Mean latency (ns)": 5310523, "Min duration satisfied": "Yes", "Min latency (ns)": 4141071, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 187.71, "QPS w/o loadgen overhead": 188.31, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 7.092963, "characteristics.90th_percentile_latency_ns": 7092963.0, "characteristics.90th_percentile_latency_s": 0.007092963, "characteristics.90th_percentile_latency_us": 7092.963, "characteristics.accuracy": 66.216, "characteristics.good": 33108, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-small_224_0.75_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v3-small_224_0.75_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/mobilenet-v3/checkpoints/v3-small_224_0.75_float.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 166.667, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "0dd91346244dfa8e", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 45358192, "90.00 percentile latency (ns)": 57612452, "90th percentile latency (ns)": 57612452, "95.00 percentile latency (ns)": 60772717, "97.00 percentile latency (ns)": 62859783, "99.00 percentile latency (ns)": 67234597, "99.90 percentile latency (ns)": 83882296, "Max latency (ns)": 99341174, "Mean latency (ns)": 48233655, "Min duration satisfied": "Yes", "Min latency (ns)": 40503997, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 20.72, "QPS w/o loadgen overhead": 20.73, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 57.612452, "characteristics.90th_percentile_latency_ns": 57612452.0, "characteristics.90th_percentile_latency_s": 0.057612452, "characteristics.90th_percentile_latency_us": 57612.452, "characteristics.accuracy": 76.374, "characteristics.good": 38187, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite3-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "efficientnet-lite3-quantized", "input_data_types": "uint8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite3.tar.gz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 50, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "f9143f7a405d682e", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 3763851, "90.00 percentile latency (ns)": 5793127, "90th percentile latency (ns)": 5793127, "95.00 percentile latency (ns)": 7235689, "97.00 percentile latency (ns)": 8224822, "99.00 percentile latency (ns)": 11005492, "99.90 percentile latency (ns)": 24829383, "Max latency (ns)": 53818382, "Mean latency (ns)": 4330018, "Min duration satisfied": "Yes", "Min latency (ns)": 3404859, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 230.63, "QPS w/o loadgen overhead": 230.95, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 5.793127, "characteristics.90th_percentile_latency_ns": 5793127.0, "characteristics.90th_percentile_latency_s": 0.005793127, "characteristics.90th_percentile_latency_us": 5793.127, "characteristics.accuracy": 54.598, "characteristics.good": 27299, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-160-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.35-160-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_160_35.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "a962d74e63b9f960", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 2526139, "90.00 percentile latency (ns)": 3287008, "90th percentile latency (ns)": 3287008, "95.00 percentile latency (ns)": 4142954, "97.00 percentile latency (ns)": 4856590, "99.00 percentile latency (ns)": 6995829, "99.90 percentile latency (ns)": 20903901, "Max latency (ns)": 36392882, "Mean latency (ns)": 2795431, "Min duration satisfied": "Yes", "Min latency (ns)": 2226989, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 356.73, "QPS w/o loadgen overhead": 357.73, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 3.287008, "characteristics.90th_percentile_latency_ns": 3287008.0, "characteristics.90th_percentile_latency_s": 0.003287008, "characteristics.90th_percentile_latency_us": 3287.008, "characteristics.accuracy": 49.478, "characteristics.good": 24739, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.25-192-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.25-192-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.25_192.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "45ae8e3d3c964312", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 10604818, "90.00 percentile latency (ns)": 15938412, "90th percentile latency (ns)": 15938412, "95.00 percentile latency (ns)": 17149087, "97.00 percentile latency (ns)": 17912700, "99.00 percentile latency (ns)": 24453452, "99.90 percentile latency (ns)": 45424383, "Max latency (ns)": 75162704, "Mean latency (ns)": 11944790, "Min duration satisfied": "Yes", "Min latency (ns)": 9387008, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 83.64, "QPS w/o loadgen overhead": 83.72, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 15.938412, "characteristics.90th_percentile_latency_ns": 15938412.0, "characteristics.90th_percentile_latency_s": 0.015938412, "characteristics.90th_percentile_latency_us": 15938.412, "characteristics.accuracy": 68.126, "characteristics.good": 34063, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.75-224-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.75-224-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.75_224_quant.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "01833151f831ea6e", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 9839084, "90.00 percentile latency (ns)": 13872949, "90th percentile latency (ns)": 13872949, "95.00 percentile latency (ns)": 16245484, "97.00 percentile latency (ns)": 17381061, "99.00 percentile latency (ns)": 22943899, "99.90 percentile latency (ns)": 35700217, "Max latency (ns)": 72436071, "Mean latency (ns)": 10868603, "Min duration satisfied": "Yes", "Min latency (ns)": 8839034, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 91.86, "QPS w/o loadgen overhead": 92.01, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 13.872949, "characteristics.90th_percentile_latency_ns": 13872949.0, "characteristics.90th_percentile_latency_s": 0.013872949, "characteristics.90th_percentile_latency_us": 13872.949, "characteristics.accuracy": 75.76, "characteristics.good": 37880, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-large_224_1.0_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v3-large_224_1.0_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/mobilenet-v3/checkpoints/v3-large_224_1.0_float.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 166.667, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "d0ab4847bcf59e6c", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 5754824, "90.00 percentile latency (ns)": 9023177, "90th percentile latency (ns)": 9023177, "95.00 percentile latency (ns)": 10783469, "97.00 percentile latency (ns)": 12168213, "99.00 percentile latency (ns)": 14763628, "99.90 percentile latency (ns)": 31632321, "Max latency (ns)": 114989675, "Mean latency (ns)": 6679444, "Min duration satisfied": "Yes", "Min latency (ns)": 5025886, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 149.26, "QPS w/o loadgen overhead": 149.71, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 9.023177, "characteristics.90th_percentile_latency_ns": 9023177.0, "characteristics.90th_percentile_latency_s": 0.009023177, "characteristics.90th_percentile_latency_us": 9023.177, "characteristics.accuracy": 65.75, "characteristics.good": 32875, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.5-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.5_224.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "30edc40b88bfc0f4", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 6997540, "90.00 percentile latency (ns)": 9418983, "90th percentile latency (ns)": 9418983, "95.00 percentile latency (ns)": 11250228, "97.00 percentile latency (ns)": 12431493, "99.00 percentile latency (ns)": 15358816, "99.90 percentile latency (ns)": 38818923, "Max latency (ns)": 71777679, "Mean latency (ns)": 7713203, "Min duration satisfied": "Yes", "Min latency (ns)": 6344872, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 129.49, "QPS w/o loadgen overhead": 129.65, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 9.418983, "characteristics.90th_percentile_latency_ns": 9418983.0, "characteristics.90th_percentile_latency_s": 0.009418983, "characteristics.90th_percentile_latency_us": 9418.983, "characteristics.accuracy": 64.768, "characteristics.good": 32384, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-1.0-128-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-1.0-128-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_1.0_128_quant.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "a534a7ce4d24a9f8", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 8418474, "90.00 percentile latency (ns)": 12323091, "90th percentile latency (ns)": 12323091, "95.00 percentile latency (ns)": 14483698, "97.00 percentile latency (ns)": 15612738, "99.00 percentile latency (ns)": 21004619, "99.90 percentile latency (ns)": 39125078, "Max latency (ns)": 132804648, "Mean latency (ns)": 9378580, "Min duration satisfied": "Yes", "Min latency (ns)": 7612105, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 106.43, "QPS w/o loadgen overhead": 106.63, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 12.323091, "characteristics.90th_percentile_latency_ns": 12323091.0, "characteristics.90th_percentile_latency_s": 0.012323091, "characteristics.90th_percentile_latency_us": 12323.091, "characteristics.accuracy": 70.122, "characteristics.good": 35061, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.75-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.75_224.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "61b4c921db48c7ae", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 6397121, "90.00 percentile latency (ns)": 9312341, "90th percentile latency (ns)": 9312341, "95.00 percentile latency (ns)": 11220032, "97.00 percentile latency (ns)": 12395791, "99.00 percentile latency (ns)": 14694095, "99.90 percentile latency (ns)": 30173561, "Max latency (ns)": 77117525, "Mean latency (ns)": 7171429, "Min duration satisfied": "Yes", "Min latency (ns)": 5489724, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 139.27, "QPS w/o loadgen overhead": 139.44, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 9.312341, "characteristics.90th_percentile_latency_ns": 9312341.0, "characteristics.90th_percentile_latency_s": 0.009312341, "characteristics.90th_percentile_latency_us": 9312.341, "characteristics.accuracy": 64.12, "characteristics.good": 32060, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.75-160-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.75-160-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.75_160_quant.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "2814370a56bdaf93", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 4670001, "90.00 percentile latency (ns)": 6747202, "90th percentile latency (ns)": 6747202, "95.00 percentile latency (ns)": 8500922, "97.00 percentile latency (ns)": 9783774, "99.00 percentile latency (ns)": 12502149, "99.90 percentile latency (ns)": 29194620, "Max latency (ns)": 116705776, "Mean latency (ns)": 5303339, "Min duration satisfied": "Yes", "Min latency (ns)": 4101393, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 187.92, "QPS w/o loadgen overhead": 188.56, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 6.747202, "characteristics.90th_percentile_latency_ns": 6747202.0, "characteristics.90th_percentile_latency_s": 0.006747202, "characteristics.90th_percentile_latency_us": 6747.202, "characteristics.accuracy": 64.282, "characteristics.good": 32141, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-192-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.5-192-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.5_192.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "b4e2f9d4d0976011", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 8034802, "90.00 percentile latency (ns)": 11373913, "90th percentile latency (ns)": 11373913, "95.00 percentile latency (ns)": 13670092, "97.00 percentile latency (ns)": 15041392, "99.00 percentile latency (ns)": 19687609, "99.90 percentile latency (ns)": 33769305, "Max latency (ns)": 55719716, "Mean latency (ns)": 8868364, "Min duration satisfied": "Yes", "Min latency (ns)": 7166150, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 112.51, "QPS w/o loadgen overhead": 112.76, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 11.373913, "characteristics.90th_percentile_latency_ns": 11373913.0, "characteristics.90th_percentile_latency_s": 0.011373913, "characteristics.90th_percentile_latency_us": 11373.913, "characteristics.accuracy": 72.678, "characteristics.good": 36339, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-large-minimalistic_224_1.0_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v3-large-minimalistic_224_1.0_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/mobilenet-v3/checkpoints/v3-large-minimalistic_224_1.0_float.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 166.667, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "25b085ae2c4ecfa0", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 6404819, "90.00 percentile latency (ns)": 10753006, "90th percentile latency (ns)": 10753006, "95.00 percentile latency (ns)": 12608318, "97.00 percentile latency (ns)": 13665387, "99.00 percentile latency (ns)": 16538150, "99.90 percentile latency (ns)": 36572001, "Max latency (ns)": 119449986, "Mean latency (ns)": 7561171, "Min duration satisfied": "Yes", "Min latency (ns)": 5762712, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 132.12, "QPS w/o loadgen overhead": 132.25, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 10.753006, "characteristics.90th_percentile_latency_ns": 10753006.0, "characteristics.90th_percentile_latency_s": 0.010753006, "characteristics.90th_percentile_latency_us": 10753.006, "characteristics.accuracy": 64.98, "characteristics.good": 32490, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-160-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.75-160-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_160_75.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "7416486640519faa", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 9968214, "90.00 percentile latency (ns)": 13864617, "90th percentile latency (ns)": 13864617, "95.00 percentile latency (ns)": 16311457, "97.00 percentile latency (ns)": 17413893, "99.00 percentile latency (ns)": 23414240, "99.90 percentile latency (ns)": 42304908, "Max latency (ns)": 126889928, "Mean latency (ns)": 10971983, "Min duration satisfied": "Yes", "Min latency (ns)": 8875067, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 90.97, "QPS w/o loadgen overhead": 91.14, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 13.864617, "characteristics.90th_percentile_latency_ns": 13864617.0, "characteristics.90th_percentile_latency_s": 0.013864617, "characteristics.90th_percentile_latency_us": 13864.617, "characteristics.accuracy": 71.77, "characteristics.good": 35885, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-1.0-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_1.0_224.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "78df80407a8cebd9", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 4781676, "90.00 percentile latency (ns)": 7148242, "90th percentile latency (ns)": 7148242, "95.00 percentile latency (ns)": 9019488, "97.00 percentile latency (ns)": 10419452, "99.00 percentile latency (ns)": 13044558, "99.90 percentile latency (ns)": 32743861, "Max latency (ns)": 119847677, "Mean latency (ns)": 5474498, "Min duration satisfied": "Yes", "Min latency (ns)": 4397244, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 182.12, "QPS w/o loadgen overhead": 182.67, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 7.148242, "characteristics.90th_percentile_latency_ns": 7148242.0, "characteristics.90th_percentile_latency_s": 0.007148242, "characteristics.90th_percentile_latency_us": 7148.242, "characteristics.accuracy": 66.75, "characteristics.good": 33375, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-160-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.75-160-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.75_160.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "0a03a4d1cbfdf168", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 1767790, "90.00 percentile latency (ns)": 3067496, "90th percentile latency (ns)": 3067496, "95.00 percentile latency (ns)": 3998513, "97.00 percentile latency (ns)": 4732626, "99.00 percentile latency (ns)": 6746795, "99.90 percentile latency (ns)": 22834130, "Max latency (ns)": 90419231, "Mean latency (ns)": 2163828, "Min duration satisfied": "Yes", "Min latency (ns)": 1510595, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 460.46, "QPS w/o loadgen overhead": 462.14, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 3.067496, "characteristics.90th_percentile_latency_ns": 3067496.0, "characteristics.90th_percentile_latency_s": 0.003067496, "characteristics.90th_percentile_latency_us": 3067.496, "characteristics.accuracy": 47.14, "characteristics.good": 23570, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-96-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.35-96-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.35_96.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "166444bcbbe733fe", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 3101101, "90.00 percentile latency (ns)": 4606962, "90th percentile latency (ns)": 4606962, "95.00 percentile latency (ns)": 5821226, "97.00 percentile latency (ns)": 6873049, "99.00 percentile latency (ns)": 9193634, "99.90 percentile latency (ns)": 24357460, "Max latency (ns)": 53125268, "Mean latency (ns)": 3546216, "Min duration satisfied": "Yes", "Min latency (ns)": 2561205, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 281.01, "QPS w/o loadgen overhead": 281.99, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 4.606962, "characteristics.90th_percentile_latency_ns": 4606962.0, "characteristics.90th_percentile_latency_s": 0.004606962, "characteristics.90th_percentile_latency_us": 4606.962, "characteristics.accuracy": 56.988, "characteristics.good": 28494, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-160-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.35-160-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.35_160.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "f887ddca9a054eaf", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 3298463, "90.00 percentile latency (ns)": 4989617, "90th percentile latency (ns)": 4989617, "95.00 percentile latency (ns)": 6185323, "97.00 percentile latency (ns)": 7223741, "99.00 percentile latency (ns)": 9532973, "99.90 percentile latency (ns)": 25272486, "Max latency (ns)": 68116607, "Mean latency (ns)": 3794261, "Min duration satisfied": "Yes", "Min latency (ns)": 3033362, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 262.51, "QPS w/o loadgen overhead": 263.56, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 4.989617, "characteristics.90th_percentile_latency_ns": 4989617.0, "characteristics.90th_percentile_latency_s": 0.004989617, "characteristics.90th_percentile_latency_us": 4989.617, "characteristics.accuracy": 63.716, "characteristics.good": 31858, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.75-128-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.75-128-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.75_128.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "96ae21eb314d5699", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 3258831, "90.00 percentile latency (ns)": 4735441, "90th percentile latency (ns)": 4735441, "95.00 percentile latency (ns)": 6081996, "97.00 percentile latency (ns)": 7083609, "99.00 percentile latency (ns)": 10020410, "99.90 percentile latency (ns)": 25934489, "Max latency (ns)": 118040027, "Mean latency (ns)": 3740010, "Min duration satisfied": "Yes", "Min latency (ns)": 3003557, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 267.0, "QPS w/o loadgen overhead": 267.38, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 4.735441, "characteristics.90th_percentile_latency_ns": 4735441.0, "characteristics.90th_percentile_latency_s": 0.004735441, "characteristics.90th_percentile_latency_us": 4735.441, "characteristics.accuracy": 55.55, "characteristics.good": 27775, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-128-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.5-128-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_128_50.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "da8e9dda996843a5", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 3953933, "90.00 percentile latency (ns)": 5825632, "90th percentile latency (ns)": 5825632, "95.00 percentile latency (ns)": 7395268, "97.00 percentile latency (ns)": 8692285, "99.00 percentile latency (ns)": 11412757, "99.90 percentile latency (ns)": 27182986, "Max latency (ns)": 125649384, "Mean latency (ns)": 4519968, "Min duration satisfied": "Yes", "Min latency (ns)": 3315570, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 220.53, "QPS w/o loadgen overhead": 221.24, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 5.825632, "characteristics.90th_percentile_latency_ns": 5825632.0, "characteristics.90th_percentile_latency_s": 0.005825632, "characteristics.90th_percentile_latency_us": 5825.632, "characteristics.accuracy": 59.322, "characteristics.good": 29661, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-192-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.35-192-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.35_192.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "dd8bca42d0a69b99", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 67889184, "90.00 percentile latency (ns)": 84102452, "90th percentile latency (ns)": 84102452, "95.00 percentile latency (ns)": 87763643, "97.00 percentile latency (ns)": 89312520, "99.00 percentile latency (ns)": 95767175, "99.90 percentile latency (ns)": 110162958, "Max latency (ns)": 178738883, "Mean latency (ns)": 71423699, "Min duration satisfied": "Yes", "Min latency (ns)": 66685767, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 14.0, "QPS w/o loadgen overhead": 14.0, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 84.102452, "characteristics.90th_percentile_latency_ns": 84102452.0, "characteristics.90th_percentile_latency_s": 0.084102452, "characteristics.90th_percentile_latency_us": 84102.452, "characteristics.accuracy": 75.068, "characteristics.good": 37534, "characteristics.total": 50000, "ck_system": "rpi4coral-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "MakerHawk Pi-FAN DC Brushless Cooling Fan LD3007MS", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite0-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "https://www.raspberrypi.org/products/raspberry-pi-4-model-b/specifications/", "informal_model": "efficientnet-lite0-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/rpi4coral-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite0.tar.gz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 22.2222, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "4899d4daf2931227", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 31877495, "90.00 percentile latency (ns)": 42728287, "90th percentile latency (ns)": 42728287, "95.00 percentile latency (ns)": 52028951, "97.00 percentile latency (ns)": 56685429, "99.00 percentile latency (ns)": 73314095, "99.90 percentile latency (ns)": 129417673, "Max latency (ns)": 136967947, "Mean latency (ns)": 34750909, "Min duration satisfied": "Yes", "Min latency (ns)": 30833201, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 28.74, "QPS w/o loadgen overhead": 28.78, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 42.728287, "characteristics.90th_percentile_latency_ns": 42728287.0, "characteristics.90th_percentile_latency_s": 0.042728287, "characteristics.90th_percentile_latency_us": 42728.287, "characteristics.accuracy": 71.23, "characteristics.good": 35615, "characteristics.total": 50000, "ck_system": "rpi4coral-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "MakerHawk Pi-FAN DC Brushless Cooling Fan LD3007MS", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite0-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "https://www.raspberrypi.org/products/raspberry-pi-4-model-b/specifications/", "informal_model": "efficientnet-lite0-quantized", "input_data_types": "uint8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/rpi4coral-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite0.tar.gz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 22.2222, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "f1af5c2114684be5", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 70886064, "90.00 percentile latency (ns)": 71547265, "90th percentile latency (ns)": 71547265, "95.00 percentile latency (ns)": 71943339, "97.00 percentile latency (ns)": 72174050, "99.00 percentile latency (ns)": 72885726, "99.90 percentile latency (ns)": 83378105, "Max latency (ns)": 84339436, "Mean latency (ns)": 71034742, "Min duration satisfied": "Yes", "Min latency (ns)": 70354665, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 14.07, "QPS w/o loadgen overhead": 14.08, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 71.547265, "characteristics.90th_percentile_latency_ns": 71547265.0, "characteristics.90th_percentile_latency_s": 0.071547265, "characteristics.90th_percentile_latency_us": 71547.265, "characteristics.accuracy": 75.068, "characteristics.good": 37534, "characteristics.total": 50000, "ck_system": "firefly-armnn-v20.08-neon", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite0-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v20.08 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "http://en.t-firefly.com/product/rk3399/; http://opensource.rock-chips.com/wiki_RK3399", "informal_model": "efficientnet-lite0-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/firefly-armnn-v20.08-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite0.tar.gz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-armnn-v20.08-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 20, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "04c276c194e6460a", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 367999010, "90.00 percentile latency (ns)": 369180242, "90th percentile latency (ns)": 369180242, "95.00 percentile latency (ns)": 369547457, "97.00 percentile latency (ns)": 369983217, "99.00 percentile latency (ns)": 372941026, "99.90 percentile latency (ns)": 390337106, "Max latency (ns)": 433434032, "Mean latency (ns)": 368240673, "Min duration satisfied": "Yes", "Min latency (ns)": 366244086, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 2.72, "QPS w/o loadgen overhead": 2.72, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 369.180242, "characteristics.90th_percentile_latency_ns": 369180242.0, "characteristics.90th_percentile_latency_s": 0.369180242, "characteristics.90th_percentile_latency_us": 369180.242, "characteristics.accuracy": 80.676, "characteristics.good": 40338, "characteristics.total": 50000, "ck_system": "firefly-armnn-v20.08-neon", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite4-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v20.08 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "http://en.t-firefly.com/product/rk3399/; http://opensource.rock-chips.com/wiki_RK3399", "informal_model": "efficientnet-lite4-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/firefly-armnn-v20.08-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite4.tar.gz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-armnn-v20.08-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 2, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "ec83a9ee10024e2d", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 203582456, "90.00 percentile latency (ns)": 204266654, "90th percentile latency (ns)": 204266654, "95.00 percentile latency (ns)": 204449593, "97.00 percentile latency (ns)": 204587742, "99.00 percentile latency (ns)": 205185702, "99.90 percentile latency (ns)": 211535294, "Max latency (ns)": 221396534, "Mean latency (ns)": 203601053, "Min duration satisfied": "Yes", "Min latency (ns)": 201406576, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 4.91, "QPS w/o loadgen overhead": 4.91, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 204.266654, "characteristics.90th_percentile_latency_ns": 204266654.0, "characteristics.90th_percentile_latency_s": 0.204266654, "characteristics.90th_percentile_latency_us": 204266.654, "characteristics.accuracy": 71.274, "characteristics.good": 35637, "characteristics.total": 50000, "ck_system": "firefly-armnn-v20.08-neon", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite0-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v20.08 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "http://en.t-firefly.com/product/rk3399/; http://opensource.rock-chips.com/wiki_RK3399", "informal_model": "efficientnet-lite0-quantized", "input_data_types": "uint8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/firefly-armnn-v20.08-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite0.tar.gz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-armnn-v20.08-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 20, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "47ddb72435843425", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 32365690, "90.00 percentile latency (ns)": 37517556, "90th percentile latency (ns)": 37517556, "95.00 percentile latency (ns)": 43617590, "97.00 percentile latency (ns)": 45728015, "99.00 percentile latency (ns)": 50245935, "99.90 percentile latency (ns)": 61438665, "Max latency (ns)": 65509365, "Mean latency (ns)": 30907944, "Min duration satisfied": "Yes", "Min latency (ns)": 11962778, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 32.32, "QPS w/o loadgen overhead": 32.35, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 37.517556, "characteristics.90th_percentile_latency_ns": 37517556.0, "characteristics.90th_percentile_latency_s": 0.037517556, "characteristics.90th_percentile_latency_us": 37517.556, "characteristics.accuracy": 70.738, "characteristics.good": 35369, "characteristics.total": 50000, "ck_system": "xavier-armnn-v20.08-neon", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-192-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v20.08 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-1.0-192-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-armnn-v20.08-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_1.0_192.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-armnn-v20.08-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "2bb9fb9d4a21880b", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 159929863, "90.00 percentile latency (ns)": 178912196, "90th percentile latency (ns)": 178912196, "95.00 percentile latency (ns)": 190743600, "97.00 percentile latency (ns)": 215886960, "99.00 percentile latency (ns)": 261333131, "99.90 percentile latency (ns)": 317856943, "Max latency (ns)": 319960721, "Mean latency (ns)": 166843899, "Min duration satisfied": "Yes", "Min latency (ns)": 155759042, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 5.99, "QPS w/o loadgen overhead": 5.99, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 178.912196, "characteristics.90th_percentile_latency_ns": 178912196.0, "characteristics.90th_percentile_latency_s": 0.178912196, "characteristics.90th_percentile_latency_us": 178912.196, "characteristics.accuracy": 78.536, "characteristics.good": 39268, "characteristics.total": 50000, "ck_system": "xavier-armnn-v20.08-neon", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite4-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v20.08 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "efficientnet-lite4-quantized", "input_data_types": "uint8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-armnn-v20.08-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite4.tar.gz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-armnn-v20.08-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 20, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "b8a9129b3028e9e2", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 11360566, "90.00 percentile latency (ns)": 12799281, "90th percentile latency (ns)": 12799281, "95.00 percentile latency (ns)": 16472872, "97.00 percentile latency (ns)": 17825985, "99.00 percentile latency (ns)": 31098437, "99.90 percentile latency (ns)": 76038064, "Max latency (ns)": 109230785, "Mean latency (ns)": 12103096, "Min duration satisfied": "Yes", "Min latency (ns)": 9897658, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 82.51, "QPS w/o loadgen overhead": 82.62, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 12.799281, "characteristics.90th_percentile_latency_ns": 12799281.0, "characteristics.90th_percentile_latency_s": 0.012799281, "characteristics.90th_percentile_latency_us": 12799.281, "characteristics.accuracy": 63.65, "characteristics.good": 31825, "characteristics.total": 50000, "ck_system": "xavier-armnn-v20.08-neon", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-224-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v20.08 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.5-224-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-armnn-v20.08-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_224_50.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-armnn-v20.08-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "7b1c85c4a148d425", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 14911819, "90.00 percentile latency (ns)": 17111863, "90th percentile latency (ns)": 17111863, "95.00 percentile latency (ns)": 19723613, "97.00 percentile latency (ns)": 21941258, "99.00 percentile latency (ns)": 26034726, "99.90 percentile latency (ns)": 34701129, "Max latency (ns)": 38402324, "Mean latency (ns)": 15383792, "Min duration satisfied": "Yes", "Min latency (ns)": 11800755, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 64.87, "QPS w/o loadgen overhead": 65.0, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 17.111863, "characteristics.90th_percentile_latency_ns": 17111863.0, "characteristics.90th_percentile_latency_s": 0.017111863, "characteristics.90th_percentile_latency_us": 17111.863, "characteristics.accuracy": 52.172, "characteristics.good": 26086, "characteristics.total": 50000, "ck_system": "xavier-armnn-v20.08-neon", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-128-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v20.08 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.35-128-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-armnn-v20.08-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.35_128.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-armnn-v20.08-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "1ae764406bc86b52", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 16184366, "90.00 percentile latency (ns)": 18372203, "90th percentile latency (ns)": 18372203, "95.00 percentile latency (ns)": 21286144, "97.00 percentile latency (ns)": 23634010, "99.00 percentile latency (ns)": 27173867, "99.90 percentile latency (ns)": 32456551, "Max latency (ns)": 40444452, "Mean latency (ns)": 16596230, "Min duration satisfied": "Yes", "Min latency (ns)": 6383522, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 60.16, "QPS w/o loadgen overhead": 60.25, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 18.372203, "characteristics.90th_percentile_latency_ns": 18372203.0, "characteristics.90th_percentile_latency_s": 0.018372203, "characteristics.90th_percentile_latency_us": 18372.203, "characteristics.accuracy": 58.402, "characteristics.good": 29201, "characteristics.total": 50000, "ck_system": "xavier-armnn-v20.08-neon", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-128-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v20.08 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.5-128-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-armnn-v20.08-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.5_128.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-armnn-v20.08-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "c73774b35bfd70e5", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 23273146, "90.00 percentile latency (ns)": 26246142, "90th percentile latency (ns)": 26246142, "95.00 percentile latency (ns)": 30055019, "97.00 percentile latency (ns)": 32656098, "99.00 percentile latency (ns)": 36196830, "99.90 percentile latency (ns)": 45611528, "Max latency (ns)": 45780272, "Mean latency (ns)": 22409061, "Min duration satisfied": "Yes", "Min latency (ns)": 9274274, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 44.58, "QPS w/o loadgen overhead": 44.62, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 26.246142, "characteristics.90th_percentile_latency_ns": 26246142.0, "characteristics.90th_percentile_latency_s": 0.026246142, "characteristics.90th_percentile_latency_us": 26246.142, "characteristics.accuracy": 60.976, "characteristics.good": 30488, "characteristics.total": 50000, "ck_system": "xavier-armnn-v20.08-neon", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v20.08 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.35-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-armnn-v20.08-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.35_224.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-armnn-v20.08-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "89e9c99410d40c09", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 20499108, "90.00 percentile latency (ns)": 23846018, "90th percentile latency (ns)": 23846018, "95.00 percentile latency (ns)": 25805182, "97.00 percentile latency (ns)": 27409162, "99.00 percentile latency (ns)": 30961041, "99.90 percentile latency (ns)": 35256411, "Max latency (ns)": 38387407, "Mean latency (ns)": 19813054, "Min duration satisfied": "Yes", "Min latency (ns)": 13024389, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 50.44, "QPS w/o loadgen overhead": 50.47, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 23.846018, "characteristics.90th_percentile_latency_ns": 23846018.0, "characteristics.90th_percentile_latency_s": 0.023846018, "characteristics.90th_percentile_latency_us": 23846.018, "characteristics.accuracy": 75.068, "characteristics.good": 37534, "characteristics.total": 50000, "ck_system": "xavier-armnn-v20.08-neon", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite0-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v20.08 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "efficientnet-lite0-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-armnn-v20.08-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite0.tar.gz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-armnn-v20.08-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 40, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "03583e52488c8d6c", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 26827508, "90.00 percentile latency (ns)": 31741509, "90th percentile latency (ns)": 31741509, "95.00 percentile latency (ns)": 36928352, "97.00 percentile latency (ns)": 39414442, "99.00 percentile latency (ns)": 42666484, "99.90 percentile latency (ns)": 51494187, "Max latency (ns)": 57397830, "Mean latency (ns)": 26698731, "Min duration satisfied": "Yes", "Min latency (ns)": 10007785, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 37.41, "QPS w/o loadgen overhead": 37.45, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 31.741509, "characteristics.90th_percentile_latency_ns": 31741509.0, "characteristics.90th_percentile_latency_s": 0.031741509, "characteristics.90th_percentile_latency_us": 31741.509, "characteristics.accuracy": 69.016, "characteristics.good": 34508, "characteristics.total": 50000, "ck_system": "xavier-armnn-v20.08-neon", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-160-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v20.08 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-1.0-160-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-armnn-v20.08-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_1.0_160.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-armnn-v20.08-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "21826af4bf524c98", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 50075733, "90.00 percentile latency (ns)": 64974738, "90th percentile latency (ns)": 64974738, "95.00 percentile latency (ns)": 69004784, "97.00 percentile latency (ns)": 72549559, "99.00 percentile latency (ns)": 82036117, "99.90 percentile latency (ns)": 138628253, "Max latency (ns)": 207062578, "Mean latency (ns)": 53385065, "Min duration satisfied": "Yes", "Min latency (ns)": 48722677, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 18.73, "QPS w/o loadgen overhead": 18.73, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 64.974738, "characteristics.90th_percentile_latency_ns": 64974738.0, "characteristics.90th_percentile_latency_s": 0.064974738, "characteristics.90th_percentile_latency_us": 64974.738, "characteristics.accuracy": 74.136, "characteristics.good": 37068, "characteristics.total": 50000, "ck_system": "xavier-armnn-v20.08-neon", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite1-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v20.08 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "efficientnet-lite1-quantized", "input_data_types": "uint8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-armnn-v20.08-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite1.tar.gz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-armnn-v20.08-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 20, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "428f4fa2b5a6b83b", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 9501327, "90.00 percentile latency (ns)": 10902670, "90th percentile latency (ns)": 10902670, "95.00 percentile latency (ns)": 13927093, "97.00 percentile latency (ns)": 15532480, "99.00 percentile latency (ns)": 28442505, "99.90 percentile latency (ns)": 68388535, "Max latency (ns)": 226593381, "Mean latency (ns)": 10220871, "Min duration satisfied": "Yes", "Min latency (ns)": 8355930, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 97.7, "QPS w/o loadgen overhead": 97.84, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 10.90267, "characteristics.90th_percentile_latency_ns": 10902670.0, "characteristics.90th_percentile_latency_s": 0.01090267, "characteristics.90th_percentile_latency_us": 10902.67, "characteristics.accuracy": 61.948, "characteristics.good": 30974, "characteristics.total": 50000, "ck_system": "xavier-armnn-v20.08-neon", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-192-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v20.08 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.5-192-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-armnn-v20.08-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_192_50.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-armnn-v20.08-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "085f2220eef1ad2d", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 6381714, "90.00 percentile latency (ns)": 7223441, "90th percentile latency (ns)": 7223441, "95.00 percentile latency (ns)": 9431140, "97.00 percentile latency (ns)": 10366473, "99.00 percentile latency (ns)": 25244801, "99.90 percentile latency (ns)": 62076664, "Max latency (ns)": 182316731, "Mean latency (ns)": 7028816, "Min duration satisfied": "Yes", "Min latency (ns)": 5310473, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 142.08, "QPS w/o loadgen overhead": 142.27, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 7.223441, "characteristics.90th_percentile_latency_ns": 7223441.0, "characteristics.90th_percentile_latency_s": 0.007223441, "characteristics.90th_percentile_latency_us": 7223.441, "characteristics.accuracy": 49.19, "characteristics.good": 24595, "characteristics.total": 50000, "ck_system": "xavier-armnn-v20.08-neon", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-128-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v20.08 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.35-128-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-armnn-v20.08-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_128_35.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-armnn-v20.08-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "c4bcc15edf49c9a9", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 26666840, "90.00 percentile latency (ns)": 33437846, "90th percentile latency (ns)": 33437846, "95.00 percentile latency (ns)": 37800613, "97.00 percentile latency (ns)": 41092006, "99.00 percentile latency (ns)": 47619626, "99.90 percentile latency (ns)": 60094184, "Max latency (ns)": 92551923, "Mean latency (ns)": 28227963, "Min duration satisfied": "Yes", "Min latency (ns)": 24900084, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 35.39, "QPS w/o loadgen overhead": 35.43, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 33.437846, "characteristics.90th_percentile_latency_ns": 33437846.0, "characteristics.90th_percentile_latency_s": 0.033437846, "characteristics.90th_percentile_latency_us": 33437.846, "characteristics.accuracy": 73.556, "characteristics.good": 36778, "characteristics.total": 50000, "ck_system": "xavier-armnn-v20.08-neon", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.4-224-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v20.08 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-1.4-224-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-armnn-v20.08-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_224_140.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-armnn-v20.08-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "f4f68da4d53b7093", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 20710875, "90.00 percentile latency (ns)": 23974840, "90th percentile latency (ns)": 23974840, "95.00 percentile latency (ns)": 28287826, "97.00 percentile latency (ns)": 30358673, "99.00 percentile latency (ns)": 33166368, "99.90 percentile latency (ns)": 42881271, "Max latency (ns)": 52803545, "Mean latency (ns)": 20756396, "Min duration satisfied": "Yes", "Min latency (ns)": 7948803, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 48.1, "QPS w/o loadgen overhead": 48.18, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 23.97484, "characteristics.90th_percentile_latency_ns": 23974840.0, "characteristics.90th_percentile_latency_s": 0.02397484, "characteristics.90th_percentile_latency_us": 23974.84, "characteristics.accuracy": 64.038, "characteristics.good": 32019, "characteristics.total": 50000, "ck_system": "xavier-armnn-v20.08-neon", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-128-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v20.08 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.75-128-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-armnn-v20.08-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.75_128.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-armnn-v20.08-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "906341a6bea6b9e9", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 7815130, "90.00 percentile latency (ns)": 8686529, "90th percentile latency (ns)": 8686529, "95.00 percentile latency (ns)": 11469947, "97.00 percentile latency (ns)": 13051617, "99.00 percentile latency (ns)": 28629810, "99.90 percentile latency (ns)": 56285468, "Max latency (ns)": 294085972, "Mean latency (ns)": 8521242, "Min duration satisfied": "Yes", "Min latency (ns)": 6944051, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 117.24, "QPS w/o loadgen overhead": 117.35, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 8.686529, "characteristics.90th_percentile_latency_ns": 8686529.0, "characteristics.90th_percentile_latency_s": 0.008686529, "characteristics.90th_percentile_latency_us": 8686.529, "characteristics.accuracy": 59.232, "characteristics.good": 29616, "characteristics.total": 50000, "ck_system": "xavier-armnn-v20.08-neon", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-160-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v20.08 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.5-160-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-armnn-v20.08-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_160_50.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-armnn-v20.08-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "ae44289af6f2326c", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 6763838, "90.00 percentile latency (ns)": 7896781, "90th percentile latency (ns)": 7896781, "95.00 percentile latency (ns)": 10515452, "97.00 percentile latency (ns)": 11855350, "99.00 percentile latency (ns)": 22281261, "99.90 percentile latency (ns)": 46742263, "Max latency (ns)": 229195411, "Mean latency (ns)": 7504248, "Min duration satisfied": "Yes", "Min latency (ns)": 6315019, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 133.03, "QPS w/o loadgen overhead": 133.26, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 7.896781, "characteristics.90th_percentile_latency_ns": 7896781.0, "characteristics.90th_percentile_latency_s": 0.007896781, "characteristics.90th_percentile_latency_us": 7896.781, "characteristics.accuracy": 59.072, "characteristics.good": 29536, "characteristics.total": 50000, "ck_system": "xavier-armnn-v20.08-neon", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-96-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v20.08 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-1.0-96-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-armnn-v20.08-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_96_100.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-armnn-v20.08-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "182c33ee5189171d", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 17903396, "90.00 percentile latency (ns)": 22909300, "90th percentile latency (ns)": 22909300, "95.00 percentile latency (ns)": 25098203, "97.00 percentile latency (ns)": 27844025, "99.00 percentile latency (ns)": 36053264, "99.90 percentile latency (ns)": 57857635, "Max latency (ns)": 120572619, "Mean latency (ns)": 19231555, "Min duration satisfied": "Yes", "Min latency (ns)": 16846213, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 51.95, "QPS w/o loadgen overhead": 52.0, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 22.9093, "characteristics.90th_percentile_latency_ns": 22909300.0, "characteristics.90th_percentile_latency_s": 0.0229093, "characteristics.90th_percentile_latency_us": 22909.3, "characteristics.accuracy": 72.892, "characteristics.good": 36446, "characteristics.total": 50000, "ck_system": "xavier-armnn-v20.08-neon", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-large_224_1.0_uint8", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v20.08 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v3-large_224_1.0_uint8", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-armnn-v20.08-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-large_224_1.0_uint8.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-armnn-v20.08-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 83.3333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "774fe9a9bdd3d007", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 18108314, "90.00 percentile latency (ns)": 24100213, "90th percentile latency (ns)": 24100213, "95.00 percentile latency (ns)": 26347475, "97.00 percentile latency (ns)": 28869822, "99.00 percentile latency (ns)": 38236871, "99.90 percentile latency (ns)": 49949110, "Max latency (ns)": 208702640, "Mean latency (ns)": 19425534, "Min duration satisfied": "Yes", "Min latency (ns)": 16156423, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 51.42, "QPS w/o loadgen overhead": 51.48, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 24.100213, "characteristics.90th_percentile_latency_ns": 24100213.0, "characteristics.90th_percentile_latency_s": 0.024100213, "characteristics.90th_percentile_latency_us": 24100.213, "characteristics.accuracy": 70.598, "characteristics.good": 35299, "characteristics.total": 50000, "ck_system": "xavier-armnn-v20.08-neon", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-224-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v20.08 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-1.0-224-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-armnn-v20.08-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_224_100.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-armnn-v20.08-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "bc83b11ede6fb032", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 9219209, "90.00 percentile latency (ns)": 11215886, "90th percentile latency (ns)": 11215886, "95.00 percentile latency (ns)": 14107489, "97.00 percentile latency (ns)": 16087686, "99.00 percentile latency (ns)": 29826703, "99.90 percentile latency (ns)": 60496313, "Max latency (ns)": 176300606, "Mean latency (ns)": 10130068, "Min duration satisfied": "Yes", "Min latency (ns)": 7980433, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 98.58, "QPS w/o loadgen overhead": 98.72, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 11.215886, "characteristics.90th_percentile_latency_ns": 11215886.0, "characteristics.90th_percentile_latency_s": 0.011215886, "characteristics.90th_percentile_latency_us": 11215.886, "characteristics.accuracy": 56.522, "characteristics.good": 28261, "characteristics.total": 50000, "ck_system": "xavier-armnn-v20.08-neon", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-192-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v20.08 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.35-192-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-armnn-v20.08-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_192_35.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-armnn-v20.08-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "2a428ab25cbb8097", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 11711570, "90.00 percentile latency (ns)": 13429532, "90th percentile latency (ns)": 13429532, "95.00 percentile latency (ns)": 16640356, "97.00 percentile latency (ns)": 18182341, "99.00 percentile latency (ns)": 28082410, "99.90 percentile latency (ns)": 43318035, "Max latency (ns)": 107207533, "Mean latency (ns)": 12225564, "Min duration satisfied": "Yes", "Min latency (ns)": 10029802, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 81.68, "QPS w/o loadgen overhead": 81.8, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 13.429532, "characteristics.90th_percentile_latency_ns": 13429532.0, "characteristics.90th_percentile_latency_s": 0.013429532, "characteristics.90th_percentile_latency_us": 13429.532, "characteristics.accuracy": 67.726, "characteristics.good": 33863, "characteristics.total": 50000, "ck_system": "xavier-armnn-v20.08-neon", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-160-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v20.08 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-1.0-160-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-armnn-v20.08-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_160_100.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-armnn-v20.08-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "4e008bb52206a539", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 8521554, "90.00 percentile latency (ns)": 9756288, "90th percentile latency (ns)": 9756288, "95.00 percentile latency (ns)": 12542081, "97.00 percentile latency (ns)": 14123426, "99.00 percentile latency (ns)": 20863444, "99.90 percentile latency (ns)": 39097379, "Max latency (ns)": 82797573, "Mean latency (ns)": 9228577, "Min duration satisfied": "Yes", "Min latency (ns)": 8041445, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 108.2, "QPS w/o loadgen overhead": 108.36, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 9.756288, "characteristics.90th_percentile_latency_ns": 9756288.0, "characteristics.90th_percentile_latency_s": 0.009756288, "characteristics.90th_percentile_latency_us": 9756.288, "characteristics.accuracy": 63.442, "characteristics.good": 31721, "characteristics.total": 50000, "ck_system": "xavier-armnn-v20.08-neon", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-128-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v20.08 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-1.0-128-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-armnn-v20.08-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_128_100.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-armnn-v20.08-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "04444e7f4144d398", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 71825590, "90.00 percentile latency (ns)": 86635280, "90th percentile latency (ns)": 86635280, "95.00 percentile latency (ns)": 90052369, "97.00 percentile latency (ns)": 92532357, "99.00 percentile latency (ns)": 110124866, "99.90 percentile latency (ns)": 157519001, "Max latency (ns)": 230687534, "Mean latency (ns)": 75122016, "Min duration satisfied": "Yes", "Min latency (ns)": 70742659, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 13.31, "QPS w/o loadgen overhead": 13.31, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 86.63528, "characteristics.90th_percentile_latency_ns": 86635280.0, "characteristics.90th_percentile_latency_s": 0.08663528, "characteristics.90th_percentile_latency_us": 86635.28, "characteristics.accuracy": 74.112, "characteristics.good": 37056, "characteristics.total": 50000, "ck_system": "xavier-armnn-v20.08-neon", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite2-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v20.08 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "efficientnet-lite2-quantized", "input_data_types": "uint8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-armnn-v20.08-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite2.tar.gz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-armnn-v20.08-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 20, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "8b5d1646d580c943", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 10694592, "90.00 percentile latency (ns)": 12670618, "90th percentile latency (ns)": 12670618, "95.00 percentile latency (ns)": 15658975, "97.00 percentile latency (ns)": 17143362, "99.00 percentile latency (ns)": 31247866, "99.90 percentile latency (ns)": 65382743, "Max latency (ns)": 179764202, "Mean latency (ns)": 11639597, "Min duration satisfied": "Yes", "Min latency (ns)": 9600398, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 85.81, "QPS w/o loadgen overhead": 85.91, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 12.670618, "characteristics.90th_percentile_latency_ns": 12670618.0, "characteristics.90th_percentile_latency_s": 0.012670618, "characteristics.90th_percentile_latency_us": 12670.618, "characteristics.accuracy": 58.544, "characteristics.good": 29272, "characteristics.total": 50000, "ck_system": "xavier-armnn-v20.08-neon", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-224-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v20.08 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.35-224-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-armnn-v20.08-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_224_35.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-armnn-v20.08-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "6380d2a6291d72a3", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 22358514, "90.00 percentile latency (ns)": 25565448, "90th percentile latency (ns)": 25565448, "95.00 percentile latency (ns)": 30411471, "97.00 percentile latency (ns)": 32780325, "99.00 percentile latency (ns)": 35351510, "99.90 percentile latency (ns)": 45810724, "Max latency (ns)": 49198745, "Mean latency (ns)": 22368668, "Min duration satisfied": "Yes", "Min latency (ns)": 8510411, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 44.64, "QPS w/o loadgen overhead": 44.71, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 25.565448, "characteristics.90th_percentile_latency_ns": 25565448.0, "characteristics.90th_percentile_latency_s": 0.025565448, "characteristics.90th_percentile_latency_us": 25565.448, "characteristics.accuracy": 66.036, "characteristics.good": 33018, "characteristics.total": 50000, "ck_system": "xavier-armnn-v20.08-neon", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-128-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v20.08 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-1.0-128-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-armnn-v20.08-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_1.0_128.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-armnn-v20.08-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "93be4fdf9f143d4a", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 29594929, "90.00 percentile latency (ns)": 33585293, "90th percentile latency (ns)": 33585293, "95.00 percentile latency (ns)": 35608013, "97.00 percentile latency (ns)": 38347629, "99.00 percentile latency (ns)": 42773918, "99.90 percentile latency (ns)": 48580367, "Max latency (ns)": 59373675, "Mean latency (ns)": 28805973, "Min duration satisfied": "Yes", "Min latency (ns)": 18010287, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 34.7, "QPS w/o loadgen overhead": 34.72, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 33.585293, "characteristics.90th_percentile_latency_ns": 33585293.0, "characteristics.90th_percentile_latency_s": 0.033585293, "characteristics.90th_percentile_latency_us": 33585.293, "characteristics.accuracy": 76.642, "characteristics.good": 38321, "characteristics.total": 50000, "ck_system": "xavier-armnn-v20.08-neon", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite1-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v20.08 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "efficientnet-lite1-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-armnn-v20.08-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite1.tar.gz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-armnn-v20.08-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 20, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "6a182c80f4992bf9", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 14454597, "90.00 percentile latency (ns)": 17665165, "90th percentile latency (ns)": 17665165, "95.00 percentile latency (ns)": 20567176, "97.00 percentile latency (ns)": 22430839, "99.00 percentile latency (ns)": 32834865, "99.90 percentile latency (ns)": 46407344, "Max latency (ns)": 94786834, "Mean latency (ns)": 15233894, "Min duration satisfied": "Yes", "Min latency (ns)": 12752670, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 65.57, "QPS w/o loadgen overhead": 65.64, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 17.665165, "characteristics.90th_percentile_latency_ns": 17665165.0, "characteristics.90th_percentile_latency_s": 0.017665165, "characteristics.90th_percentile_latency_us": 17665.165, "characteristics.accuracy": 69.678, "characteristics.good": 34839, "characteristics.total": 50000, "ck_system": "xavier-armnn-v20.08-neon", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-192-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v20.08 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-1.0-192-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-armnn-v20.08-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_192_100.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-armnn-v20.08-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "cfa84d5bd8e8c868", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 16212166, "90.00 percentile latency (ns)": 20874152, "90th percentile latency (ns)": 20874152, "95.00 percentile latency (ns)": 23366543, "97.00 percentile latency (ns)": 25025108, "99.00 percentile latency (ns)": 35863034, "99.90 percentile latency (ns)": 52495950, "Max latency (ns)": 148823361, "Mean latency (ns)": 17255096, "Min duration satisfied": "Yes", "Min latency (ns)": 14006440, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 57.89, "QPS w/o loadgen overhead": 57.95, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 20.874152, "characteristics.90th_percentile_latency_ns": 20874152.0, "characteristics.90th_percentile_latency_s": 0.020874152, "characteristics.90th_percentile_latency_us": 20874.152, "characteristics.accuracy": 68.76, "characteristics.good": 34380, "characteristics.total": 50000, "ck_system": "xavier-armnn-v20.08-neon", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-224-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v20.08 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.75-224-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-armnn-v20.08-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_224_75.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-armnn-v20.08-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "48e8c4fa790a9394", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 8360425, "90.00 percentile latency (ns)": 9724138, "90th percentile latency (ns)": 9724138, "95.00 percentile latency (ns)": 10410889, "97.00 percentile latency (ns)": 11067752, "99.00 percentile latency (ns)": 13280625, "99.90 percentile latency (ns)": 20646283, "Max latency (ns)": 24587781, "Mean latency (ns)": 8303849, "Min duration satisfied": "Yes", "Min latency (ns)": 5803281, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 120.26, "QPS w/o loadgen overhead": 120.43, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 9.724138, "characteristics.90th_percentile_latency_ns": 9724138.0, "characteristics.90th_percentile_latency_s": 0.009724138, "characteristics.90th_percentile_latency_us": 9724.138, "characteristics.accuracy": 63.332, "characteristics.good": 31666, "characteristics.total": 50000, "ck_system": "xavier-armnn-v20.08-neon", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-small-minimalistic_224_1.0_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v20.08 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v3-small-minimalistic_224_1.0_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-armnn-v20.08-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-small-minimalistic_224_1.0_float.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-armnn-v20.08-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 83.3333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "998d88d9502040a0", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 5204910, "90.00 percentile latency (ns)": 5679236, "90th percentile latency (ns)": 5679236, "95.00 percentile latency (ns)": 6438758, "97.00 percentile latency (ns)": 8214519, "99.00 percentile latency (ns)": 20012278, "99.90 percentile latency (ns)": 58203595, "Max latency (ns)": 157315959, "Mean latency (ns)": 5696625, "Min duration satisfied": "Yes", "Min latency (ns)": 4670614, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 175.33, "QPS w/o loadgen overhead": 175.54, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 5.679236, "characteristics.90th_percentile_latency_ns": 5679236.0, "characteristics.90th_percentile_latency_s": 0.005679236, "characteristics.90th_percentile_latency_us": 5679.236, "characteristics.accuracy": 43.454, "characteristics.good": 21727, "characteristics.total": 50000, "ck_system": "xavier-armnn-v20.08-neon", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-96-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v20.08 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.35-96-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-armnn-v20.08-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_96_35.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-armnn-v20.08-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "b739f5eac5402a7e", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 52284156, "90.00 percentile latency (ns)": 88623563, "90th percentile latency (ns)": 88623563, "95.00 percentile latency (ns)": 93061148, "97.00 percentile latency (ns)": 95222626, "99.00 percentile latency (ns)": 108417743, "99.90 percentile latency (ns)": 113785131, "Max latency (ns)": 119064036, "Mean latency (ns)": 61307335, "Min duration satisfied": "Yes", "Min latency (ns)": 50270589, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 16.3, "QPS w/o loadgen overhead": 16.31, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 88.623563, "characteristics.90th_percentile_latency_ns": 88623563.0, "characteristics.90th_percentile_latency_s": 0.088623563, "characteristics.90th_percentile_latency_us": 88623.563, "characteristics.accuracy": 80.676, "characteristics.good": 40338, "characteristics.total": 50000, "ck_system": "xavier-armnn-v20.08-neon", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite4-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v20.08 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "efficientnet-lite4-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-armnn-v20.08-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite4.tar.gz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-armnn-v20.08-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 20, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "0ef1e7d5646438f9", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 14650226, "90.00 percentile latency (ns)": 20389919, "90th percentile latency (ns)": 20389919, "95.00 percentile latency (ns)": 22197364, "97.00 percentile latency (ns)": 23132288, "99.00 percentile latency (ns)": 30674851, "99.90 percentile latency (ns)": 50055443, "Max latency (ns)": 170138981, "Mean latency (ns)": 15985944, "Min duration satisfied": "Yes", "Min latency (ns)": 13582239, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 62.49, "QPS w/o loadgen overhead": 62.55, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 20.389919, "characteristics.90th_percentile_latency_ns": 20389919.0, "characteristics.90th_percentile_latency_s": 0.020389919, "characteristics.90th_percentile_latency_us": 20389.919, "characteristics.accuracy": 70.33, "characteristics.good": 35165, "characteristics.total": 50000, "ck_system": "xavier-armnn-v20.08-neon", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-large-minimalistic_224_1.0_uint8", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v20.08 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v3-large-minimalistic_224_1.0_uint8", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-armnn-v20.08-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-large-minimalistic_224_1.0_uint8.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-armnn-v20.08-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 83.3333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "5a8f44f584d0e71e", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 13152489, "90.00 percentile latency (ns)": 16200848, "90th percentile latency (ns)": 16200848, "95.00 percentile latency (ns)": 18971179, "97.00 percentile latency (ns)": 21049798, "99.00 percentile latency (ns)": 32227735, "99.90 percentile latency (ns)": 76120181, "Max latency (ns)": 163141742, "Mean latency (ns)": 14187117, "Min duration satisfied": "Yes", "Min latency (ns)": 11296470, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 70.4, "QPS w/o loadgen overhead": 70.49, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 16.200848, "characteristics.90th_percentile_latency_ns": 16200848.0, "characteristics.90th_percentile_latency_s": 0.016200848, "characteristics.90th_percentile_latency_us": 16200.848, "characteristics.accuracy": 67.4, "characteristics.good": 33700, "characteristics.total": 50000, "ck_system": "xavier-armnn-v20.08-neon", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-192-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v20.08 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.75-192-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-armnn-v20.08-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_192_75.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-armnn-v20.08-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "29bbd08e04cde900", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 19089038, "90.00 percentile latency (ns)": 21674912, "90th percentile latency (ns)": 21674912, "95.00 percentile latency (ns)": 26503031, "97.00 percentile latency (ns)": 28272581, "99.00 percentile latency (ns)": 32013098, "99.90 percentile latency (ns)": 41510094, "Max latency (ns)": 51354723, "Mean latency (ns)": 19180413, "Min duration satisfied": "Yes", "Min latency (ns)": 7659955, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 52.05, "QPS w/o loadgen overhead": 52.14, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 21.674912, "characteristics.90th_percentile_latency_ns": 21674912.0, "characteristics.90th_percentile_latency_s": 0.021674912, "characteristics.90th_percentile_latency_us": 21674.912, "characteristics.accuracy": 61.668, "characteristics.good": 30834, "characteristics.total": 50000, "ck_system": "xavier-armnn-v20.08-neon", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-160-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v20.08 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.5-160-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-armnn-v20.08-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.5_160.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-armnn-v20.08-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "0286448f0b7c6ecd", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 5284076, "90.00 percentile latency (ns)": 6101200, "90th percentile latency (ns)": 6101200, "95.00 percentile latency (ns)": 8198221, "97.00 percentile latency (ns)": 8965360, "99.00 percentile latency (ns)": 16842928, "99.90 percentile latency (ns)": 57474436, "Max latency (ns)": 108013773, "Mean latency (ns)": 5911733, "Min duration satisfied": "Yes", "Min latency (ns)": 4869785, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 168.97, "QPS w/o loadgen overhead": 169.16, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 6.1012, "characteristics.90th_percentile_latency_ns": 6101200.0, "characteristics.90th_percentile_latency_s": 0.0061012, "characteristics.90th_percentile_latency_us": 6101.2, "characteristics.accuracy": 49.296, "characteristics.good": 24648, "characteristics.total": 50000, "ck_system": "xavier-armnn-v20.08-neon", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-96-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v20.08 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.5-96-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-armnn-v20.08-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_96_50.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-armnn-v20.08-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "8df970539d8b7e62", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 8452120, "90.00 percentile latency (ns)": 9484872, "90th percentile latency (ns)": 9484872, "95.00 percentile latency (ns)": 12098827, "97.00 percentile latency (ns)": 13732372, "99.00 percentile latency (ns)": 23414024, "99.90 percentile latency (ns)": 52875960, "Max latency (ns)": 228006255, "Mean latency (ns)": 9061915, "Min duration satisfied": "Yes", "Min latency (ns)": 7447719, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 110.19, "QPS w/o loadgen overhead": 110.35, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 9.484872, "characteristics.90th_percentile_latency_ns": 9484872.0, "characteristics.90th_percentile_latency_s": 0.009484872, "characteristics.90th_percentile_latency_us": 9484.872, "characteristics.accuracy": 62.082, "characteristics.good": 31041, "characteristics.total": 50000, "ck_system": "xavier-armnn-v20.08-neon", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-128-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v20.08 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.75-128-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-armnn-v20.08-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_128_75.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-armnn-v20.08-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "2ae2e92240708385", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 17852945, "90.00 percentile latency (ns)": 20085807, "90th percentile latency (ns)": 20085807, "95.00 percentile latency (ns)": 24215134, "97.00 percentile latency (ns)": 26007817, "99.00 percentile latency (ns)": 29151597, "99.90 percentile latency (ns)": 37146016, "Max latency (ns)": 43881339, "Mean latency (ns)": 18256143, "Min duration satisfied": "Yes", "Min latency (ns)": 12406667, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 54.68, "QPS w/o loadgen overhead": 54.78, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 20.085807, "characteristics.90th_percentile_latency_ns": 20085807.0, "characteristics.90th_percentile_latency_s": 0.020085807, "characteristics.90th_percentile_latency_us": 20085.807, "characteristics.accuracy": 61.224, "characteristics.good": 30612, "characteristics.total": 50000, "ck_system": "xavier-armnn-v20.08-neon", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-96-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v20.08 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-1.0-96-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-armnn-v20.08-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_1.0_96.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-armnn-v20.08-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "b73ade438fc54353", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 53780064, "90.00 percentile latency (ns)": 62113179, "90th percentile latency (ns)": 62113179, "95.00 percentile latency (ns)": 67437437, "97.00 percentile latency (ns)": 70439044, "99.00 percentile latency (ns)": 74684788, "99.90 percentile latency (ns)": 85995207, "Max latency (ns)": 88167440, "Mean latency (ns)": 53161486, "Min duration satisfied": "Yes", "Min latency (ns)": 28166817, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 18.8, "QPS w/o loadgen overhead": 18.81, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 62.113179, "characteristics.90th_percentile_latency_ns": 62113179.0, "characteristics.90th_percentile_latency_s": 0.062113179, "characteristics.90th_percentile_latency_us": 62113.179, "characteristics.accuracy": 75.012, "characteristics.good": 37506, "characteristics.total": 50000, "ck_system": "xavier-armnn-v20.08-neon", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.3-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v20.08 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-1.3-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-armnn-v20.08-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_1.3_224.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-armnn-v20.08-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "fe03004d6aaf05a0", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 8882242, "90.00 percentile latency (ns)": 10477229, "90th percentile latency (ns)": 10477229, "95.00 percentile latency (ns)": 12280802, "97.00 percentile latency (ns)": 13721030, "99.00 percentile latency (ns)": 26070826, "99.90 percentile latency (ns)": 54382367, "Max latency (ns)": 162883887, "Mean latency (ns)": 9617984, "Min duration satisfied": "Yes", "Min latency (ns)": 8409259, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 103.81, "QPS w/o loadgen overhead": 103.97, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 10.477229, "characteristics.90th_percentile_latency_ns": 10477229.0, "characteristics.90th_percentile_latency_s": 0.010477229, "characteristics.90th_percentile_latency_us": 10477.229, "characteristics.accuracy": 63.882, "characteristics.good": 31941, "characteristics.total": 50000, "ck_system": "xavier-armnn-v20.08-neon", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-small_224_1.0_uint8", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v20.08 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v3-small_224_1.0_uint8", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-armnn-v20.08-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-small_224_1.0_uint8.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-armnn-v20.08-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 83.3333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "42d4f4f9330dea48", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 38449650, "90.00 percentile latency (ns)": 42866274, "90th percentile latency (ns)": 42866274, "95.00 percentile latency (ns)": 45642694, "97.00 percentile latency (ns)": 48465226, "99.00 percentile latency (ns)": 53123846, "99.90 percentile latency (ns)": 59786047, "Max latency (ns)": 61438605, "Mean latency (ns)": 37609506, "Min duration satisfied": "Yes", "Min latency (ns)": 22991291, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 26.58, "QPS w/o loadgen overhead": 26.59, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 42.866274, "characteristics.90th_percentile_latency_ns": 42866274.0, "characteristics.90th_percentile_latency_s": 0.042866274, "characteristics.90th_percentile_latency_us": 42866.274, "characteristics.accuracy": 77.542, "characteristics.good": 38771, "characteristics.total": 50000, "ck_system": "xavier-armnn-v20.08-neon", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite2-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v20.08 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "efficientnet-lite2-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-armnn-v20.08-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite2.tar.gz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-armnn-v20.08-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 20, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "5b0912a5e3d32a39", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 6646294, "90.00 percentile latency (ns)": 7342263, "90th percentile latency (ns)": 7342263, "95.00 percentile latency (ns)": 9490331, "97.00 percentile latency (ns)": 11247469, "99.00 percentile latency (ns)": 21134841, "99.90 percentile latency (ns)": 58113491, "Max latency (ns)": 240137761, "Mean latency (ns)": 7156838, "Min duration satisfied": "Yes", "Min latency (ns)": 5889905, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 139.52, "QPS w/o loadgen overhead": 139.73, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 7.342263, "characteristics.90th_percentile_latency_ns": 7342263.0, "characteristics.90th_percentile_latency_s": 0.007342263, "characteristics.90th_percentile_latency_us": 7342.263, "characteristics.accuracy": 57.054, "characteristics.good": 28527, "characteristics.total": 50000, "ck_system": "xavier-armnn-v20.08-neon", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-96-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v20.08 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.75-96-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-armnn-v20.08-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_96_75.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-armnn-v20.08-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "1034408b974c2413", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 57482794, "90.00 percentile latency (ns)": 65837594, "90th percentile latency (ns)": 65837594, "95.00 percentile latency (ns)": 71698657, "97.00 percentile latency (ns)": 74102852, "99.00 percentile latency (ns)": 78095934, "99.90 percentile latency (ns)": 85249329, "Max latency (ns)": 89388025, "Mean latency (ns)": 55780093, "Min duration satisfied": "Yes", "Min latency (ns)": 19450096, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 17.92, "QPS w/o loadgen overhead": 17.93, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 65.837594, "characteristics.90th_percentile_latency_ns": 65837594.0, "characteristics.90th_percentile_latency_s": 0.065837594, "characteristics.90th_percentile_latency_us": 65837.594, "characteristics.accuracy": 75.69, "characteristics.good": 37845, "characteristics.total": 50000, "ck_system": "xavier-armnn-v20.08-neon", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.4-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v20.08 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-1.4-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-armnn-v20.08-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_1.4_224.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-armnn-v20.08-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "7a3b25635474497b", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 13792872, "90.00 percentile latency (ns)": 15571033, "90th percentile latency (ns)": 15571033, "95.00 percentile latency (ns)": 17394026, "97.00 percentile latency (ns)": 19902362, "99.00 percentile latency (ns)": 24781749, "99.90 percentile latency (ns)": 33315569, "Max latency (ns)": 35672445, "Mean latency (ns)": 14127881, "Min duration satisfied": "Yes", "Min latency (ns)": 6521188, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 70.61, "QPS w/o loadgen overhead": 70.78, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 15.571033, "characteristics.90th_percentile_latency_ns": 15571033.0, "characteristics.90th_percentile_latency_s": 0.015571033, "characteristics.90th_percentile_latency_us": 15571.033, "characteristics.accuracy": 52.446, "characteristics.good": 26223, "characteristics.total": 50000, "ck_system": "xavier-armnn-v20.08-neon", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-96-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v20.08 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.5-96-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-armnn-v20.08-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.5_96.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-armnn-v20.08-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "b8270189d673fe7a", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 16992862, "90.00 percentile latency (ns)": 18983031, "90th percentile latency (ns)": 18983031, "95.00 percentile latency (ns)": 20416617, "97.00 percentile latency (ns)": 21985401, "99.00 percentile latency (ns)": 24948778, "99.90 percentile latency (ns)": 30074066, "Max latency (ns)": 33147154, "Mean latency (ns)": 16948554, "Min duration satisfied": "Yes", "Min latency (ns)": 10945587, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 58.94, "QPS w/o loadgen overhead": 59.0, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 18.983031, "characteristics.90th_percentile_latency_ns": 18983031.0, "characteristics.90th_percentile_latency_s": 0.018983031, "characteristics.90th_percentile_latency_us": 18983.031, "characteristics.accuracy": 73.724, "characteristics.good": 36862, "characteristics.total": 50000, "ck_system": "xavier-armnn-v20.08-neon", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-large_224_0.75_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v20.08 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v3-large_224_0.75_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-armnn-v20.08-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-large_224_0.75_float.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-armnn-v20.08-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 83.3333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "9e2b449a39924465", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 16151220, "90.00 percentile latency (ns)": 18136247, "90th percentile latency (ns)": 18136247, "95.00 percentile latency (ns)": 21476557, "97.00 percentile latency (ns)": 23790080, "99.00 percentile latency (ns)": 26733418, "99.90 percentile latency (ns)": 33826769, "Max latency (ns)": 37739624, "Mean latency (ns)": 16591692, "Min duration satisfied": "Yes", "Min latency (ns)": 11882255, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 60.14, "QPS w/o loadgen overhead": 60.27, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 18.136247, "characteristics.90th_percentile_latency_ns": 18136247.0, "characteristics.90th_percentile_latency_s": 0.018136247, "characteristics.90th_percentile_latency_us": 18136.247, "characteristics.accuracy": 59.822, "characteristics.good": 29911, "characteristics.total": 50000, "ck_system": "xavier-armnn-v20.08-neon", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-96-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v20.08 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.75-96-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-armnn-v20.08-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.75_96.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-armnn-v20.08-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "9408f234b67d2d64", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 10373672, "90.00 percentile latency (ns)": 11870415, "90th percentile latency (ns)": 11870415, "95.00 percentile latency (ns)": 12483147, "97.00 percentile latency (ns)": 13682691, "99.00 percentile latency (ns)": 16036210, "99.90 percentile latency (ns)": 22159283, "Max latency (ns)": 24988696, "Mean latency (ns)": 10212933, "Min duration satisfied": "Yes", "Min latency (ns)": 7486592, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 97.77, "QPS w/o loadgen overhead": 97.92, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 11.870415, "characteristics.90th_percentile_latency_ns": 11870415.0, "characteristics.90th_percentile_latency_s": 0.011870415, "characteristics.90th_percentile_latency_us": 11870.415, "characteristics.accuracy": 68.336, "characteristics.good": 34168, "characteristics.total": 50000, "ck_system": "xavier-armnn-v20.08-neon", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-small_224_1.0_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v20.08 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v3-small_224_1.0_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-armnn-v20.08-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-small_224_1.0_float.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-armnn-v20.08-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 83.3333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "841a6961f532f41e", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 29129615, "90.00 percentile latency (ns)": 34129454, "90th percentile latency (ns)": 34129454, "95.00 percentile latency (ns)": 39421817, "97.00 percentile latency (ns)": 42039502, "99.00 percentile latency (ns)": 46833635, "99.90 percentile latency (ns)": 52254486, "Max latency (ns)": 58765687, "Mean latency (ns)": 28650351, "Min duration satisfied": "Yes", "Min latency (ns)": 10932390, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 34.86, "QPS w/o loadgen overhead": 34.9, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 34.129454, "characteristics.90th_percentile_latency_ns": 34129454.0, "characteristics.90th_percentile_latency_s": 0.034129454, "characteristics.90th_percentile_latency_us": 34129.454, "characteristics.accuracy": 68.834, "characteristics.good": 34417, "characteristics.total": 50000, "ck_system": "xavier-armnn-v20.08-neon", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-192-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v20.08 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.75-192-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-armnn-v20.08-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.75_192.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-armnn-v20.08-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "401cbdbed19c0950", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 33216891, "90.00 percentile latency (ns)": 40255334, "90th percentile latency (ns)": 40255334, "95.00 percentile latency (ns)": 46946689, "97.00 percentile latency (ns)": 49789511, "99.00 percentile latency (ns)": 54953210, "99.90 percentile latency (ns)": 86307453, "Max latency (ns)": 94016168, "Mean latency (ns)": 35131687, "Min duration satisfied": "Yes", "Min latency (ns)": 32466584, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 28.45, "QPS w/o loadgen overhead": 28.46, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 40.255334, "characteristics.90th_percentile_latency_ns": 40255334.0, "characteristics.90th_percentile_latency_s": 0.040255334, "characteristics.90th_percentile_latency_us": 40255.334, "characteristics.accuracy": 71.274, "characteristics.good": 35637, "characteristics.total": 50000, "ck_system": "xavier-armnn-v20.08-neon", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite0-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v20.08 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "efficientnet-lite0-quantized", "input_data_types": "uint8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-armnn-v20.08-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite0.tar.gz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-armnn-v20.08-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 20, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "3a2e10779274a7b9", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 51581469, "90.00 percentile latency (ns)": 59164897, "90th percentile latency (ns)": 59164897, "95.00 percentile latency (ns)": 61717850, "97.00 percentile latency (ns)": 63778906, "99.00 percentile latency (ns)": 71195800, "99.90 percentile latency (ns)": 79590307, "Max latency (ns)": 80749338, "Mean latency (ns)": 46844037, "Min duration satisfied": "Yes", "Min latency (ns)": 32054981, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 21.34, "QPS w/o loadgen overhead": 21.35, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 59.164897, "characteristics.90th_percentile_latency_ns": 59164897.0, "characteristics.90th_percentile_latency_s": 0.059164897, "characteristics.90th_percentile_latency_us": 59164.897, "characteristics.accuracy": 79.268, "characteristics.good": 39634, "characteristics.total": 50000, "ck_system": "xavier-armnn-v20.08-neon", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite3-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v20.08 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "efficientnet-lite3-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-armnn-v20.08-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite3.tar.gz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-armnn-v20.08-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 20, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "c2811a4c564c407d", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 9744330, "90.00 percentile latency (ns)": 11556896, "90th percentile latency (ns)": 11556896, "95.00 percentile latency (ns)": 12242208, "97.00 percentile latency (ns)": 13040678, "99.00 percentile latency (ns)": 15617150, "99.90 percentile latency (ns)": 23688987, "Max latency (ns)": 26194993, "Mean latency (ns)": 9730157, "Min duration satisfied": "Yes", "Min latency (ns)": 7170513, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 102.6, "QPS w/o loadgen overhead": 102.77, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 11.556896, "characteristics.90th_percentile_latency_ns": 11556896.0, "characteristics.90th_percentile_latency_s": 0.011556896, "characteristics.90th_percentile_latency_us": 11556.896, "characteristics.accuracy": 66.216, "characteristics.good": 33108, "characteristics.total": 50000, "ck_system": "xavier-armnn-v20.08-neon", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-small_224_0.75_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v20.08 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v3-small_224_0.75_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-armnn-v20.08-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-small_224_0.75_float.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-armnn-v20.08-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 83.3333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "68486dbd60600bd8", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 98917712, "90.00 percentile latency (ns)": 115901776, "90th percentile latency (ns)": 115901776, "95.00 percentile latency (ns)": 120466215, "97.00 percentile latency (ns)": 127038172, "99.00 percentile latency (ns)": 146899523, "99.90 percentile latency (ns)": 211451330, "Max latency (ns)": 212719582, "Mean latency (ns)": 103109553, "Min duration satisfied": "Yes", "Min latency (ns)": 97356391, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 9.7, "QPS w/o loadgen overhead": 9.7, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 115.901776, "characteristics.90th_percentile_latency_ns": 115901776.0, "characteristics.90th_percentile_latency_s": 0.115901776, "characteristics.90th_percentile_latency_us": 115901.776, "characteristics.accuracy": 76.35, "characteristics.good": 38175, "characteristics.total": 50000, "ck_system": "xavier-armnn-v20.08-neon", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite3-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v20.08 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "efficientnet-lite3-quantized", "input_data_types": "uint8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-armnn-v20.08-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite3.tar.gz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-armnn-v20.08-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 20, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "f890c899c4f29b26", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 7563981, "90.00 percentile latency (ns)": 8408531, "90th percentile latency (ns)": 8408531, "95.00 percentile latency (ns)": 10928130, "97.00 percentile latency (ns)": 12621261, "99.00 percentile latency (ns)": 26524466, "99.90 percentile latency (ns)": 60916639, "Max latency (ns)": 138546851, "Mean latency (ns)": 8243890, "Min duration satisfied": "Yes", "Min latency (ns)": 6806669, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 121.15, "QPS w/o loadgen overhead": 121.3, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 8.408531, "characteristics.90th_percentile_latency_ns": 8408531.0, "characteristics.90th_percentile_latency_s": 0.008408531, "characteristics.90th_percentile_latency_us": 8408.531, "characteristics.accuracy": 54.504, "characteristics.good": 27252, "characteristics.total": 50000, "ck_system": "xavier-armnn-v20.08-neon", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-160-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v20.08 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.35-160-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-armnn-v20.08-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_160_35.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-armnn-v20.08-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "74c2c8ffb1d3e512", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 18719441, "90.00 percentile latency (ns)": 22277752, "90th percentile latency (ns)": 22277752, "95.00 percentile latency (ns)": 23532883, "97.00 percentile latency (ns)": 24998104, "99.00 percentile latency (ns)": 29050390, "99.90 percentile latency (ns)": 34390162, "Max latency (ns)": 38507444, "Mean latency (ns)": 18647635, "Min duration satisfied": "Yes", "Min latency (ns)": 12284546, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 53.59, "QPS w/o loadgen overhead": 53.63, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 22.277752, "characteristics.90th_percentile_latency_ns": 22277752.0, "characteristics.90th_percentile_latency_s": 0.022277752, "characteristics.90th_percentile_latency_us": 22277.752, "characteristics.accuracy": 75.76, "characteristics.good": 37880, "characteristics.total": 50000, "ck_system": "xavier-armnn-v20.08-neon", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-large_224_1.0_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v20.08 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v3-large_224_1.0_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-armnn-v20.08-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-large_224_1.0_float.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-armnn-v20.08-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 83.3333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "b204a78a3bc52673", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 25825254, "90.00 percentile latency (ns)": 29406235, "90th percentile latency (ns)": 29406235, "95.00 percentile latency (ns)": 33123155, "97.00 percentile latency (ns)": 36441850, "99.00 percentile latency (ns)": 39886311, "99.90 percentile latency (ns)": 50598013, "Max latency (ns)": 58174137, "Mean latency (ns)": 24747709, "Min duration satisfied": "Yes", "Min latency (ns)": 9920216, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 40.36, "QPS w/o loadgen overhead": 40.41, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 29.406235, "characteristics.90th_percentile_latency_ns": 29406235.0, "characteristics.90th_percentile_latency_s": 0.029406235, "characteristics.90th_percentile_latency_us": 29406.235, "characteristics.accuracy": 65.75, "characteristics.good": 32875, "characteristics.total": 50000, "ck_system": "xavier-armnn-v20.08-neon", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v20.08 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.5-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-armnn-v20.08-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.5_224.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-armnn-v20.08-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "90b408359f343855", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 34456920, "90.00 percentile latency (ns)": 40151972, "90th percentile latency (ns)": 40151972, "95.00 percentile latency (ns)": 45527399, "97.00 percentile latency (ns)": 48457632, "99.00 percentile latency (ns)": 51959471, "99.90 percentile latency (ns)": 66162466, "Max latency (ns)": 68362335, "Mean latency (ns)": 33013997, "Min duration satisfied": "Yes", "Min latency (ns)": 13253671, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 30.26, "QPS w/o loadgen overhead": 30.29, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 40.151972, "characteristics.90th_percentile_latency_ns": 40151972.0, "characteristics.90th_percentile_latency_s": 0.040151972, "characteristics.90th_percentile_latency_us": 40151.972, "characteristics.accuracy": 70.122, "characteristics.good": 35061, "characteristics.total": 50000, "ck_system": "xavier-armnn-v20.08-neon", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v20.08 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.75-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-armnn-v20.08-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.75_224.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-armnn-v20.08-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "e4b12bc5ad5df73a", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 22074543, "90.00 percentile latency (ns)": 25524330, "90th percentile latency (ns)": 25524330, "95.00 percentile latency (ns)": 30081591, "97.00 percentile latency (ns)": 32189852, "99.00 percentile latency (ns)": 35420942, "99.90 percentile latency (ns)": 43629414, "Max latency (ns)": 53218869, "Mean latency (ns)": 21764851, "Min duration satisfied": "Yes", "Min latency (ns)": 8597863, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 45.89, "QPS w/o loadgen overhead": 45.95, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 25.52433, "characteristics.90th_percentile_latency_ns": 25524330.0, "characteristics.90th_percentile_latency_s": 0.02552433, "characteristics.90th_percentile_latency_us": 25524.33, "characteristics.accuracy": 64.282, "characteristics.good": 32141, "characteristics.total": 50000, "ck_system": "xavier-armnn-v20.08-neon", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-192-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v20.08 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.5-192-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-armnn-v20.08-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.5_192.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-armnn-v20.08-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "045074b8f84c71e7", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 15315441, "90.00 percentile latency (ns)": 18491366, "90th percentile latency (ns)": 18491366, "95.00 percentile latency (ns)": 19672061, "97.00 percentile latency (ns)": 21118689, "99.00 percentile latency (ns)": 24763885, "99.90 percentile latency (ns)": 31541292, "Max latency (ns)": 45487549, "Mean latency (ns)": 15055055, "Min duration satisfied": "Yes", "Min latency (ns)": 10080411, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 66.36, "QPS w/o loadgen overhead": 66.42, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 18.491366, "characteristics.90th_percentile_latency_ns": 18491366.0, "characteristics.90th_percentile_latency_s": 0.018491366, "characteristics.90th_percentile_latency_us": 18491.366, "characteristics.accuracy": 72.678, "characteristics.good": 36339, "characteristics.total": 50000, "ck_system": "xavier-armnn-v20.08-neon", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-large-minimalistic_224_1.0_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v20.08 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v3-large-minimalistic_224_1.0_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-armnn-v20.08-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-large-minimalistic_224_1.0_float.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-armnn-v20.08-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 83.3333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "58aad9c8d40a4cb6", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 10508966, "90.00 percentile latency (ns)": 13192370, "90th percentile latency (ns)": 13192370, "95.00 percentile latency (ns)": 15790140, "97.00 percentile latency (ns)": 17940433, "99.00 percentile latency (ns)": 29419581, "99.90 percentile latency (ns)": 57854489, "Max latency (ns)": 139326538, "Mean latency (ns)": 11382443, "Min duration satisfied": "Yes", "Min latency (ns)": 9172881, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 87.74, "QPS w/o loadgen overhead": 87.85, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 13.19237, "characteristics.90th_percentile_latency_ns": 13192370.0, "characteristics.90th_percentile_latency_s": 0.01319237, "characteristics.90th_percentile_latency_us": 13192.37, "characteristics.accuracy": 65.004, "characteristics.good": 32502, "characteristics.total": 50000, "ck_system": "xavier-armnn-v20.08-neon", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-160-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v20.08 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.75-160-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-armnn-v20.08-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_160_75.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-armnn-v20.08-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "37c3020b4a018aa3", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 40585127, "90.00 percentile latency (ns)": 47243098, "90th percentile latency (ns)": 47243098, "95.00 percentile latency (ns)": 52324787, "97.00 percentile latency (ns)": 56018926, "99.00 percentile latency (ns)": 59824520, "99.90 percentile latency (ns)": 70180858, "Max latency (ns)": 77405901, "Mean latency (ns)": 40647695, "Min duration satisfied": "Yes", "Min latency (ns)": 14650854, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 24.58, "QPS w/o loadgen overhead": 24.6, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 47.243098, "characteristics.90th_percentile_latency_ns": 47243098.0, "characteristics.90th_percentile_latency_s": 0.047243098, "characteristics.90th_percentile_latency_us": 47243.098, "characteristics.accuracy": 71.77, "characteristics.good": 35885, "characteristics.total": 50000, "ck_system": "xavier-armnn-v20.08-neon", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v20.08 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-1.0-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-armnn-v20.08-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_1.0_224.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-armnn-v20.08-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "2cd294172a6f7401", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 24141951, "90.00 percentile latency (ns)": 28143391, "90th percentile latency (ns)": 28143391, "95.00 percentile latency (ns)": 33490290, "97.00 percentile latency (ns)": 35222608, "99.00 percentile latency (ns)": 39344638, "99.90 percentile latency (ns)": 45713299, "Max latency (ns)": 50951792, "Mean latency (ns)": 23897921, "Min duration satisfied": "Yes", "Min latency (ns)": 9368819, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 41.78, "QPS w/o loadgen overhead": 41.84, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 28.143391, "characteristics.90th_percentile_latency_ns": 28143391.0, "characteristics.90th_percentile_latency_s": 0.028143391, "characteristics.90th_percentile_latency_us": 28143.391, "characteristics.accuracy": 66.75, "characteristics.good": 33375, "characteristics.total": 50000, "ck_system": "xavier-armnn-v20.08-neon", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-160-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v20.08 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.75-160-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-armnn-v20.08-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.75_160.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-armnn-v20.08-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "a13eb338c1745c28", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 12541826, "90.00 percentile latency (ns)": 14132811, "90th percentile latency (ns)": 14132811, "95.00 percentile latency (ns)": 15777462, "97.00 percentile latency (ns)": 17985631, "99.00 percentile latency (ns)": 23114376, "99.90 percentile latency (ns)": 32926804, "Max latency (ns)": 36504725, "Mean latency (ns)": 12885032, "Min duration satisfied": "Yes", "Min latency (ns)": 6945632, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 77.43, "QPS w/o loadgen overhead": 77.61, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 14.132811, "characteristics.90th_percentile_latency_ns": 14132811.0, "characteristics.90th_percentile_latency_s": 0.014132811, "characteristics.90th_percentile_latency_us": 14132.811, "characteristics.accuracy": 47.14, "characteristics.good": 23570, "characteristics.total": 50000, "ck_system": "xavier-armnn-v20.08-neon", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-96-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v20.08 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.35-96-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-armnn-v20.08-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.35_96.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-armnn-v20.08-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "d46d65074866a332", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 17389696, "90.00 percentile latency (ns)": 19617987, "90th percentile latency (ns)": 19617987, "95.00 percentile latency (ns)": 23220675, "97.00 percentile latency (ns)": 25137142, "99.00 percentile latency (ns)": 28659282, "99.90 percentile latency (ns)": 34588089, "Max latency (ns)": 41430502, "Mean latency (ns)": 17502211, "Min duration satisfied": "Yes", "Min latency (ns)": 7311651, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 57.04, "QPS w/o loadgen overhead": 57.14, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 19.617987, "characteristics.90th_percentile_latency_ns": 19617987.0, "characteristics.90th_percentile_latency_s": 0.019617987, "characteristics.90th_percentile_latency_us": 19617.987, "characteristics.accuracy": 56.988, "characteristics.good": 28494, "characteristics.total": 50000, "ck_system": "xavier-armnn-v20.08-neon", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-160-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v20.08 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.35-160-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-armnn-v20.08-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.35_160.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-armnn-v20.08-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "b0f48988aea83d68", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 6423078, "90.00 percentile latency (ns)": 7264584, "90th percentile latency (ns)": 7264584, "95.00 percentile latency (ns)": 9517702, "97.00 percentile latency (ns)": 10711414, "99.00 percentile latency (ns)": 24088315, "99.90 percentile latency (ns)": 58374359, "Max latency (ns)": 155625726, "Mean latency (ns)": 7003517, "Min duration satisfied": "Yes", "Min latency (ns)": 5727690, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 142.61, "QPS w/o loadgen overhead": 142.79, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 7.264584, "characteristics.90th_percentile_latency_ns": 7264584.0, "characteristics.90th_percentile_latency_s": 0.007264584, "characteristics.90th_percentile_latency_us": 7264.584, "characteristics.accuracy": 55.51, "characteristics.good": 27755, "characteristics.total": 50000, "ck_system": "xavier-armnn-v20.08-neon", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-128-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v20.08 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.5-128-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-armnn-v20.08-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_128_50.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-armnn-v20.08-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "5a95187a74b2ab24", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 20114050, "90.00 percentile latency (ns)": 23162241, "90th percentile latency (ns)": 23162241, "95.00 percentile latency (ns)": 27184840, "97.00 percentile latency (ns)": 29089067, "99.00 percentile latency (ns)": 32253985, "99.90 percentile latency (ns)": 41088733, "Max latency (ns)": 43425545, "Mean latency (ns)": 20276338, "Min duration satisfied": "Yes", "Min latency (ns)": 8339525, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 49.25, "QPS w/o loadgen overhead": 49.32, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 23.162241, "characteristics.90th_percentile_latency_ns": 23162241.0, "characteristics.90th_percentile_latency_s": 0.023162241, "characteristics.90th_percentile_latency_us": 23162.241, "characteristics.accuracy": 59.322, "characteristics.good": 29661, "characteristics.total": 50000, "ck_system": "xavier-armnn-v20.08-neon", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-192-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v20.08 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.35-192-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/xavier-armnn-v20.08-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.35_192.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-armnn-v20.08-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "a0e894684ca3b28d", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 74355637, "90.00 percentile latency (ns)": 93799867, "90th percentile latency (ns)": 93799867, "95.00 percentile latency (ns)": 98647421, "97.00 percentile latency (ns)": 102130136, "99.00 percentile latency (ns)": 111883945, "99.90 percentile latency (ns)": 139812291, "Max latency (ns)": 228363447, "Mean latency (ns)": 80070708, "Min duration satisfied": "Yes", "Min latency (ns)": 72867819, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 12.48, "QPS w/o loadgen overhead": 12.49, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 93.799867, "characteristics.90th_percentile_latency_ns": 93799867.0, "characteristics.90th_percentile_latency_s": 0.093799867, "characteristics.90th_percentile_latency_us": 93799.867, "characteristics.accuracy": 75.068, "characteristics.good": 37534, "characteristics.total": 50000, "ck_system": "rpi4-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite0-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "https://www.raspberrypi.org/products/raspberry-pi-4-model-b/specifications/", "informal_model": "efficientnet-lite0-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/rpi4-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite0.tar.gz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 20, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "51a614727911e5c9", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 29984182, "90.00 percentile latency (ns)": 42392315, "90th percentile latency (ns)": 42392315, "95.00 percentile latency (ns)": 48921160, "97.00 percentile latency (ns)": 53287428, "99.00 percentile latency (ns)": 62851073, "99.90 percentile latency (ns)": 77593206, "Max latency (ns)": 83633101, "Mean latency (ns)": 32871593, "Min duration satisfied": "Yes", "Min latency (ns)": 29500044, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 30.37, "QPS w/o loadgen overhead": 30.42, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 42.392315, "characteristics.90th_percentile_latency_ns": 42392315.0, "characteristics.90th_percentile_latency_s": 0.042392315, "characteristics.90th_percentile_latency_us": 42392.315, "characteristics.accuracy": 72.9, "characteristics.good": 36450, "characteristics.total": 50000, "ck_system": "rpi4-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-large_224_1.0_uint8", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "https://www.raspberrypi.org/products/raspberry-pi-4-model-b/specifications/", "informal_model": "mobilenet-v3-large_224_1.0_uint8", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/rpi4-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-large_224_1.0_uint8.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 50, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "a42d78874f71983c", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 17751359, "90.00 percentile latency (ns)": 22480848, "90th percentile latency (ns)": 22480848, "95.00 percentile latency (ns)": 28556555, "97.00 percentile latency (ns)": 31084310, "99.00 percentile latency (ns)": 39178669, "99.90 percentile latency (ns)": 68210466, "Max latency (ns)": 110066196, "Mean latency (ns)": 19255839, "Min duration satisfied": "Yes", "Min latency (ns)": 17248446, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 51.72, "QPS w/o loadgen overhead": 51.93, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 22.480848, "characteristics.90th_percentile_latency_ns": 22480848.0, "characteristics.90th_percentile_latency_s": 0.022480848, "characteristics.90th_percentile_latency_us": 22480.848, "characteristics.accuracy": 63.33, "characteristics.good": 31665, "characteristics.total": 50000, "ck_system": "rpi4-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-small-minimalistic_224_1.0_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "https://www.raspberrypi.org/products/raspberry-pi-4-model-b/specifications/", "informal_model": "mobilenet-v3-small-minimalistic_224_1.0_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/rpi4-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-small-minimalistic_224_1.0_float.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 50, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "a652ffc5407f9832", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 23353357, "90.00 percentile latency (ns)": 33179250, "90th percentile latency (ns)": 33179250, "95.00 percentile latency (ns)": 38615423, "97.00 percentile latency (ns)": 43084336, "99.00 percentile latency (ns)": 52561945, "99.90 percentile latency (ns)": 63722564, "Max latency (ns)": 202698968, "Mean latency (ns)": 25596710, "Min duration satisfied": "Yes", "Min latency (ns)": 22889016, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 38.96, "QPS w/o loadgen overhead": 39.07, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 33.17925, "characteristics.90th_percentile_latency_ns": 33179250.0, "characteristics.90th_percentile_latency_s": 0.03317925, "characteristics.90th_percentile_latency_us": 33179.25, "characteristics.accuracy": 70.338, "characteristics.good": 35169, "characteristics.total": 50000, "ck_system": "rpi4-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-large-minimalistic_224_1.0_uint8", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "https://www.raspberrypi.org/products/raspberry-pi-4-model-b/specifications/", "informal_model": "mobilenet-v3-large-minimalistic_224_1.0_uint8", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/rpi4-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-large-minimalistic_224_1.0_uint8.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 50, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "944b7a074821f4e1", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 11812536, "90.00 percentile latency (ns)": 14594267, "90th percentile latency (ns)": 14594267, "95.00 percentile latency (ns)": 22818462, "97.00 percentile latency (ns)": 26567577, "99.00 percentile latency (ns)": 35367055, "99.90 percentile latency (ns)": 56689774, "Max latency (ns)": 129954989, "Mean latency (ns)": 13114084, "Min duration satisfied": "Yes", "Min latency (ns)": 11434174, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 75.94, "QPS w/o loadgen overhead": 76.25, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 14.594267, "characteristics.90th_percentile_latency_ns": 14594267.0, "characteristics.90th_percentile_latency_s": 0.014594267, "characteristics.90th_percentile_latency_us": 14594.267, "characteristics.accuracy": 64.418, "characteristics.good": 32209, "characteristics.total": 50000, "ck_system": "rpi4-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-small_224_1.0_uint8", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "https://www.raspberrypi.org/products/raspberry-pi-4-model-b/specifications/", "informal_model": "mobilenet-v3-small_224_1.0_uint8", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/rpi4-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-small_224_1.0_uint8.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 50, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "2b41ab92b395f092", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 42811934, "90.00 percentile latency (ns)": 57359443, "90th percentile latency (ns)": 57359443, "95.00 percentile latency (ns)": 64580365, "97.00 percentile latency (ns)": 66681001, "99.00 percentile latency (ns)": 75313908, "99.90 percentile latency (ns)": 155474275, "Max latency (ns)": 163795894, "Mean latency (ns)": 46439928, "Min duration satisfied": "Yes", "Min latency (ns)": 42215300, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 21.51, "QPS w/o loadgen overhead": 21.53, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 57.359443, "characteristics.90th_percentile_latency_ns": 57359443.0, "characteristics.90th_percentile_latency_s": 0.057359443, "characteristics.90th_percentile_latency_us": 57359.443, "characteristics.accuracy": 73.724, "characteristics.good": 36862, "characteristics.total": 50000, "ck_system": "rpi4-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-large_224_0.75_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "https://www.raspberrypi.org/products/raspberry-pi-4-model-b/specifications/", "informal_model": "mobilenet-v3-large_224_0.75_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/rpi4-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-large_224_0.75_float.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 50, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "10a4b36df054d2c9", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 21764975, "90.00 percentile latency (ns)": 29101554, "90th percentile latency (ns)": 29101554, "95.00 percentile latency (ns)": 34129340, "97.00 percentile latency (ns)": 37709548, "99.00 percentile latency (ns)": 44673654, "99.90 percentile latency (ns)": 82205114, "Max latency (ns)": 110698006, "Mean latency (ns)": 23600753, "Min duration satisfied": "Yes", "Min latency (ns)": 21119525, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 42.25, "QPS w/o loadgen overhead": 42.37, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 29.101554, "characteristics.90th_percentile_latency_ns": 29101554.0, "characteristics.90th_percentile_latency_s": 0.029101554, "characteristics.90th_percentile_latency_us": 29101.554, "characteristics.accuracy": 68.336, "characteristics.good": 34168, "characteristics.total": 50000, "ck_system": "rpi4-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-small_224_1.0_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "https://www.raspberrypi.org/products/raspberry-pi-4-model-b/specifications/", "informal_model": "mobilenet-v3-small_224_1.0_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/rpi4-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-small_224_1.0_float.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 50, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "6e0da7d4f4309877", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 36381877, "90.00 percentile latency (ns)": 51871664, "90th percentile latency (ns)": 51871664, "95.00 percentile latency (ns)": 58639970, "97.00 percentile latency (ns)": 62355605, "99.00 percentile latency (ns)": 71117938, "99.90 percentile latency (ns)": 95779975, "Max latency (ns)": 200837511, "Mean latency (ns)": 40177441, "Min duration satisfied": "Yes", "Min latency (ns)": 35862332, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 24.84, "QPS w/o loadgen overhead": 24.89, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 51.871664, "characteristics.90th_percentile_latency_ns": 51871664.0, "characteristics.90th_percentile_latency_s": 0.051871664, "characteristics.90th_percentile_latency_us": 51871.664, "characteristics.accuracy": 71.23, "characteristics.good": 35615, "characteristics.total": 50000, "ck_system": "rpi4-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite0-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "https://www.raspberrypi.org/products/raspberry-pi-4-model-b/specifications/", "informal_model": "efficientnet-lite0-quantized", "input_data_types": "uint8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/rpi4-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite0.tar.gz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 20, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "2432cb665c174a1b", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 19048440, "90.00 percentile latency (ns)": 25347439, "90th percentile latency (ns)": 25347439, "95.00 percentile latency (ns)": 30888753, "97.00 percentile latency (ns)": 34997544, "99.00 percentile latency (ns)": 43206869, "99.90 percentile latency (ns)": 77160420, "Max latency (ns)": 144439277, "Mean latency (ns)": 20743171, "Min duration satisfied": "Yes", "Min latency (ns)": 18546080, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 48.07, "QPS w/o loadgen overhead": 48.21, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 25.347439, "characteristics.90th_percentile_latency_ns": 25347439.0, "characteristics.90th_percentile_latency_s": 0.025347439, "characteristics.90th_percentile_latency_us": 25347.439, "characteristics.accuracy": 66.216, "characteristics.good": 33108, "characteristics.total": 50000, "ck_system": "rpi4-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-small_224_0.75_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "https://www.raspberrypi.org/products/raspberry-pi-4-model-b/specifications/", "informal_model": "mobilenet-v3-small_224_0.75_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/rpi4-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-small_224_0.75_float.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 50, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "2f2487342708cf47", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 53623864, "90.00 percentile latency (ns)": 69946553, "90th percentile latency (ns)": 69946553, "95.00 percentile latency (ns)": 75819767, "97.00 percentile latency (ns)": 79395627, "99.00 percentile latency (ns)": 86839192, "99.90 percentile latency (ns)": 95310936, "Max latency (ns)": 226861462, "Mean latency (ns)": 57934959, "Min duration satisfied": "Yes", "Min latency (ns)": 52702460, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 17.24, "QPS w/o loadgen overhead": 17.26, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 69.946553, "characteristics.90th_percentile_latency_ns": 69946553.0, "characteristics.90th_percentile_latency_s": 0.069946553, "characteristics.90th_percentile_latency_us": 69946.553, "characteristics.accuracy": 75.76, "characteristics.good": 37880, "characteristics.total": 50000, "ck_system": "rpi4-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-large_224_1.0_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "https://www.raspberrypi.org/products/raspberry-pi-4-model-b/specifications/", "informal_model": "mobilenet-v3-large_224_1.0_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/rpi4-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-large_224_1.0_float.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 50, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "84e0e87e254c3327", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 45374355, "90.00 percentile latency (ns)": 61206222, "90th percentile latency (ns)": 61206222, "95.00 percentile latency (ns)": 67677607, "97.00 percentile latency (ns)": 70597149, "99.00 percentile latency (ns)": 78363799, "99.90 percentile latency (ns)": 145076410, "Max latency (ns)": 149209794, "Mean latency (ns)": 49265520, "Min duration satisfied": "Yes", "Min latency (ns)": 44631096, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 20.27, "QPS w/o loadgen overhead": 20.3, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 61.206222, "characteristics.90th_percentile_latency_ns": 61206222.0, "characteristics.90th_percentile_latency_s": 0.061206222, "characteristics.90th_percentile_latency_us": 61206.222, "characteristics.accuracy": 72.678, "characteristics.good": 36339, "characteristics.total": 50000, "ck_system": "rpi4-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-large-minimalistic_224_1.0_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "https://www.raspberrypi.org/products/raspberry-pi-4-model-b/specifications/", "informal_model": "mobilenet-v3-large-minimalistic_224_1.0_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/rpi4-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-large-minimalistic_224_1.0_float.tgz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 50, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "b68929764ccda5fc", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 328318216, "90.00 percentile latency (ns)": 425805975, "90th percentile latency (ns)": 425805975, "95.00 percentile latency (ns)": 439129333, "97.00 percentile latency (ns)": 449658810, "99.00 percentile latency (ns)": 466009798, "99.90 percentile latency (ns)": 476398984, "Max latency (ns)": 492074637, "Mean latency (ns)": 311631039, "Min duration satisfied": "Yes", "Min latency (ns)": 176591068, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 3.21, "QPS w/o loadgen overhead": 3.21, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 425.805975, "characteristics.90th_percentile_latency_ns": 425805975.0, "characteristics.90th_percentile_latency_s": 0.425805975, "characteristics.90th_percentile_latency_us": 425805.975, "characteristics.accuracy": 78.504, "characteristics.good": 39252, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "quantized-efficientnet-lite4", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "http://en.t-firefly.com/product/rk3399/; http://opensource.rock-chips.com/wiki_RK3399", "informal_model": "quantized-efficientnet-lite4", "input_data_types": "uint8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/firefly-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite4.tar.gz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 25, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "412e98341e99f009", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 117701552, "90.00 percentile latency (ns)": 270846085, "90th percentile latency (ns)": 270846085, "95.00 percentile latency (ns)": 298050928, "97.00 percentile latency (ns)": 310417908, "99.00 percentile latency (ns)": 327677193, "99.90 percentile latency (ns)": 335640707, "Max latency (ns)": 346140140, "Mean latency (ns)": 152340467, "Min duration satisfied": "Yes", "Min latency (ns)": 103454066, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 6.57, "QPS w/o loadgen overhead": 6.56, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 270.846085, "characteristics.90th_percentile_latency_ns": 270846085.0, "characteristics.90th_percentile_latency_s": 0.270846085, "characteristics.90th_percentile_latency_us": 270846.085, "characteristics.accuracy": 76.374, "characteristics.good": 38187, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "quantized-efficientnet-lite3", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "http://en.t-firefly.com/product/rk3399/; http://opensource.rock-chips.com/wiki_RK3399", "informal_model": "quantized-efficientnet-lite3", "input_data_types": "uint8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/firefly-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite3.tar.gz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 25, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "f02776be1e7b4b99", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 328315490, "90.00 percentile latency (ns)": 378377258, "90th percentile latency (ns)": 378377258, "95.00 percentile latency (ns)": 387035481, "97.00 percentile latency (ns)": 392440675, "99.00 percentile latency (ns)": 400984688, "99.90 percentile latency (ns)": 415618283, "Max latency (ns)": 421938928, "Mean latency (ns)": 324021505, "Min duration satisfied": "Yes", "Min latency (ns)": 176393048, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 3.09, "QPS w/o loadgen overhead": 3.09, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 378.377258, "characteristics.90th_percentile_latency_ns": 378377258.0, "characteristics.90th_percentile_latency_s": 0.378377258, "characteristics.90th_percentile_latency_us": 378377.258, "characteristics.accuracy": 79.268, "characteristics.good": 39634, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "non-quantized-efficientnet-lite3", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "http://en.t-firefly.com/product/rk3399/; http://opensource.rock-chips.com/wiki_RK3399", "informal_model": "non-quantized-efficientnet-lite3", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/firefly-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite3.tar.gz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 25, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "4b55464b2191fc31", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 102975731, "90.00 percentile latency (ns)": 153980742, "90th percentile latency (ns)": 153980742, "95.00 percentile latency (ns)": 222861617, "97.00 percentile latency (ns)": 259065518, "99.00 percentile latency (ns)": 278703888, "99.90 percentile latency (ns)": 295328335, "Max latency (ns)": 306682356, "Mean latency (ns)": 114924813, "Min duration satisfied": "Yes", "Min latency (ns)": 88825788, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 8.7, "QPS w/o loadgen overhead": 8.7, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 153.980742, "characteristics.90th_percentile_latency_ns": 153980742.0, "characteristics.90th_percentile_latency_s": 0.153980742, "characteristics.90th_percentile_latency_us": 153980.742, "characteristics.accuracy": 76.642, "characteristics.good": 38321, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "non-quantized-efficientnet-lite1", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "http://en.t-firefly.com/product/rk3399/; http://opensource.rock-chips.com/wiki_RK3399", "informal_model": "non-quantized-efficientnet-lite1", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/firefly-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite1.tar.gz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 25, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "845f990a764b48d6", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 90037672, "90.00 percentile latency (ns)": 241031171, "90th percentile latency (ns)": 241031171, "95.00 percentile latency (ns)": 257014240, "97.00 percentile latency (ns)": 262846716, "99.00 percentile latency (ns)": 271990779, "99.90 percentile latency (ns)": 282931209, "Max latency (ns)": 288256476, "Mean latency (ns)": 128164909, "Min duration satisfied": "Yes", "Min latency (ns)": 71307388, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 7.8, "QPS w/o loadgen overhead": 7.8, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 241.031171, "characteristics.90th_percentile_latency_ns": 241031171.0, "characteristics.90th_percentile_latency_s": 0.241031171, "characteristics.90th_percentile_latency_us": 241031.171, "characteristics.accuracy": 74.068, "characteristics.good": 37034, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "quantized-efficientnet-lite2", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "http://en.t-firefly.com/product/rk3399/; http://opensource.rock-chips.com/wiki_RK3399", "informal_model": "quantized-efficientnet-lite2", "input_data_types": "uint8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/firefly-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite2.tar.gz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 25, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "74b1f90e484b366e", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 58945358, "90.00 percentile latency (ns)": 104808275, "90th percentile latency (ns)": 104808275, "95.00 percentile latency (ns)": 190817224, "97.00 percentile latency (ns)": 231202465, "99.00 percentile latency (ns)": 251553252, "99.90 percentile latency (ns)": 255770259, "Max latency (ns)": 269917868, "Mean latency (ns)": 73806852, "Min duration satisfied": "Yes", "Min latency (ns)": 53582181, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 13.54, "QPS w/o loadgen overhead": 13.55, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 104.808275, "characteristics.90th_percentile_latency_ns": 104808275.0, "characteristics.90th_percentile_latency_s": 0.104808275, "characteristics.90th_percentile_latency_us": 104808.275, "characteristics.accuracy": 74.022, "characteristics.good": 37011, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "quantized-efficientnet-lite1", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "http://en.t-firefly.com/product/rk3399/; http://opensource.rock-chips.com/wiki_RK3399", "informal_model": "quantized-efficientnet-lite1", "input_data_types": "uint8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/firefly-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite1.tar.gz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 25, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "43eb8446caf5128a", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 36983989, "90.00 percentile latency (ns)": 74255272, "90th percentile latency (ns)": 74255272, "95.00 percentile latency (ns)": 141291403, "97.00 percentile latency (ns)": 172370964, "99.00 percentile latency (ns)": 189912624, "99.90 percentile latency (ns)": 207617701, "Max latency (ns)": 214030377, "Mean latency (ns)": 50036414, "Min duration satisfied": "Yes", "Min latency (ns)": 34491401, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 20.0, "QPS w/o loadgen overhead": 19.99, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 74.255272, "characteristics.90th_percentile_latency_ns": 74255272.0, "characteristics.90th_percentile_latency_s": 0.074255272, "characteristics.90th_percentile_latency_us": 74255.272, "characteristics.accuracy": 71.23, "characteristics.good": 35615, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "quantized-efficientnet-lite0", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "http://en.t-firefly.com/product/rk3399/; http://opensource.rock-chips.com/wiki_RK3399", "informal_model": "quantized-efficientnet-lite0", "input_data_types": "uint8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/firefly-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite0.tar.gz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 25, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "172d18055b64cdfa", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 237949729, "90.00 percentile latency (ns)": 296174557, "90th percentile latency (ns)": 296174557, "95.00 percentile latency (ns)": 304218983, "97.00 percentile latency (ns)": 310045197, "99.00 percentile latency (ns)": 318150353, "99.90 percentile latency (ns)": 333483713, "Max latency (ns)": 333767965, "Mean latency (ns)": 228165581, "Min duration satisfied": "Yes", "Min latency (ns)": 119124203, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 4.38, "QPS w/o loadgen overhead": 4.38, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 296.174557, "characteristics.90th_percentile_latency_ns": 296174557.0, "characteristics.90th_percentile_latency_s": 0.296174557, "characteristics.90th_percentile_latency_us": 296174.557, "characteristics.accuracy": 77.542, "characteristics.good": 38771, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "non-quantized-efficientnet-lite2", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "http://en.t-firefly.com/product/rk3399/; http://opensource.rock-chips.com/wiki_RK3399", "informal_model": "non-quantized-efficientnet-lite2", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/firefly-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite2.tar.gz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 25, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "cddb188aeb14708b", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 493629230, "90.00 percentile latency (ns)": 542549738, "90th percentile latency (ns)": 542549738, "95.00 percentile latency (ns)": 554348211, "97.00 percentile latency (ns)": 562793187, "99.00 percentile latency (ns)": 574680043, "99.90 percentile latency (ns)": 582569642, "Max latency (ns)": 591846994, "Mean latency (ns)": 485360219, "Min duration satisfied": "Yes", "Min latency (ns)": 302836009, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 2.06, "QPS w/o loadgen overhead": 2.06, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 542.549738, "characteristics.90th_percentile_latency_ns": 542549738.0, "characteristics.90th_percentile_latency_s": 0.542549738, "characteristics.90th_percentile_latency_us": 542549.738, "characteristics.accuracy": 80.676, "characteristics.good": 40338, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "non-quantized-efficientnet-lite4", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "http://en.t-firefly.com/product/rk3399/; http://opensource.rock-chips.com/wiki_RK3399", "informal_model": "non-quantized-efficientnet-lite4", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/firefly-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite4.tar.gz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 25, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "09834c7dba40faee", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 73088597, "90.00 percentile latency (ns)": 157331130, "90th percentile latency (ns)": 157331130, "95.00 percentile latency (ns)": 197286956, "97.00 percentile latency (ns)": 207254016, "99.00 percentile latency (ns)": 213512610, "99.90 percentile latency (ns)": 223863049, "Max latency (ns)": 233602984, "Mean latency (ns)": 87716938, "Min duration satisfied": "Yes", "Min latency (ns)": 61297075, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 11.4, "QPS w/o loadgen overhead": 11.4, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 157.33113, "characteristics.90th_percentile_latency_ns": 157331130.0, "characteristics.90th_percentile_latency_s": 0.15733113, "characteristics.90th_percentile_latency_us": 157331.13, "characteristics.accuracy": 75.068, "characteristics.good": 37534, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "non-quantized-efficientnet-lite0", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "http://en.t-firefly.com/product/rk3399/; http://opensource.rock-chips.com/wiki_RK3399", "informal_model": "non-quantized-efficientnet-lite0", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/firefly-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite0.tar.gz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.2.0-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 25, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "0e8a62eb5b334b21", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 76979480, "90.00 percentile latency (ns)": 87944605, "90th percentile latency (ns)": 87944605, "95.00 percentile latency (ns)": 90633466, "97.00 percentile latency (ns)": 92741106, "99.00 percentile latency (ns)": 99917841, "99.90 percentile latency (ns)": 108455695, "Max latency (ns)": 110312874, "Mean latency (ns)": 79445167, "Min duration satisfied": "Yes", "Min latency (ns)": 75026892, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 12.58, "QPS w/o loadgen overhead": 12.59, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 87.944605, "characteristics.90th_percentile_latency_ns": 87944605.0, "characteristics.90th_percentile_latency_s": 0.087944605, "characteristics.90th_percentile_latency_us": 87944.605, "characteristics.accuracy": 75.068, "characteristics.good": 37534, "characteristics.total": 50000, "ck_system": "rpi4coral-armnn-v20.08-neon", "ck_used": true, "cooling": "MakerHawk Pi-FAN DC Brushless Cooling Fan LD3007MS", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite0-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v20.08 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "https://www.raspberrypi.org/products/raspberry-pi-4-model-b/specifications/", "informal_model": "efficientnet-lite0-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/rpi4coral-armnn-v20.08-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite0.tar.gz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-armnn-v20.08-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 22.2222, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "a195a68d8d4580bb", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 132396284, "90.00 percentile latency (ns)": 161706928, "90th percentile latency (ns)": 161706928, "95.00 percentile latency (ns)": 171498359, "97.00 percentile latency (ns)": 177973665, "99.00 percentile latency (ns)": 193455995, "99.90 percentile latency (ns)": 284271075, "Max latency (ns)": 306818515, "Mean latency (ns)": 141690678, "Min duration satisfied": "Yes", "Min latency (ns)": 129370097, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 7.06, "QPS w/o loadgen overhead": 7.06, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 161.706928, "characteristics.90th_percentile_latency_ns": 161706928.0, "characteristics.90th_percentile_latency_s": 0.161706928, "characteristics.90th_percentile_latency_us": 161706.928, "characteristics.accuracy": 71.274, "characteristics.good": 35637, "characteristics.total": 50000, "ck_system": "rpi4coral-armnn-v20.08-neon", "ck_used": true, "cooling": "MakerHawk Pi-FAN DC Brushless Cooling Fan LD3007MS", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite0-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v20.08 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "https://www.raspberrypi.org/products/raspberry-pi-4-model-b/specifications/", "informal_model": "efficientnet-lite0-quantized", "input_data_types": "uint8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/rpi4coral-armnn-v20.08-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite0.tar.gz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-armnn-v20.08-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 22.2222, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "1c295f82e34bbea4", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 87054593, "90.00 percentile latency (ns)": 87881447, "90th percentile latency (ns)": 87881447, "95.00 percentile latency (ns)": 88362710, "97.00 percentile latency (ns)": 89561442, "99.00 percentile latency (ns)": 97958194, "99.90 percentile latency (ns)": 108674310, "Max latency (ns)": 111068573, "Mean latency (ns)": 87058319, "Min duration satisfied": "Yes", "Min latency (ns)": 77599680, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 11.47, "QPS w/o loadgen overhead": 11.49, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "800 MHz", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "4 GiB (shared with host)", "accelerator_memory_configuration": "-", "accelerator_model_name": "Arm Mali-T860 MP4", "accelerator_on-chip_memories": "-", "accelerators_per_node": 1, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 87.881447, "characteristics.90th_percentile_latency_ns": 87881447.0, "characteristics.90th_percentile_latency_s": 0.087881447, "characteristics.90th_percentile_latency_us": 87881.447, "characteristics.accuracy": 75.068, "characteristics.good": 37534, "characteristics.total": 50000, "ck_system": "firefly-armnn-v20.08-opencl", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite0-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v20.08 (OpenCL)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "http://en.t-firefly.com/product/rk3399/; http://opensource.rock-chips.com/wiki_RK3399", "informal_model": "efficientnet-lite0-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 1, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/firefly-armnn-v20.08-opencl", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite0.tar.gz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-armnn-v20.08-opencl", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 20, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "b32344114a19fb4b", "use_accelerator": true, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 431489077, "90.00 percentile latency (ns)": 433977908, "90th percentile latency (ns)": 433977908, "95.00 percentile latency (ns)": 435326403, "97.00 percentile latency (ns)": 438555092, "99.00 percentile latency (ns)": 441824494, "99.90 percentile latency (ns)": 453841955, "Max latency (ns)": 454127263, "Mean latency (ns)": 431215013, "Min duration satisfied": "Yes", "Min latency (ns)": 416268346, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 2.32, "QPS w/o loadgen overhead": 2.32, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "800 MHz", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "4 GiB (shared with host)", "accelerator_memory_configuration": "-", "accelerator_model_name": "Arm Mali-T860 MP4", "accelerator_on-chip_memories": "-", "accelerators_per_node": 1, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 433.977908, "characteristics.90th_percentile_latency_ns": 433977908.0, "characteristics.90th_percentile_latency_s": 0.433977908, "characteristics.90th_percentile_latency_us": 433977.908, "characteristics.accuracy": 80.676, "characteristics.good": 40338, "characteristics.total": 50000, "ck_system": "firefly-armnn-v20.08-opencl", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite4-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v20.08 (OpenCL)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "http://en.t-firefly.com/product/rk3399/; http://opensource.rock-chips.com/wiki_RK3399", "informal_model": "efficientnet-lite4-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 1, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/firefly-armnn-v20.08-opencl", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite4.tar.gz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-armnn-v20.08-opencl", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 2, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "1c8a2b294d7e71ae", "use_accelerator": true, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 122312425, "90.00 percentile latency (ns)": 130113629, "90th percentile latency (ns)": 130113629, "95.00 percentile latency (ns)": 131643418, "97.00 percentile latency (ns)": 132207188, "99.00 percentile latency (ns)": 136094828, "99.90 percentile latency (ns)": 137346058, "Max latency (ns)": 142115957, "Mean latency (ns)": 123947393, "Min duration satisfied": "Yes", "Min latency (ns)": 121023007, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 8.06, "QPS w/o loadgen overhead": 8.07, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "800 MHz", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "4 GiB (shared with host)", "accelerator_memory_configuration": "-", "accelerator_model_name": "Arm Mali-T860 MP4", "accelerator_on-chip_memories": "-", "accelerators_per_node": 1, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 130.113629, "characteristics.90th_percentile_latency_ns": 130113629.0, "characteristics.90th_percentile_latency_s": 0.130113629, "characteristics.90th_percentile_latency_us": 130113.629, "characteristics.accuracy": 71.232, "characteristics.good": 35616, "characteristics.total": 50000, "ck_system": "firefly-armnn-v20.08-opencl", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite0-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v20.08 (OpenCL)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "http://en.t-firefly.com/product/rk3399/; http://opensource.rock-chips.com/wiki_RK3399", "informal_model": "efficientnet-lite0-quantized", "input_data_types": "uint8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 1, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/open/dividiti/results/firefly-armnn-v20.08-opencl", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite0.tar.gz", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-armnn-v20.08-opencl", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 20, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "6d95f504289acd5c", "use_accelerator": true, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 109219386, "90.00 percentile latency (ns)": 119348397, "90th percentile latency (ns)": 119348397, "95.00 percentile latency (ns)": 122428912, "97.00 percentile latency (ns)": 125463306, "99.00 percentile latency (ns)": 133203621, "99.90 percentile latency (ns)": 157001209, "Max latency (ns)": 191684073, "Mean latency (ns)": 111547846, "Min duration satisfied": "Yes", "Min latency (ns)": 106300479, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 8.96, "QPS w/o loadgen overhead": 8.96, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 119.348397, "characteristics.90th_percentile_latency_ns": 119348397.0, "characteristics.90th_percentile_latency_s": 0.119348397, "characteristics.90th_percentile_latency_us": 119348.397, "characteristics.accuracy": 76.442, "characteristics.good": 38221, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.3.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "closed", "formal_model": "resnet50-v1.5", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.3.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "resnet50", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/closed/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/closed/dividiti/results/xavier-tflite-v2.3.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "PyCUDA 2019.1.2", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://www.dropbox.com/s/vhuqo0wc39lky0a/resnet50_v1.no-argmax.tflite", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by Collective Knowledge v1.15.0. Experimental CMake build from post-v2.3.0/pre-v2.4.0 revision.", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.3.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 10, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "f97adf93994d405f", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TF -> TFLite" }, { "50.00 percentile latency (ns)": 402187342, "90.00 percentile latency (ns)": 418825218, "90th percentile latency (ns)": 418825218, "95.00 percentile latency (ns)": 422906181, "97.00 percentile latency (ns)": 425756822, "99.00 percentile latency (ns)": 433858628, "99.90 percentile latency (ns)": 511170965, "Max latency (ns)": 511212480, "Mean latency (ns)": 402850024, "Min duration satisfied": "Yes", "Min latency (ns)": 377178669, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 2.48, "QPS w/o loadgen overhead": 2.48, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 418.825218, "characteristics.90th_percentile_latency_ns": 418825218.0, "characteristics.90th_percentile_latency_s": 0.418825218, "characteristics.90th_percentile_latency_us": 418825.218, "characteristics.accuracy": 76.442, "characteristics.good": 38221, "characteristics.total": 50000, "ck_system": "rpi4-armnn-v20.08-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "closed", "formal_model": "resnet50-v1.5", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v20.08 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "https://www.raspberrypi.org/products/raspberry-pi-4-model-b/specifications/", "informal_model": "resnet50", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/closed/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/closed/dividiti/results/rpi4-armnn-v20.08-neon", "number_of_nodes": 1, "operating_system": "Raspbian Bullseye (Debian 11); kernel Linux rpi4 5.4.51-v7l+ #1327 SMP (Thu Jul 23 11:04:39 BST 2020)", "other_software_stack": "GCC 9.3.0; Python 3.7.9", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://www.dropbox.com/s/vhuqo0wc39lky0a/resnet50_v1.no-argmax.tflite", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by Collective Knowledge v1.15.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4-armnn-v20.08-neon", "system_name": "Raspberry Pi 4 (rpi4)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 2.5, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "ace4936b5dc9b1ba", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TF -> TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 77009559, "90.00 percentile latency (ns)": 86816813, "90th percentile latency (ns)": 86816813, "95.00 percentile latency (ns)": 91312407, "97.00 percentile latency (ns)": 94742925, "99.00 percentile latency (ns)": 103252300, "99.90 percentile latency (ns)": 135755759, "Max latency (ns)": 149307756, "Mean latency (ns)": 79669194, "Min duration satisfied": "Yes", "Min latency (ns)": 75200215, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 12.55, "QPS w/o loadgen overhead": 12.55, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 86.816813, "characteristics.90th_percentile_latency_ns": 86816813.0, "characteristics.90th_percentile_latency_s": 0.086816813, "characteristics.90th_percentile_latency_us": 86816.813, "characteristics.accuracy": 76.442, "characteristics.good": 38221, "characteristics.total": 50000, "ck_system": "xavier-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "closed", "formal_model": "resnet50-v1.5", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "resnet50", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/closed/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/closed/dividiti/results/xavier-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "PyCUDA 2019.1.2", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://www.dropbox.com/s/vhuqo0wc39lky0a/resnet50_v1.no-argmax.tflite", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by Collective Knowledge v1.15.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tflite-v2.2.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 8.13008, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "ae0b4738ac55c54a", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TF -> TFLite" }, { "50.00 percentile latency (ns)": 2251810, "90.00 percentile latency (ns)": 2290468, "90th percentile latency (ns)": 2290468, "95.00 percentile latency (ns)": 2306533, "97.00 percentile latency (ns)": 2320229, "99.00 percentile latency (ns)": 2369575, "99.90 percentile latency (ns)": 2512845, "Max latency (ns)": 3917323, "Mean latency (ns)": 2259561, "Min duration satisfied": "Yes", "Min latency (ns)": 2198848, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 439.93, "QPS w/o loadgen overhead": 442.56, "Result is": "VALID", "SUT name": "PySUT", "Scenario": "singlestream", "accelerator_frequency": "", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "Shared with host", "accelerator_memory_configuration": "SRAM", "accelerator_model_name": "NVIDIA Xavier", "accelerator_on-chip_memories": "1MB (128KB/SM) L1 + 512KB L2 + 4MB (DLA)", "accelerators_per_node": 1, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 2.290468, "characteristics.90th_percentile_latency_ns": 2290468.0, "characteristics.90th_percentile_latency_s": 0.002290468, "characteristics.90th_percentile_latency_us": 2290.468, "characteristics.accuracy": 76.258, "characteristics.good": 38129, "characteristics.total": 50000, "ck_system": "xavier-tensorrt-v6.0", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "closed", "formal_model": "resnet50-v1.5", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TensorRT v6.0", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "DLAs are not used in the Offline and MultiStream scenarios (GPU only)", "informal_model": "resnet50", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 1, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/closed/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/closed/dividiti/results/xavier-tensorrt-v6.0", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://zenodo.org/record/3716059/files/resnet-SingleStream-gpu-b1-int8-linear.plan", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-tensorrt-v6.0", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 500, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "c5e9f9b6d4697855", "use_accelerator": true, "weight_data_types": "int8", "weight_transformations": "ONNX -> TensorRT" }, { "50.00 percentile latency (ns)": 594462704, "90.00 percentile latency (ns)": 612460091, "90th percentile latency (ns)": 612460091, "95.00 percentile latency (ns)": 654691420, "97.00 percentile latency (ns)": 777090835, "99.00 percentile latency (ns)": 807868713, "99.90 percentile latency (ns)": 838935422, "Max latency (ns)": 887009964, "Mean latency (ns)": 603999971, "Min duration satisfied": "Yes", "Min latency (ns)": 573131920, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 1.66, "QPS w/o loadgen overhead": 1.66, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 612.460091, "characteristics.90th_percentile_latency_ns": 612460091.0, "characteristics.90th_percentile_latency_s": 0.612460091, "characteristics.90th_percentile_latency_us": 612460.091, "characteristics.accuracy": 76.442, "characteristics.good": 38221, "characteristics.total": 50000, "ck_system": "rpi4coral-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "MakerHawk Pi-FAN DC Brushless Cooling Fan LD3007MS", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "closed", "formal_model": "resnet50-v1.5", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "https://www.raspberrypi.org/products/raspberry-pi-4-model-b/specifications/", "informal_model": "resnet50", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/closed/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/closed/dividiti/results/rpi4coral-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.1; kernel 5.4.0-1018-raspi #20-Ubuntu SMP (Sun Sep 6 05:11:16 UTC 2020)", "other_software_stack": "GCC 9.3.0; Python 3.8.2", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://www.dropbox.com/s/vhuqo0wc39lky0a/resnet50_v1.no-argmax.tflite", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by Collective Knowledge v1.15.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-tflite-v2.2.0-ruy", "system_name": "Raspberry Pi 4 with Coral (rpi4coral)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 1.42857, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "a4943e81656319cc", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TF -> TFLite" }, { "50.00 percentile latency (ns)": 366290049, "90.00 percentile latency (ns)": 367529816, "90th percentile latency (ns)": 367529816, "95.00 percentile latency (ns)": 367843332, "97.00 percentile latency (ns)": 368175143, "99.00 percentile latency (ns)": 369443806, "99.90 percentile latency (ns)": 374020177, "Max latency (ns)": 385745855, "Mean latency (ns)": 366355379, "Min duration satisfied": "Yes", "Min latency (ns)": 363725723, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 2.73, "QPS w/o loadgen overhead": 2.73, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 367.529816, "characteristics.90th_percentile_latency_ns": 367529816.0, "characteristics.90th_percentile_latency_s": 0.367529816, "characteristics.90th_percentile_latency_us": 367529.816, "characteristics.accuracy": 76.442, "characteristics.good": 38221, "characteristics.total": 50000, "ck_system": "firefly-armnn-v20.08-neon", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "closed", "formal_model": "resnet50-v1.5", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v20.08 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "http://en.t-firefly.com/product/rk3399/; http://opensource.rock-chips.com/wiki_RK3399", "informal_model": "resnet50", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/closed/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/closed/dividiti/results/firefly-armnn-v20.08-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "GCC 7.5.0; Python 3.5.2; OpenCL driver 1.2 v1.r13p0-00rel0-git(a4271c9).31ba04af2d3c01618138bef3aed66c2c", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://www.dropbox.com/s/vhuqo0wc39lky0a/resnet50_v1.no-argmax.tflite", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by Collective Knowledge v1.15.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-armnn-v20.08-neon", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 2.5, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "d801ca62ec949989", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TF -> TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 54354665, "90.00 percentile latency (ns)": 73281484, "90th percentile latency (ns)": 73281484, "95.00 percentile latency (ns)": 79760665, "97.00 percentile latency (ns)": 92973566, "99.00 percentile latency (ns)": 105632028, "99.90 percentile latency (ns)": 113682094, "Max latency (ns)": 113991702, "Mean latency (ns)": 59248970, "Min duration satisfied": "Yes", "Min latency (ns)": 51654559, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 16.87, "QPS w/o loadgen overhead": 16.88, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 73.281484, "characteristics.90th_percentile_latency_ns": 73281484.0, "characteristics.90th_percentile_latency_s": 0.073281484, "characteristics.90th_percentile_latency_us": 73281.484, "characteristics.accuracy": 76.442, "characteristics.good": 38221, "characteristics.total": 50000, "ck_system": "xavier-armnn-v20.08-neon", "ck_used": true, "cooling": "", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "closed", "formal_model": "resnet50-v1.5", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v20.08 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "resnet50", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/closed/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/closed/dividiti/results/xavier-armnn-v20.08-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "PyCUDA 2019.1.2", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://www.dropbox.com/s/vhuqo0wc39lky0a/resnet50_v1.no-argmax.tflite", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by Collective Knowledge v1.15.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-armnn-v20.08-neon", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 10, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "c9f7b4d7cb3849d6", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TF -> TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 740072004, "90.00 percentile latency (ns)": 759539316, "90th percentile latency (ns)": 759539316, "95.00 percentile latency (ns)": 766643291, "97.00 percentile latency (ns)": 770167224, "99.00 percentile latency (ns)": 778577706, "99.90 percentile latency (ns)": 871489612, "Max latency (ns)": 881408945, "Mean latency (ns)": 740857168, "Min duration satisfied": "Yes", "Min latency (ns)": 692530967, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 1.35, "QPS w/o loadgen overhead": 1.35, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 759.539316, "characteristics.90th_percentile_latency_ns": 759539316.0, "characteristics.90th_percentile_latency_s": 0.759539316, "characteristics.90th_percentile_latency_us": 759539.316, "characteristics.accuracy": 76.442, "characteristics.good": 38221, "characteristics.total": 50000, "ck_system": "rpi4-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "closed", "formal_model": "resnet50-v1.5", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "https://www.raspberrypi.org/products/raspberry-pi-4-model-b/specifications/", "informal_model": "resnet50", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/closed/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/closed/dividiti/results/rpi4-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Raspbian Bullseye (Debian 11); kernel Linux rpi4 5.4.51-v7l+ #1327 SMP (Thu Jul 23 11:04:39 BST 2020)", "other_software_stack": "GCC 9.3.0; Python 3.7.9", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://www.dropbox.com/s/vhuqo0wc39lky0a/resnet50_v1.no-argmax.tflite", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by Collective Knowledge v1.15.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4-tflite-v2.2.0-ruy", "system_name": "Raspberry Pi 4 (rpi4)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 1.42857, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "c08c4e7c82e5f6bc", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TF -> TFLite" }, { "50.00 percentile latency (ns)": 439464059, "90.00 percentile latency (ns)": 544726800, "90th percentile latency (ns)": 544726800, "95.00 percentile latency (ns)": 572200370, "97.00 percentile latency (ns)": 584122745, "99.00 percentile latency (ns)": 606464637, "99.90 percentile latency (ns)": 631151169, "Max latency (ns)": 640230615, "Mean latency (ns)": 456439132, "Min duration satisfied": "Yes", "Min latency (ns)": 390705336, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 2.19, "QPS w/o loadgen overhead": 2.19, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 544.7268, "characteristics.90th_percentile_latency_ns": 544726800.0, "characteristics.90th_percentile_latency_s": 0.5447268, "characteristics.90th_percentile_latency_us": 544726.8, "characteristics.accuracy": 76.442, "characteristics.good": 38221, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.2.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "closed", "formal_model": "resnet50-v1.5", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.2.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "http://en.t-firefly.com/product/rk3399/; http://opensource.rock-chips.com/wiki_RK3399", "informal_model": "resnet50", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/closed/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/closed/dividiti/results/firefly-tflite-v2.2.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "GCC 7.5.0; Python 3.5.2; OpenCL driver 1.2 v1.r13p0-00rel0-git(a4271c9).31ba04af2d3c01618138bef3aed66c2c", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://www.dropbox.com/s/vhuqo0wc39lky0a/resnet50_v1.no-argmax.tflite", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by Collective Knowledge v1.15.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.2.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 1.42857, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "444054a3c27e6d91", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TF -> TFLite" }, { "50.00 percentile latency (ns)": 352151349, "90.00 percentile latency (ns)": 363624509, "90th percentile latency (ns)": 363624509, "95.00 percentile latency (ns)": 367198075, "97.00 percentile latency (ns)": 369972606, "99.00 percentile latency (ns)": 372311101, "99.90 percentile latency (ns)": 376700364, "Max latency (ns)": 376992490, "Mean latency (ns)": 352711193, "Min duration satisfied": "Yes", "Min latency (ns)": 337963041, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 2.83, "QPS w/o loadgen overhead": 2.84, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 363.624509, "characteristics.90th_percentile_latency_ns": 363624509.0, "characteristics.90th_percentile_latency_s": 0.363624509, "characteristics.90th_percentile_latency_us": 363624.509, "characteristics.accuracy": 76.442, "characteristics.good": 38221, "characteristics.total": 50000, "ck_system": "rpi4coral-armnn-v20.08-neon", "ck_used": true, "cooling": "MakerHawk Pi-FAN DC Brushless Cooling Fan LD3007MS", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "closed", "formal_model": "resnet50-v1.5", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v20.08 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "https://www.raspberrypi.org/products/raspberry-pi-4-model-b/specifications/", "informal_model": "resnet50", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/closed/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/closed/dividiti/results/rpi4coral-armnn-v20.08-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.1; kernel 5.4.0-1018-raspi #20-Ubuntu SMP (Sun Sep 6 05:11:16 UTC 2020)", "other_software_stack": "GCC 9.3.0; Python 3.8.2", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://www.dropbox.com/s/vhuqo0wc39lky0a/resnet50_v1.no-argmax.tflite", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by Collective Knowledge v1.15.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-armnn-v20.08-neon", "system_name": "Raspberry Pi 4 with Coral (rpi4coral)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 2.5, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "12f44de9c2346420", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TF -> TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 456045411, "90.00 percentile latency (ns)": 458246019, "90th percentile latency (ns)": 458246019, "95.00 percentile latency (ns)": 462346171, "97.00 percentile latency (ns)": 463735428, "99.00 percentile latency (ns)": 465700283, "99.90 percentile latency (ns)": 475616259, "Max latency (ns)": 483787909, "Mean latency (ns)": 456536767, "Min duration satisfied": "Yes", "Min latency (ns)": 445051288, "Min queries satisfied": "Yes", "Mode": "Performance", "QPS w/ loadgen overhead": 2.19, "QPS w/o loadgen overhead": 2.19, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "800 MHz", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "4 GiB (shared with host)", "accelerator_memory_configuration": "-", "accelerator_model_name": "Arm Mali-T860 MP4", "accelerator_on-chip_memories": "-", "accelerators_per_node": 1, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 458.246019, "characteristics.90th_percentile_latency_ns": 458246019.0, "characteristics.90th_percentile_latency_s": 0.458246019, "characteristics.90th_percentile_latency_us": 458246.019, "characteristics.accuracy": 76.442, "characteristics.good": 38221, "characteristics.total": 50000, "ck_system": "firefly-armnn-v20.08-opencl", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "closed", "formal_model": "resnet50-v1.5", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v20.08 (OpenCL)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "http://en.t-firefly.com/product/rk3399/; http://opensource.rock-chips.com/wiki_RK3399", "informal_model": "resnet50", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 60000, "min_query_count": 1024, "mlperf_version": 0.7, "normalize_cores": 1, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v0.7/tree/master/closed/dividiti/code", "note_details": "https://github.com/mlcommons/inference_results_v0.7/tree/master/closed/dividiti/results/firefly-armnn-v20.08-opencl", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "GCC 7.5.0; Python 3.5.2; OpenCL driver 1.2 v1.r13p0-00rel0-git(a4271c9).31ba04af2d3c01618138bef3aed66c2c", "performance_issue_same": true, "performance_issue_same_index": 0, "performance_issue_unique": true, "performance_sample_count": 1024, "print_timestamps": true, "problem": false, "qsl_rng_seed": 12786827339337101903, "retraining": "no", "sample_index_rng_seed": 12640797754436136668, "samples_per_query": 1, "schedule_rng_seed": 3135815929913719677, "starting_weights_filename": "https://www.dropbox.com/s/vhuqo0wc39lky0a/resnet50_v1.no-argmax.tflite", "status": "available", "submitter": "dividiti", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/dividiti", "sw_notes": "Powered by Collective Knowledge v1.15.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-armnn-v20.08-opencl", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 2.5, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "dc0054a998a5f040", "use_accelerator": true, "weight_data_types": "fp32", "weight_transformations": "TF -> TFLite -> ArmNN" } ]