[ { "50.00 percentile latency (ns)": 7272980, "90.00 percentile latency (ns)": 9629055, "90th percentile latency (ns)": 9629055, "95.00 percentile latency (ns)": 11572662, "97.00 percentile latency (ns)": 12899029, "99.00 percentile latency (ns)": 15576216, "99.90 percentile latency (ns)": 32024463, "Max latency (ns)": 74455334, "Mean latency (ns)": 7940213, "Min duration satisfied": "Yes", "Min latency (ns)": 6216617, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 125.63, "QPS w/o loadgen overhead": 125.94, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 9.629055, "characteristics.90th_percentile_latency_ns": 9629055.0, "characteristics.90th_percentile_latency_s": 0.009629055, "characteristics.90th_percentile_latency_us": 9629.055, "characteristics.accuracy": 68.242, "characteristics.good": 34121, "characteristics.power": 0.20621976879011483, "characteristics.power.normalized_per_core": 0.025777471098764354, "characteristics.power.normalized_per_processor": 0.20621976879011483, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.75-192-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-0.75-192-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.75_192.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 125, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "04ec0e4485fbc06e", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 7911166, "90.00 percentile latency (ns)": 10938850, "90th percentile latency (ns)": 10938850, "95.00 percentile latency (ns)": 12975998, "97.00 percentile latency (ns)": 14286099, "99.00 percentile latency (ns)": 17023210, "99.90 percentile latency (ns)": 35423488, "Max latency (ns)": 160785610, "Mean latency (ns)": 8640778, "Min duration satisfied": "Yes", "Min latency (ns)": 6641026, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 115.51, "QPS w/o loadgen overhead": 115.73, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 10.93885, "characteristics.90th_percentile_latency_ns": 10938850.0, "characteristics.90th_percentile_latency_s": 0.01093885, "characteristics.90th_percentile_latency_us": 10938.85, "characteristics.accuracy": 70.738, "characteristics.good": 35369, "characteristics.power": 0.220699899861769, "characteristics.power.normalized_per_core": 0.027587487482721124, "characteristics.power.normalized_per_processor": 0.220699899861769, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-192-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-1.0-192-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_1.0_192.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 100, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "dc90a6b2885441cc", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 78625979, "90.00 percentile latency (ns)": 89772868, "90th percentile latency (ns)": 89772868, "95.00 percentile latency (ns)": 94199691, "97.00 percentile latency (ns)": 96538418, "99.00 percentile latency (ns)": 104299886, "99.90 percentile latency (ns)": 178814199, "Max latency (ns)": 192755891, "Mean latency (ns)": 79720976, "Min duration satisfied": "Yes", "Min latency (ns)": 67947737, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 12.54, "QPS w/o loadgen overhead": 12.54, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 89.772868, "characteristics.90th_percentile_latency_ns": 89772868.0, "characteristics.90th_percentile_latency_s": 0.089772868, "characteristics.90th_percentile_latency_us": 89772.868, "characteristics.accuracy": 78.514, "characteristics.good": 39257, "characteristics.power": 1.6909914651228932, "characteristics.power.normalized_per_core": 0.21137393314036165, "characteristics.power.normalized_per_processor": 1.6909914651228932, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite4-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "efficientnet-lite4-quantized", "input_data_types": "uint8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite4.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 12.6582, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "e6df2c67bf44051b", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 6993247, "90.00 percentile latency (ns)": 9910143, "90th percentile latency (ns)": 9910143, "95.00 percentile latency (ns)": 12315725, "97.00 percentile latency (ns)": 13545418, "99.00 percentile latency (ns)": 15563205, "99.90 percentile latency (ns)": 30036056, "Max latency (ns)": 122747374, "Mean latency (ns)": 7726643, "Min duration satisfied": "Yes", "Min latency (ns)": 5955504, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 129.28, "QPS w/o loadgen overhead": 129.42, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 9.910143, "characteristics.90th_percentile_latency_ns": 9910143.0, "characteristics.90th_percentile_latency_s": 0.009910143, "characteristics.90th_percentile_latency_us": 9910.143, "characteristics.accuracy": 63.542, "characteristics.good": 31771, "characteristics.power": 0.15782821250657486, "characteristics.power.normalized_per_core": 0.019728526563321858, "characteristics.power.normalized_per_processor": 0.15782821250657486, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-224-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-0.5-224-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_224_50.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 100, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "694599969d4a659c", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 2265351, "90.00 percentile latency (ns)": 3374649, "90th percentile latency (ns)": 3374649, "95.00 percentile latency (ns)": 4198015, "97.00 percentile latency (ns)": 4574064, "99.00 percentile latency (ns)": 6696975, "99.90 percentile latency (ns)": 20101170, "Max latency (ns)": 135472817, "Mean latency (ns)": 2591644, "Min duration satisfied": "Yes", "Min latency (ns)": 1831443, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 384.01, "QPS w/o loadgen overhead": 385.86, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 3.374649, "characteristics.90th_percentile_latency_ns": 3374649.0, "characteristics.90th_percentile_latency_s": 0.003374649, "characteristics.90th_percentile_latency_us": 3374.649, "characteristics.accuracy": 52.172, "characteristics.good": 26086, "characteristics.power": 0.05911729065377804, "characteristics.power.normalized_per_core": 0.007389661331722255, "characteristics.power.normalized_per_processor": 0.05911729065377804, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-128-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-0.35-128-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.35_128.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 250, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "49dd3d26471e60cd", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 2468086, "90.00 percentile latency (ns)": 3988450, "90th percentile latency (ns)": 3988450, "95.00 percentile latency (ns)": 4715488, "97.00 percentile latency (ns)": 5410020, "99.00 percentile latency (ns)": 8200873, "99.90 percentile latency (ns)": 22693278, "Max latency (ns)": 123334660, "Mean latency (ns)": 2887360, "Min duration satisfied": "Yes", "Min latency (ns)": 2010655, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 344.83, "QPS w/o loadgen overhead": 346.34, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 3.98845, "characteristics.90th_percentile_latency_ns": 3988450.0, "characteristics.90th_percentile_latency_s": 0.00398845, "characteristics.90th_percentile_latency_us": 3988.45, "characteristics.accuracy": 58.402, "characteristics.good": 29201, "characteristics.power": 0.0671766715966322, "characteristics.power.normalized_per_core": 0.008397083949579024, "characteristics.power.normalized_per_processor": 0.0671766715966322, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-128-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-0.5-128-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.5_128.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 200, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "7b9dffa95b4402d8", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 4681071, "90.00 percentile latency (ns)": 6842036, "90th percentile latency (ns)": 6842036, "95.00 percentile latency (ns)": 8190831, "97.00 percentile latency (ns)": 9317791, "99.00 percentile latency (ns)": 11976858, "99.90 percentile latency (ns)": 28056652, "Max latency (ns)": 127344079, "Mean latency (ns)": 5325011, "Min duration satisfied": "Yes", "Min latency (ns)": 3852844, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 187.27, "QPS w/o loadgen overhead": 187.79, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 6.842036, "characteristics.90th_percentile_latency_ns": 6842036.0, "characteristics.90th_percentile_latency_s": 0.006842036, "characteristics.90th_percentile_latency_us": 6842.036, "characteristics.accuracy": 60.976, "characteristics.good": 30488, "characteristics.power": 0.12634835790556648, "characteristics.power.normalized_per_core": 0.01579354473819581, "characteristics.power.normalized_per_processor": 0.12634835790556648, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-0.35-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.35_224.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 142.857, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "8288b2a1f3f41fba", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 2589166, "90.00 percentile latency (ns)": 3689949, "90th percentile latency (ns)": 3689949, "95.00 percentile latency (ns)": 4333752, "97.00 percentile latency (ns)": 4897362, "99.00 percentile latency (ns)": 7005770, "99.90 percentile latency (ns)": 18754400, "Max latency (ns)": 63487856, "Mean latency (ns)": 2892981, "Min duration satisfied": "Yes", "Min latency (ns)": 2138811, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 344.99, "QPS w/o loadgen overhead": 345.66, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 3.689949, "characteristics.90th_percentile_latency_ns": 3689949.0, "characteristics.90th_percentile_latency_s": 0.003689949, "characteristics.90th_percentile_latency_us": 3689.949, "characteristics.accuracy": 48.162, "characteristics.good": 24081, "characteristics.power": 0.05831590277536222, "characteristics.power.normalized_per_core": 0.007289487846920278, "characteristics.power.normalized_per_processor": 0.05831590277536222, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.25-192-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-0.25-192-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.25_192_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 200, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "053c4c1243caa9ab", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 13188553, "90.00 percentile latency (ns)": 19281168, "90th percentile latency (ns)": 19281168, "95.00 percentile latency (ns)": 20520711, "97.00 percentile latency (ns)": 21645729, "99.00 percentile latency (ns)": 26984860, "99.90 percentile latency (ns)": 46796519, "Max latency (ns)": 133426846, "Mean latency (ns)": 14663460, "Min duration satisfied": "Yes", "Min latency (ns)": 10358851, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 68.1, "QPS w/o loadgen overhead": 68.2, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 19.281168, "characteristics.90th_percentile_latency_ns": 19281168.0, "characteristics.90th_percentile_latency_s": 0.019281168, "characteristics.90th_percentile_latency_us": 19281.168, "characteristics.accuracy": 75.068, "characteristics.good": 37534, "characteristics.power": 0.38565563359289756, "characteristics.power.normalized_per_core": 0.048206954199112195, "characteristics.power.normalized_per_processor": 0.38565563359289756, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite0-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "efficientnet-lite0-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite0.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 71.4286, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "dcf8889a8ea5de7b", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 3002217, "90.00 percentile latency (ns)": 4357998, "90th percentile latency (ns)": 4357998, "95.00 percentile latency (ns)": 5207981, "97.00 percentile latency (ns)": 6082756, "99.00 percentile latency (ns)": 8310956, "99.90 percentile latency (ns)": 21694318, "Max latency (ns)": 69956547, "Mean latency (ns)": 3413612, "Min duration satisfied": "Yes", "Min latency (ns)": 2516921, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 292.48, "QPS w/o loadgen overhead": 292.94, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 4.357998, "characteristics.90th_percentile_latency_ns": 4357998.0, "characteristics.90th_percentile_latency_s": 0.004357998, "characteristics.90th_percentile_latency_us": 4357.998, "characteristics.accuracy": 50.242, "characteristics.good": 25121, "characteristics.power": 0.06892525542620424, "characteristics.power.normalized_per_core": 0.00861565692827553, "characteristics.power.normalized_per_processor": 0.06892525542620424, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.25-224-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-0.25-224-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.25_224_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 166.667, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "4506c470cb268753", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 3167284, "90.00 percentile latency (ns)": 4934762, "90th percentile latency (ns)": 4934762, "95.00 percentile latency (ns)": 5907637, "97.00 percentile latency (ns)": 6816540, "99.00 percentile latency (ns)": 9020998, "99.90 percentile latency (ns)": 23110114, "Max latency (ns)": 72862640, "Mean latency (ns)": 3701150, "Min duration satisfied": "Yes", "Min latency (ns)": 2675581, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 269.23, "QPS w/o loadgen overhead": 270.19, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 4.934762, "characteristics.90th_percentile_latency_ns": 4934762.0, "characteristics.90th_percentile_latency_s": 0.004934762, "characteristics.90th_percentile_latency_us": 4934.762, "characteristics.accuracy": 60.842, "characteristics.good": 30421, "characteristics.power": 0.08935865387948748, "characteristics.power.normalized_per_core": 0.011169831734935935, "characteristics.power.normalized_per_processor": 0.08935865387948748, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.5-160-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-0.5-160-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.5_160.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 200, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "7c815a5c384f16ac", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 6575562, "90.00 percentile latency (ns)": 9103972, "90th percentile latency (ns)": 9103972, "95.00 percentile latency (ns)": 11016020, "97.00 percentile latency (ns)": 12343545, "99.00 percentile latency (ns)": 15188400, "99.90 percentile latency (ns)": 35668012, "Max latency (ns)": 128413159, "Mean latency (ns)": 7311525, "Min duration satisfied": "Yes", "Min latency (ns)": 5146733, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 136.46, "QPS w/o loadgen overhead": 136.77, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 9.103972, "characteristics.90th_percentile_latency_ns": 9103972.0, "characteristics.90th_percentile_latency_s": 0.009103972, "characteristics.90th_percentile_latency_us": 9103.972, "characteristics.accuracy": 69.016, "characteristics.good": 34508, "characteristics.power": 0.18461567587109887, "characteristics.power.normalized_per_core": 0.02307695948388736, "characteristics.power.normalized_per_processor": 0.18461567587109887, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-160-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-1.0-160-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_1.0_160.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 125, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "68c4acc97a8e8115", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 22649810, "90.00 percentile latency (ns)": 30262782, "90th percentile latency (ns)": 30262782, "95.00 percentile latency (ns)": 32513672, "97.00 percentile latency (ns)": 34583235, "99.00 percentile latency (ns)": 40767709, "99.90 percentile latency (ns)": 78885616, "Max latency (ns)": 157675748, "Mean latency (ns)": 24169196, "Min duration satisfied": "Yes", "Min latency (ns)": 19463689, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 41.35, "QPS w/o loadgen overhead": 41.37, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 30.262782, "characteristics.90th_percentile_latency_ns": 30262782.0, "characteristics.90th_percentile_latency_s": 0.030262782, "characteristics.90th_percentile_latency_us": 30262.782, "characteristics.accuracy": 74.098, "characteristics.good": 37049, "characteristics.power": 0.5007269037841079, "characteristics.power.normalized_per_core": 0.06259086297301349, "characteristics.power.normalized_per_processor": 0.5007269037841079, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite1-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "efficientnet-lite1-quantized", "input_data_types": "uint8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite1.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 37.037, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "f13b4e4bb60ae785", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 5512629, "90.00 percentile latency (ns)": 8097241, "90th percentile latency (ns)": 8097241, "95.00 percentile latency (ns)": 10121206, "97.00 percentile latency (ns)": 11417179, "99.00 percentile latency (ns)": 13469131, "99.90 percentile latency (ns)": 29671679, "Max latency (ns)": 122685286, "Mean latency (ns)": 6320826, "Min duration satisfied": "Yes", "Min latency (ns)": 4756739, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 157.98, "QPS w/o loadgen overhead": 158.21, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 8.097241, "characteristics.90th_percentile_latency_ns": 8097241.0, "characteristics.90th_percentile_latency_s": 0.008097241, "characteristics.90th_percentile_latency_us": 8097.241, "characteristics.accuracy": 61.924, "characteristics.good": 30962, "characteristics.power": 0.12777007980014077, "characteristics.power.normalized_per_core": 0.015971259975017596, "characteristics.power.normalized_per_processor": 0.12777007980014077, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-192-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-0.5-192-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_192_50.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 111.111, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "bb8ed0cecd4729a5", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 5675430, "90.00 percentile latency (ns)": 8679440, "90th percentile latency (ns)": 8679440, "95.00 percentile latency (ns)": 10599911, "97.00 percentile latency (ns)": 11677466, "99.00 percentile latency (ns)": 13510318, "99.90 percentile latency (ns)": 28355290, "Max latency (ns)": 75798944, "Mean latency (ns)": 6434368, "Min duration satisfied": "Yes", "Min latency (ns)": 4948740, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 155.2, "QPS w/o loadgen overhead": 155.42, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 8.67944, "characteristics.90th_percentile_latency_ns": 8679440.0, "characteristics.90th_percentile_latency_s": 0.00867944, "characteristics.90th_percentile_latency_us": 8679.44, "characteristics.accuracy": 62.298, "characteristics.good": 31149, "characteristics.power": 0.13143239301700219, "characteristics.power.normalized_per_core": 0.016429049127125273, "characteristics.power.normalized_per_processor": 0.13143239301700219, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.5-224-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-0.5-224-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.5_224_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 111.111, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "a3a95cb56d44fdfb", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 2754562, "90.00 percentile latency (ns)": 3943099, "90th percentile latency (ns)": 3943099, "95.00 percentile latency (ns)": 4446674, "97.00 percentile latency (ns)": 4824392, "99.00 percentile latency (ns)": 7038218, "99.90 percentile latency (ns)": 21686764, "Max latency (ns)": 129179319, "Mean latency (ns)": 3095085, "Min duration satisfied": "Yes", "Min latency (ns)": 2381040, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 322.52, "QPS w/o loadgen overhead": 323.09, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 3.943099, "characteristics.90th_percentile_latency_ns": 3943099.0, "characteristics.90th_percentile_latency_s": 0.003943099, "characteristics.90th_percentile_latency_us": 3943.099, "characteristics.accuracy": 49.12, "characteristics.good": 24560, "characteristics.power": 0.06122496036446095, "characteristics.power.normalized_per_core": 0.007653120045557619, "characteristics.power.normalized_per_processor": 0.06122496036446095, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-128-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-0.35-128-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_128_35.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 200, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "4fb7b4ecac6bcbaf", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 22499902, "90.00 percentile latency (ns)": 29464475, "90th percentile latency (ns)": 29464475, "95.00 percentile latency (ns)": 32793618, "97.00 percentile latency (ns)": 36308786, "99.00 percentile latency (ns)": 42190941, "99.90 percentile latency (ns)": 71603351, "Max latency (ns)": 149480489, "Mean latency (ns)": 23939449, "Min duration satisfied": "Yes", "Min latency (ns)": 19285101, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 41.75, "QPS w/o loadgen overhead": 41.77, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 29.464475, "characteristics.90th_percentile_latency_ns": 29464475.0, "characteristics.90th_percentile_latency_s": 0.029464475, "characteristics.90th_percentile_latency_us": 29464.475, "characteristics.accuracy": 73.584, "characteristics.good": 36792, "characteristics.power": 0.49394273664172983, "characteristics.power.normalized_per_core": 0.06174284208021623, "characteristics.power.normalized_per_processor": 0.49394273664172983, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.4-224-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-1.4-224-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_224_140.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 40, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "e3acbfdf1943e694", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 16301685, "90.00 percentile latency (ns)": 19529412, "90th percentile latency (ns)": 19529412, "95.00 percentile latency (ns)": 21500153, "97.00 percentile latency (ns)": 22566635, "99.00 percentile latency (ns)": 26088867, "99.90 percentile latency (ns)": 52406256, "Max latency (ns)": 93765880, "Mean latency (ns)": 16976853, "Min duration satisfied": "Yes", "Min latency (ns)": 14077841, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 58.86, "QPS w/o loadgen overhead": 58.9, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 19.529412, "characteristics.90th_percentile_latency_ns": 19529412.0, "characteristics.90th_percentile_latency_s": 0.019529412, "characteristics.90th_percentile_latency_us": 19529.412, "characteristics.accuracy": 70.772, "characteristics.good": 35386, "characteristics.power": 0.349767709496131, "characteristics.power.normalized_per_core": 0.043720963687016376, "characteristics.power.normalized_per_processor": 0.349767709496131, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-1.0-224-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-1.0-224-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_1.0_224_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 55.5556, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "b4d744cabc88a4f8", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 1868215, "90.00 percentile latency (ns)": 2594904, "90th percentile latency (ns)": 2594904, "95.00 percentile latency (ns)": 2988938, "97.00 percentile latency (ns)": 3418879, "99.00 percentile latency (ns)": 4512690, "99.90 percentile latency (ns)": 16145899, "Max latency (ns)": 68488992, "Mean latency (ns)": 2072893, "Min duration satisfied": "Yes", "Min latency (ns)": 1608586, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 481.03, "QPS w/o loadgen overhead": 482.42, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 2.594904, "characteristics.90th_percentile_latency_ns": 2594904.0, "characteristics.90th_percentile_latency_s": 0.002594904, "characteristics.90th_percentile_latency_us": 2594.904, "characteristics.accuracy": 47.808, "characteristics.good": 23904, "characteristics.power": 0.0465621489773787, "characteristics.power.normalized_per_core": 0.005820268622172338, "characteristics.power.normalized_per_processor": 0.0465621489773787, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.25-160-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-0.25-160-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.25_160.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 250, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "ef543a9a4c3f36dc", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 3682414, "90.00 percentile latency (ns)": 5579233, "90th percentile latency (ns)": 5579233, "95.00 percentile latency (ns)": 6600587, "97.00 percentile latency (ns)": 7782183, "99.00 percentile latency (ns)": 10658674, "99.90 percentile latency (ns)": 27272082, "Max latency (ns)": 123568126, "Mean latency (ns)": 4277698, "Min duration satisfied": "Yes", "Min latency (ns)": 2938248, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 232.94, "QPS w/o loadgen overhead": 233.77, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 5.579233, "characteristics.90th_percentile_latency_ns": 5579233.0, "characteristics.90th_percentile_latency_s": 0.005579233, "characteristics.90th_percentile_latency_us": 5579.233, "characteristics.accuracy": 64.038, "characteristics.good": 32019, "characteristics.power": 0.1020411915882501, "characteristics.power.normalized_per_core": 0.012755148948531263, "characteristics.power.normalized_per_processor": 0.1020411915882501, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-128-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-0.75-128-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.75_128.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 166.667, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "2342e28cddfa1f37", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 3149970, "90.00 percentile latency (ns)": 4029306, "90th percentile latency (ns)": 4029306, "95.00 percentile latency (ns)": 4722618, "97.00 percentile latency (ns)": 5274996, "99.00 percentile latency (ns)": 7352887, "99.90 percentile latency (ns)": 21464031, "Max latency (ns)": 82111275, "Mean latency (ns)": 3435341, "Min duration satisfied": "Yes", "Min latency (ns)": 2695420, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 290.22, "QPS w/o loadgen overhead": 291.09, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 4.029306, "characteristics.90th_percentile_latency_ns": 4029306.0, "characteristics.90th_percentile_latency_s": 0.004029306, "characteristics.90th_percentile_latency_us": 4029.306, "characteristics.accuracy": 51.848, "characteristics.good": 25924, "characteristics.power": 0.08086796223554552, "characteristics.power.normalized_per_core": 0.01010849527944319, "characteristics.power.normalized_per_processor": 0.08086796223554552, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.25-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-0.25-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.25_224.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 200, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "48ff4a18484b835f", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 4655066, "90.00 percentile latency (ns)": 6596660, "90th percentile latency (ns)": 6596660, "95.00 percentile latency (ns)": 8217536, "97.00 percentile latency (ns)": 9571745, "99.00 percentile latency (ns)": 11924108, "99.90 percentile latency (ns)": 26088262, "Max latency (ns)": 125972920, "Mean latency (ns)": 5287509, "Min duration satisfied": "Yes", "Min latency (ns)": 3957465, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 188.84, "QPS w/o loadgen overhead": 189.12, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 6.59666, "characteristics.90th_percentile_latency_ns": 6596660.0, "characteristics.90th_percentile_latency_s": 0.00659666, "characteristics.90th_percentile_latency_us": 6596.66, "characteristics.accuracy": 59.226, "characteristics.good": 29613, "characteristics.power": 0.1043710393741373, "characteristics.power.normalized_per_core": 0.013046379921767163, "characteristics.power.normalized_per_processor": 0.1043710393741373, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-160-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-0.5-160-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_160_50.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 142.857, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "4920baa80d7980a5", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 9626867, "90.00 percentile latency (ns)": 11938267, "90th percentile latency (ns)": 11938267, "95.00 percentile latency (ns)": 14228675, "97.00 percentile latency (ns)": 15428633, "99.00 percentile latency (ns)": 18222744, "99.90 percentile latency (ns)": 39503609, "Max latency (ns)": 79216507, "Mean latency (ns)": 10337667, "Min duration satisfied": "Yes", "Min latency (ns)": 8190387, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 96.62, "QPS w/o loadgen overhead": 96.73, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 11.938267, "characteristics.90th_percentile_latency_ns": 11938267.0, "characteristics.90th_percentile_latency_s": 0.011938267, "characteristics.90th_percentile_latency_us": 11938.267, "characteristics.accuracy": 68.248, "characteristics.good": 34124, "characteristics.power": 0.21179553655827202, "characteristics.power.normalized_per_core": 0.026474442069784002, "characteristics.power.normalized_per_processor": 0.21179553655827202, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-1.0-160-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-1.0-160-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_1.0_160_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 83.3333, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "c55ea04e10b31dfb", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 4378086, "90.00 percentile latency (ns)": 6804404, "90th percentile latency (ns)": 6804404, "95.00 percentile latency (ns)": 8571427, "97.00 percentile latency (ns)": 9954785, "99.00 percentile latency (ns)": 12294122, "99.90 percentile latency (ns)": 27509494, "Max latency (ns)": 128000686, "Mean latency (ns)": 5142050, "Min duration satisfied": "Yes", "Min latency (ns)": 3727176, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 194.21, "QPS w/o loadgen overhead": 194.47, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 6.804404, "characteristics.90th_percentile_latency_ns": 6804404.0, "characteristics.90th_percentile_latency_s": 0.006804404, "characteristics.90th_percentile_latency_us": 6804.404, "characteristics.accuracy": 59.12, "characteristics.good": 29560, "characteristics.power": 0.1018509717294776, "characteristics.power.normalized_per_core": 0.0127313714661847, "characteristics.power.normalized_per_processor": 0.1018509717294776, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-96-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-1.0-96-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_96_100.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 142.857, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "cd3f7649ad9fd11c", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 4523192, "90.00 percentile latency (ns)": 6214310, "90th percentile latency (ns)": 6214310, "95.00 percentile latency (ns)": 6917674, "97.00 percentile latency (ns)": 8119558, "99.00 percentile latency (ns)": 11018002, "99.90 percentile latency (ns)": 24635037, "Max latency (ns)": 71195600, "Mean latency (ns)": 5058455, "Min duration satisfied": "Yes", "Min latency (ns)": 4011043, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 197.4, "QPS w/o loadgen overhead": 197.69, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 6.21431, "characteristics.90th_percentile_latency_ns": 6214310.0, "characteristics.90th_percentile_latency_s": 0.00621431, "characteristics.90th_percentile_latency_us": 6214.31, "characteristics.accuracy": 58.46, "characteristics.good": 29230, "characteristics.power": 0.1020471857897199, "characteristics.power.normalized_per_core": 0.012755898223714987, "characteristics.power.normalized_per_processor": 0.1020471857897199, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.75-128-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-0.75-128-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.75_128_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 142.857, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "92cc8fba47d8b7ba", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 12917624, "90.00 percentile latency (ns)": 18922679, "90th percentile latency (ns)": 18922679, "95.00 percentile latency (ns)": 20467190, "97.00 percentile latency (ns)": 21640216, "99.00 percentile latency (ns)": 25918506, "99.90 percentile latency (ns)": 46384423, "Max latency (ns)": 128637499, "Mean latency (ns)": 14136954, "Min duration satisfied": "Yes", "Min latency (ns)": 10903074, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 70.66, "QPS w/o loadgen overhead": 70.74, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 18.922679, "characteristics.90th_percentile_latency_ns": 18922679.0, "characteristics.90th_percentile_latency_s": 0.018922679, "characteristics.90th_percentile_latency_us": 18922.679, "characteristics.accuracy": 72.91, "characteristics.good": 36455, "characteristics.power": 0.2929123298591704, "characteristics.power.normalized_per_core": 0.0366140412323963, "characteristics.power.normalized_per_processor": 0.2929123298591704, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-large_224_1.0_uint8", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v3-large_224_1.0_uint8", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-large_224_1.0_uint8.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 62.5, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "d6c9934c6e952942", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 14173416, "90.00 percentile latency (ns)": 21286241, "90th percentile latency (ns)": 21286241, "95.00 percentile latency (ns)": 24615131, "97.00 percentile latency (ns)": 27119050, "99.00 percentile latency (ns)": 30658809, "99.90 percentile latency (ns)": 58881312, "Max latency (ns)": 137478978, "Mean latency (ns)": 15724905, "Min duration satisfied": "Yes", "Min latency (ns)": 11302529, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 63.54, "QPS w/o loadgen overhead": 63.59, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 21.286241, "characteristics.90th_percentile_latency_ns": 21286241.0, "characteristics.90th_percentile_latency_s": 0.021286241, "characteristics.90th_percentile_latency_us": 21286.241, "characteristics.accuracy": 70.542, "characteristics.good": 35271, "characteristics.power": 0.3142789659495668, "characteristics.power.normalized_per_core": 0.03928487074369585, "characteristics.power.normalized_per_processor": 0.3142789659495668, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-224-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-1.0-224-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_224_100.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 55.5556, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "ab876004e8292ce7", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 4591710, "90.00 percentile latency (ns)": 6385803, "90th percentile latency (ns)": 6385803, "95.00 percentile latency (ns)": 7656678, "97.00 percentile latency (ns)": 9014886, "99.00 percentile latency (ns)": 11705945, "99.90 percentile latency (ns)": 26008317, "Max latency (ns)": 112191236, "Mean latency (ns)": 5177181, "Min duration satisfied": "Yes", "Min latency (ns)": 3957242, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 192.89, "QPS w/o loadgen overhead": 193.16, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 6.385803, "characteristics.90th_percentile_latency_ns": 6385803.0, "characteristics.90th_percentile_latency_s": 0.006385803, "characteristics.90th_percentile_latency_us": 6385.803, "characteristics.accuracy": 56.594, "characteristics.good": 28297, "characteristics.power": 0.10359468856493087, "characteristics.power.normalized_per_core": 0.012949336070616359, "characteristics.power.normalized_per_processor": 0.10359468856493087, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-192-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-0.35-192-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_192_35.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 142.857, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "e2a41bbbd7059352", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 8176375, "90.00 percentile latency (ns)": 13853309, "90th percentile latency (ns)": 13853309, "95.00 percentile latency (ns)": 15363650, "97.00 percentile latency (ns)": 16305037, "99.00 percentile latency (ns)": 19024073, "99.90 percentile latency (ns)": 38040819, "Max latency (ns)": 132926394, "Mean latency (ns)": 9393196, "Min duration satisfied": "Yes", "Min latency (ns)": 6567821, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 106.34, "QPS w/o loadgen overhead": 106.46, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 13.853309, "characteristics.90th_percentile_latency_ns": 13853309.0, "characteristics.90th_percentile_latency_s": 0.013853309, "characteristics.90th_percentile_latency_us": 13853.309, "characteristics.accuracy": 67.82, "characteristics.good": 33910, "characteristics.power": 0.19224865834085653, "characteristics.power.normalized_per_core": 0.024031082292607066, "characteristics.power.normalized_per_processor": 0.19224865834085653, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-160-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-1.0-160-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_160_100.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 90.9091, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "4518b2b11ebf48e0", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 1558507, "90.00 percentile latency (ns)": 2268546, "90th percentile latency (ns)": 2268546, "95.00 percentile latency (ns)": 2682223, "97.00 percentile latency (ns)": 3056785, "99.00 percentile latency (ns)": 3914927, "99.90 percentile latency (ns)": 13227837, "Max latency (ns)": 73961783, "Mean latency (ns)": 1753878, "Min duration satisfied": "Yes", "Min latency (ns)": 1331872, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 568.65, "QPS w/o loadgen overhead": 570.17, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 2.268546, "characteristics.90th_percentile_latency_ns": 2268546.0, "characteristics.90th_percentile_latency_s": 0.002268546, "characteristics.90th_percentile_latency_us": 2268.546, "characteristics.accuracy": 44.116, "characteristics.good": 22058, "characteristics.power": 0.0384545274426255, "characteristics.power.normalized_per_core": 0.004806815930328188, "characteristics.power.normalized_per_processor": 0.0384545274426255, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.25-128-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-0.25-128-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.25_128.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "dde7b8126a9477b8", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 2068094, "90.00 percentile latency (ns)": 3030412, "90th percentile latency (ns)": 3030412, "95.00 percentile latency (ns)": 3568197, "97.00 percentile latency (ns)": 3976951, "99.00 percentile latency (ns)": 5664389, "99.90 percentile latency (ns)": 15547597, "Max latency (ns)": 62200196, "Mean latency (ns)": 2323470, "Min duration satisfied": "Yes", "Min latency (ns)": 1710702, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 429.59, "QPS w/o loadgen overhead": 430.39, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 3.030412, "characteristics.90th_percentile_latency_ns": 3030412.0, "characteristics.90th_percentile_latency_s": 0.003030412, "characteristics.90th_percentile_latency_us": 3030.412, "characteristics.accuracy": 45.494, "characteristics.good": 22747, "characteristics.power": 0.04676249059180456, "characteristics.power.normalized_per_core": 0.00584531132397557, "characteristics.power.normalized_per_processor": 0.04676249059180456, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.25-160-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-0.25-160-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.25_160_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 250, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "34c458782a9f33a4", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 11473480, "90.00 percentile latency (ns)": 15845086, "90th percentile latency (ns)": 15845086, "95.00 percentile latency (ns)": 17058437, "97.00 percentile latency (ns)": 17949998, "99.00 percentile latency (ns)": 22140171, "99.90 percentile latency (ns)": 41552937, "Max latency (ns)": 82658104, "Mean latency (ns)": 12462055, "Min duration satisfied": "Yes", "Min latency (ns)": 8534083, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 80.12, "QPS w/o loadgen overhead": 80.24, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 15.845086, "characteristics.90th_percentile_latency_ns": 15845086.0, "characteristics.90th_percentile_latency_s": 0.015845086, "characteristics.90th_percentile_latency_us": 15845.086, "characteristics.accuracy": 70.626, "characteristics.good": 35313, "characteristics.power": 0.328103742239552, "characteristics.power.normalized_per_core": 0.041012967779944, "characteristics.power.normalized_per_processor": 0.328103742239552, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-1.0-192-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-1.0-192-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_1.0_192.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 90.9091, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "642629cd56714223", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 6354116, "90.00 percentile latency (ns)": 9581751, "90th percentile latency (ns)": 9581751, "95.00 percentile latency (ns)": 11643172, "97.00 percentile latency (ns)": 12851213, "99.00 percentile latency (ns)": 14993594, "99.90 percentile latency (ns)": 33768461, "Max latency (ns)": 128921015, "Mean latency (ns)": 7224611, "Min duration satisfied": "Yes", "Min latency (ns)": 5120138, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 138.24, "QPS w/o loadgen overhead": 138.42, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 9.581751, "characteristics.90th_percentile_latency_ns": 9581751.0, "characteristics.90th_percentile_latency_s": 0.009581751, "characteristics.90th_percentile_latency_us": 9581.751, "characteristics.accuracy": 63.454, "characteristics.good": 31727, "characteristics.power": 0.14612452617263227, "characteristics.power.normalized_per_core": 0.018265565771579034, "characteristics.power.normalized_per_processor": 0.14612452617263227, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-128-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-1.0-128-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_128_100.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 111.111, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "e603684e80beccd4", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 12063631, "90.00 percentile latency (ns)": 14007817, "90th percentile latency (ns)": 14007817, "95.00 percentile latency (ns)": 15204704, "97.00 percentile latency (ns)": 16719939, "99.00 percentile latency (ns)": 20739164, "99.90 percentile latency (ns)": 46602609, "Max latency (ns)": 83461607, "Mean latency (ns)": 12639288, "Min duration satisfied": "Yes", "Min latency (ns)": 10452994, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 79.03, "QPS w/o loadgen overhead": 79.12, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 14.007817, "characteristics.90th_percentile_latency_ns": 14007817.0, "characteristics.90th_percentile_latency_s": 0.014007817, "characteristics.90th_percentile_latency_us": 14007.817, "characteristics.accuracy": 70.04, "characteristics.good": 35020, "characteristics.power": 0.26138433803596306, "characteristics.power.normalized_per_core": 0.03267304225449538, "characteristics.power.normalized_per_processor": 0.26138433803596306, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-1.0-192-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-1.0-192-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_1.0_192_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 71.4286, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "5448bb09b6d39ffb", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 30677651, "90.00 percentile latency (ns)": 41117917, "90th percentile latency (ns)": 41117917, "95.00 percentile latency (ns)": 44795886, "97.00 percentile latency (ns)": 48510785, "99.00 percentile latency (ns)": 54832846, "99.90 percentile latency (ns)": 96377529, "Max latency (ns)": 154675726, "Mean latency (ns)": 32949910, "Min duration satisfied": "Yes", "Min latency (ns)": 26110754, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 30.33, "QPS w/o loadgen overhead": 30.35, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 41.117917, "characteristics.90th_percentile_latency_ns": 41117917.0, "characteristics.90th_percentile_latency_s": 0.041117917, "characteristics.90th_percentile_latency_us": 41117.917, "characteristics.accuracy": 74.124, "characteristics.good": 37062, "characteristics.power": 0.69294528179972, "characteristics.power.normalized_per_core": 0.086618160224965, "characteristics.power.normalized_per_processor": 0.69294528179972, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite2-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "efficientnet-lite2-quantized", "input_data_types": "uint8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite2.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 27.7778, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "bf80ca6f67649aca", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 3418906, "90.00 percentile latency (ns)": 5402612, "90th percentile latency (ns)": 5402612, "95.00 percentile latency (ns)": 6862680, "97.00 percentile latency (ns)": 8040460, "99.00 percentile latency (ns)": 10257266, "99.90 percentile latency (ns)": 23474084, "Max latency (ns)": 76043495, "Mean latency (ns)": 4038549, "Min duration satisfied": "Yes", "Min latency (ns)": 2937861, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 247.23, "QPS w/o loadgen overhead": 247.61, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 5.402612, "characteristics.90th_percentile_latency_ns": 5402612.0, "characteristics.90th_percentile_latency_s": 0.005402612, "characteristics.90th_percentile_latency_us": 5402.612, "characteristics.accuracy": 59.444, "characteristics.good": 29722, "characteristics.power": 0.08136734471000807, "characteristics.power.normalized_per_core": 0.01017091808875101, "characteristics.power.normalized_per_processor": 0.08136734471000807, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.5-160-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-0.5-160-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.5_160_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 166.667, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "331244901bd644c3", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 4461975, "90.00 percentile latency (ns)": 6648225, "90th percentile latency (ns)": 6648225, "95.00 percentile latency (ns)": 8682659, "97.00 percentile latency (ns)": 9794808, "99.00 percentile latency (ns)": 11635537, "99.90 percentile latency (ns)": 26625187, "Max latency (ns)": 72033836, "Mean latency (ns)": 5147098, "Min duration satisfied": "Yes", "Min latency (ns)": 3961599, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 194.01, "QPS w/o loadgen overhead": 194.28, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 6.648225, "characteristics.90th_percentile_latency_ns": 6648225.0, "characteristics.90th_percentile_latency_s": 0.006648225, "characteristics.90th_percentile_latency_us": 6648.225, "characteristics.accuracy": 61.456, "characteristics.good": 30728, "characteristics.power": 0.10415101455251449, "characteristics.power.normalized_per_core": 0.013018876819064312, "characteristics.power.normalized_per_processor": 0.10415101455251449, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.5-192-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-0.5-192-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.5_192_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 125, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "bfe0ccae14180ab2", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 5823134, "90.00 percentile latency (ns)": 7851284, "90th percentile latency (ns)": 7851284, "95.00 percentile latency (ns)": 9964376, "97.00 percentile latency (ns)": 11345012, "99.00 percentile latency (ns)": 13578001, "99.90 percentile latency (ns)": 29961386, "Max latency (ns)": 120233923, "Mean latency (ns)": 6477502, "Min duration satisfied": "Yes", "Min latency (ns)": 4939795, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 154.18, "QPS w/o loadgen overhead": 154.38, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 7.851284, "characteristics.90th_percentile_latency_ns": 7851284.0, "characteristics.90th_percentile_latency_s": 0.007851284, "characteristics.90th_percentile_latency_us": 7851.284, "characteristics.accuracy": 58.528, "characteristics.good": 29264, "characteristics.power": 0.12871309508366857, "characteristics.power.normalized_per_core": 0.01608913688545857, "characteristics.power.normalized_per_processor": 0.12871309508366857, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-224-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-0.35-224-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_224_35.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 111.111, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "7013bb4f6db5abe7", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 4504046, "90.00 percentile latency (ns)": 6418373, "90th percentile latency (ns)": 6418373, "95.00 percentile latency (ns)": 7603770, "97.00 percentile latency (ns)": 8731055, "99.00 percentile latency (ns)": 11597106, "99.90 percentile latency (ns)": 28114500, "Max latency (ns)": 120350900, "Mean latency (ns)": 5070490, "Min duration satisfied": "Yes", "Min latency (ns)": 3686921, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 196.65, "QPS w/o loadgen overhead": 197.22, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 6.418373, "characteristics.90th_percentile_latency_ns": 6418373.0, "characteristics.90th_percentile_latency_s": 0.006418373, "characteristics.90th_percentile_latency_us": 6418.373, "characteristics.accuracy": 66.036, "characteristics.good": 33018, "characteristics.power": 0.12492499364352899, "characteristics.power.normalized_per_core": 0.015615624205441124, "characteristics.power.normalized_per_processor": 0.12492499364352899, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-128-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-1.0-128-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_1.0_128.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 166.667, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "d8674149945d0c0a", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 19622143, "90.00 percentile latency (ns)": 26600140, "90th percentile latency (ns)": 26600140, "95.00 percentile latency (ns)": 28258624, "97.00 percentile latency (ns)": 29684798, "99.00 percentile latency (ns)": 35725489, "99.90 percentile latency (ns)": 62252058, "Max latency (ns)": 166883444, "Mean latency (ns)": 21095843, "Min duration satisfied": "Yes", "Min latency (ns)": 14512555, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 47.36, "QPS w/o loadgen overhead": 47.4, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 26.60014, "characteristics.90th_percentile_latency_ns": 26600140.0, "characteristics.90th_percentile_latency_s": 0.02660014, "characteristics.90th_percentile_latency_us": 26600.14, "characteristics.accuracy": 76.642, "characteristics.good": 38321, "characteristics.power": 0.5576905886567809, "characteristics.power.normalized_per_core": 0.06971132358209761, "characteristics.power.normalized_per_processor": 0.5576905886567809, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite1-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "efficientnet-lite1-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite1.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 50, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "953f4e89b4a6da04", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 10808280, "90.00 percentile latency (ns)": 17635924, "90th percentile latency (ns)": 17635924, "95.00 percentile latency (ns)": 19864076, "97.00 percentile latency (ns)": 21164633, "99.00 percentile latency (ns)": 23886408, "99.90 percentile latency (ns)": 43315983, "Max latency (ns)": 147077335, "Mean latency (ns)": 12208508, "Min duration satisfied": "Yes", "Min latency (ns)": 8656759, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 81.83, "QPS w/o loadgen overhead": 81.91, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 17.635924, "characteristics.90th_percentile_latency_ns": 17635924.0, "characteristics.90th_percentile_latency_s": 0.017635924, "characteristics.90th_percentile_latency_us": 17635.924, "characteristics.accuracy": 69.604, "characteristics.good": 34802, "characteristics.power": 0.24845023333565522, "characteristics.power.normalized_per_core": 0.031056279166956902, "characteristics.power.normalized_per_processor": 0.24845023333565522, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-192-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-1.0-192-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_192_100.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 71.4286, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "e44fe79f5304b894", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 8903933, "90.00 percentile latency (ns)": 12755434, "90th percentile latency (ns)": 12755434, "95.00 percentile latency (ns)": 14305979, "97.00 percentile latency (ns)": 15233455, "99.00 percentile latency (ns)": 18666456, "99.90 percentile latency (ns)": 39204426, "Max latency (ns)": 82310036, "Mean latency (ns)": 9814902, "Min duration satisfied": "Yes", "Min latency (ns)": 7681346, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 101.69, "QPS w/o loadgen overhead": 101.89, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 12.755434, "characteristics.90th_percentile_latency_ns": 12755434.0, "characteristics.90th_percentile_latency_s": 0.012755434, "characteristics.90th_percentile_latency_us": 12755.434, "characteristics.accuracy": 69.262, "characteristics.good": 34631, "characteristics.power": 0.25254798992998206, "characteristics.power.normalized_per_core": 0.03156849874124776, "characteristics.power.normalized_per_processor": 0.25254798992998206, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.75-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-0.75-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.75_224.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 90.9091, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "a78465aa11f95d53", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 11598285, "90.00 percentile latency (ns)": 16323818, "90th percentile latency (ns)": 16323818, "95.00 percentile latency (ns)": 18504613, "97.00 percentile latency (ns)": 20045318, "99.00 percentile latency (ns)": 23341807, "99.90 percentile latency (ns)": 42834237, "Max latency (ns)": 123304072, "Mean latency (ns)": 12565286, "Min duration satisfied": "Yes", "Min latency (ns)": 9537039, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 79.51, "QPS w/o loadgen overhead": 79.58, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 16.323818, "characteristics.90th_percentile_latency_ns": 16323818.0, "characteristics.90th_percentile_latency_s": 0.016323818, "characteristics.90th_percentile_latency_us": 16323.818, "characteristics.accuracy": 68.734, "characteristics.good": 34367, "characteristics.power": 0.25417250455082446, "characteristics.power.normalized_per_core": 0.03177156306885306, "characteristics.power.normalized_per_processor": 0.25417250455082446, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-224-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-0.75-224-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_224_75.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 62.5, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "79a1536ff14df67a", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 3943108, "90.00 percentile latency (ns)": 5910070, "90th percentile latency (ns)": 5910070, "95.00 percentile latency (ns)": 6983490, "97.00 percentile latency (ns)": 7965195, "99.00 percentile latency (ns)": 10565495, "99.90 percentile latency (ns)": 26224802, "Max latency (ns)": 88853610, "Mean latency (ns)": 4519135, "Min duration satisfied": "Yes", "Min latency (ns)": 3322410, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 220.58, "QPS w/o loadgen overhead": 221.28, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 5.91007, "characteristics.90th_percentile_latency_ns": 5910070.0, "characteristics.90th_percentile_latency_s": 0.00591007, "characteristics.90th_percentile_latency_us": 5910.07, "characteristics.accuracy": 63.33, "characteristics.good": 31665, "characteristics.power": 0.10140527246350524, "characteristics.power.normalized_per_core": 0.012675659057938155, "characteristics.power.normalized_per_processor": 0.10140527246350524, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-small-minimalistic_224_1.0_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v3-small-minimalistic_224_1.0_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-small-minimalistic_224_1.0_float.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 166.667, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "1284d3cbf4305057", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 2193286, "90.00 percentile latency (ns)": 3544742, "90th percentile latency (ns)": 3544742, "95.00 percentile latency (ns)": 4214948, "97.00 percentile latency (ns)": 4773888, "99.00 percentile latency (ns)": 7036779, "99.90 percentile latency (ns)": 21136819, "Max latency (ns)": 81606746, "Mean latency (ns)": 2576407, "Min duration satisfied": "Yes", "Min latency (ns)": 1842614, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 386.65, "QPS w/o loadgen overhead": 388.14, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 3.544742, "characteristics.90th_percentile_latency_ns": 3544742.0, "characteristics.90th_percentile_latency_s": 0.003544742, "characteristics.90th_percentile_latency_us": 3544.742, "characteristics.accuracy": 57.918, "characteristics.good": 28959, "characteristics.power": 0.06114254924781247, "characteristics.power.normalized_per_core": 0.007642818655976559, "characteristics.power.normalized_per_processor": 0.06114254924781247, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.5-128-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-0.5-128-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.5_128.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 250, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "42c59da5e8335d78", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 14315235, "90.00 percentile latency (ns)": 19040756, "90th percentile latency (ns)": 19040756, "95.00 percentile latency (ns)": 20308550, "97.00 percentile latency (ns)": 21306300, "99.00 percentile latency (ns)": 26206308, "99.90 percentile latency (ns)": 51444309, "Max latency (ns)": 96473327, "Mean latency (ns)": 15175138, "Min duration satisfied": "Yes", "Min latency (ns)": 11242178, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 65.81, "QPS w/o loadgen overhead": 65.9, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 19.040756, "characteristics.90th_percentile_latency_ns": 19040756.0, "characteristics.90th_percentile_latency_s": 0.019040756, "characteristics.90th_percentile_latency_us": 19040.756, "characteristics.accuracy": 71.676, "characteristics.good": 35838, "characteristics.power": 0.40173886309118617, "characteristics.power.normalized_per_core": 0.05021735788639827, "characteristics.power.normalized_per_processor": 0.40173886309118617, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-1.0-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-1.0-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_1.0_224.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 66.6667, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "f8e6e212f6b4482e", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 1988325, "90.00 percentile latency (ns)": 2998265, "90th percentile latency (ns)": 2998265, "95.00 percentile latency (ns)": 3547392, "97.00 percentile latency (ns)": 3909136, "99.00 percentile latency (ns)": 5479634, "99.90 percentile latency (ns)": 16326948, "Max latency (ns)": 97895517, "Mean latency (ns)": 2260297, "Min duration satisfied": "Yes", "Min latency (ns)": 1647509, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 441.6, "QPS w/o loadgen overhead": 442.42, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 2.998265, "characteristics.90th_percentile_latency_ns": 2998265.0, "characteristics.90th_percentile_latency_s": 0.002998265, "characteristics.90th_percentile_latency_us": 2998.265, "characteristics.accuracy": 43.468, "characteristics.good": 21734, "characteristics.power": 0.044879601512369055, "characteristics.power.normalized_per_core": 0.005609950189046132, "characteristics.power.normalized_per_processor": 0.044879601512369055, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-96-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-0.35-96-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_96_35.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 250, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "94fce4746389fe64", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 63751339, "90.00 percentile latency (ns)": 76286615, "90th percentile latency (ns)": 76286615, "95.00 percentile latency (ns)": 80711803, "97.00 percentile latency (ns)": 83761760, "99.00 percentile latency (ns)": 91016661, "99.90 percentile latency (ns)": 171047730, "Max latency (ns)": 201351097, "Mean latency (ns)": 64052072, "Min duration satisfied": "Yes", "Min latency (ns)": 48646093, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 15.61, "QPS w/o loadgen overhead": 15.61, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 76.286615, "characteristics.90th_percentile_latency_ns": 76286615.0, "characteristics.90th_percentile_latency_s": 0.076286615, "characteristics.90th_percentile_latency_us": 76286.615, "characteristics.accuracy": 80.676, "characteristics.good": 40338, "characteristics.power": 1.7779469701414228, "characteristics.power.normalized_per_core": 0.22224337126767785, "characteristics.power.normalized_per_processor": 1.7779469701414228, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite4-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "efficientnet-lite4-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite4.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 15.625, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "4cc28837a2cf0f40", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 10325941, "90.00 percentile latency (ns)": 13457448, "90th percentile latency (ns)": 13457448, "95.00 percentile latency (ns)": 16154810, "97.00 percentile latency (ns)": 17241113, "99.00 percentile latency (ns)": 20476250, "99.90 percentile latency (ns)": 39783919, "Max latency (ns)": 139200805, "Mean latency (ns)": 11167141, "Min duration satisfied": "Yes", "Min latency (ns)": 8860169, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 89.44, "QPS w/o loadgen overhead": 89.55, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 13.457448, "characteristics.90th_percentile_latency_ns": 13457448.0, "characteristics.90th_percentile_latency_s": 0.013457448, "characteristics.90th_percentile_latency_us": 13457.448, "characteristics.accuracy": 70.43, "characteristics.good": 35215, "characteristics.power": 0.22778440520658758, "characteristics.power.normalized_per_core": 0.028473050650823447, "characteristics.power.normalized_per_processor": 0.22778440520658758, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-large-minimalistic_224_1.0_uint8", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v3-large-minimalistic_224_1.0_uint8", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-large-minimalistic_224_1.0_uint8.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 76.9231, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "9993c1ec7cd24e18", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 8810711, "90.00 percentile latency (ns)": 13262278, "90th percentile latency (ns)": 13262278, "95.00 percentile latency (ns)": 15494316, "97.00 percentile latency (ns)": 16504859, "99.00 percentile latency (ns)": 19357341, "99.90 percentile latency (ns)": 39296597, "Max latency (ns)": 136397492, "Mean latency (ns)": 9849464, "Min duration satisfied": "Yes", "Min latency (ns)": 7473433, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 101.42, "QPS w/o loadgen overhead": 101.53, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 13.262278, "characteristics.90th_percentile_latency_ns": 13262278.0, "characteristics.90th_percentile_latency_s": 0.013262278, "characteristics.90th_percentile_latency_us": 13262.278, "characteristics.accuracy": 67.474, "characteristics.good": 33737, "characteristics.power": 0.1998490331019615, "characteristics.power.normalized_per_core": 0.024981129137745188, "characteristics.power.normalized_per_processor": 0.1998490331019615, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-192-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-0.75-192-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_192_75.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 83.3333, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "3ff2df2aa4954fda", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 8446451, "90.00 percentile latency (ns)": 10151434, "90th percentile latency (ns)": 10151434, "95.00 percentile latency (ns)": 10944666, "97.00 percentile latency (ns)": 12585929, "99.00 percentile latency (ns)": 16119733, "99.90 percentile latency (ns)": 32293832, "Max latency (ns)": 81263623, "Mean latency (ns)": 8952275, "Min duration satisfied": "Yes", "Min latency (ns)": 7197140, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 111.58, "QPS w/o loadgen overhead": 111.7, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 10.151434, "characteristics.90th_percentile_latency_ns": 10151434.0, "characteristics.90th_percentile_latency_s": 0.010151434, "characteristics.90th_percentile_latency_us": 10151.434, "characteristics.accuracy": 67.24, "characteristics.good": 33620, "characteristics.power": 0.18305887168088728, "characteristics.power.normalized_per_core": 0.02288235896011091, "characteristics.power.normalized_per_processor": 0.18305887168088728, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.75-192-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-0.75-192-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.75_192_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 90.9091, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "af44f9eb520f452e", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 5540546, "90.00 percentile latency (ns)": 8239409, "90th percentile latency (ns)": 8239409, "95.00 percentile latency (ns)": 9717285, "97.00 percentile latency (ns)": 10817187, "99.00 percentile latency (ns)": 12993417, "99.90 percentile latency (ns)": 30217515, "Max latency (ns)": 92696539, "Mean latency (ns)": 6279251, "Min duration satisfied": "Yes", "Min latency (ns)": 4636504, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 158.87, "QPS w/o loadgen overhead": 159.25, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 8.239409, "characteristics.90th_percentile_latency_ns": 8239409.0, "characteristics.90th_percentile_latency_s": 0.008239409, "characteristics.90th_percentile_latency_us": 8239.409, "characteristics.accuracy": 64.348, "characteristics.good": 32174, "characteristics.power": 0.15699302386572253, "characteristics.power.normalized_per_core": 0.019624127983215316, "characteristics.power.normalized_per_processor": 0.15699302386572253, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.5-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-0.5-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.5_224.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 142.857, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "7280fce617464ea2", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 4365493, "90.00 percentile latency (ns)": 6893874, "90th percentile latency (ns)": 6893874, "95.00 percentile latency (ns)": 8111629, "97.00 percentile latency (ns)": 9101988, "99.00 percentile latency (ns)": 11314572, "99.90 percentile latency (ns)": 26381125, "Max latency (ns)": 81638393, "Mean latency (ns)": 5068228, "Min duration satisfied": "Yes", "Min latency (ns)": 3580689, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 196.7, "QPS w/o loadgen overhead": 197.31, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 6.893874, "characteristics.90th_percentile_latency_ns": 6893874.0, "characteristics.90th_percentile_latency_s": 0.006893874, "characteristics.90th_percentile_latency_us": 6893.874, "characteristics.accuracy": 63.246, "characteristics.good": 31623, "characteristics.power": 0.1244905844552, "characteristics.power.normalized_per_core": 0.0155613230569, "characteristics.power.normalized_per_processor": 0.1244905844552, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.5-192-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-0.5-192-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.5_192.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 166.667, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "3efb944877d24592", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 3527882, "90.00 percentile latency (ns)": 5098996, "90th percentile latency (ns)": 5098996, "95.00 percentile latency (ns)": 5644430, "97.00 percentile latency (ns)": 6244660, "99.00 percentile latency (ns)": 9220075, "99.90 percentile latency (ns)": 26543955, "Max latency (ns)": 119870983, "Mean latency (ns)": 3966579, "Min duration satisfied": "Yes", "Min latency (ns)": 2913010, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 251.26, "QPS w/o loadgen overhead": 252.11, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 5.098996, "characteristics.90th_percentile_latency_ns": 5098996.0, "characteristics.90th_percentile_latency_s": 0.005098996, "characteristics.90th_percentile_latency_us": 5098.996, "characteristics.accuracy": 61.668, "characteristics.good": 30834, "characteristics.power": 0.09345928420002496, "characteristics.power.normalized_per_core": 0.01168241052500312, "characteristics.power.normalized_per_processor": 0.09345928420002496, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-160-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-0.5-160-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.5_160.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 166.667, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "99ea2bb54475d887", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 5850949, "90.00 percentile latency (ns)": 8744358, "90th percentile latency (ns)": 8744358, "95.00 percentile latency (ns)": 10179398, "97.00 percentile latency (ns)": 11212372, "99.00 percentile latency (ns)": 13646881, "99.90 percentile latency (ns)": 31531774, "Max latency (ns)": 79257967, "Mean latency (ns)": 6607980, "Min duration satisfied": "Yes", "Min latency (ns)": 4755924, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 150.97, "QPS w/o loadgen overhead": 151.33, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 8.744358, "characteristics.90th_percentile_latency_ns": 8744358.0, "characteristics.90th_percentile_latency_s": 0.008744358, "characteristics.90th_percentile_latency_us": 8744.358, "characteristics.accuracy": 66.384, "characteristics.good": 33192, "characteristics.power": 0.16697798679649384, "characteristics.power.normalized_per_core": 0.02087224834956173, "characteristics.power.normalized_per_processor": 0.16697798679649384, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.75-160-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-0.75-160-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.75_160.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 142.857, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "4d21a8a7e52f0adb", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 2613460, "90.00 percentile latency (ns)": 3881941, "90th percentile latency (ns)": 3881941, "95.00 percentile latency (ns)": 4463845, "97.00 percentile latency (ns)": 5076224, "99.00 percentile latency (ns)": 7736857, "99.90 percentile latency (ns)": 18208961, "Max latency (ns)": 105302971, "Mean latency (ns)": 2977990, "Min duration satisfied": "Yes", "Min latency (ns)": 2266884, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 335.15, "QPS w/o loadgen overhead": 335.8, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 3.881941, "characteristics.90th_percentile_latency_ns": 3881941.0, "characteristics.90th_percentile_latency_s": 0.003881941, "characteristics.90th_percentile_latency_us": 3881.941, "characteristics.accuracy": 49.11, "characteristics.good": 24555, "characteristics.power": 0.06009570427305037, "characteristics.power.normalized_per_core": 0.007511963034131296, "characteristics.power.normalized_per_processor": 0.06009570427305037, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-96-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-0.5-96-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_96_50.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 200, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "d854a90aa213bcb6", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 5092801, "90.00 percentile latency (ns)": 7258691, "90th percentile latency (ns)": 7258691, "95.00 percentile latency (ns)": 9254396, "97.00 percentile latency (ns)": 10704896, "99.00 percentile latency (ns)": 12977216, "99.90 percentile latency (ns)": 28647297, "Max latency (ns)": 119657356, "Mean latency (ns)": 5841650, "Min duration satisfied": "Yes", "Min latency (ns)": 4493898, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 170.93, "QPS w/o loadgen overhead": 171.18, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 7.258691, "characteristics.90th_percentile_latency_ns": 7258691.0, "characteristics.90th_percentile_latency_s": 0.007258691, "characteristics.90th_percentile_latency_us": 7258.691, "characteristics.accuracy": 62.07, "characteristics.good": 31035, "characteristics.power": 0.11446401408780302, "characteristics.power.normalized_per_core": 0.014308001760975377, "characteristics.power.normalized_per_processor": 0.11446401408780302, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-128-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-0.75-128-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_128_75.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 125, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "6c38ec7bd467f8cc", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 3510516, "90.00 percentile latency (ns)": 5990814, "90th percentile latency (ns)": 5990814, "95.00 percentile latency (ns)": 7273493, "97.00 percentile latency (ns)": 8260874, "99.00 percentile latency (ns)": 10812067, "99.90 percentile latency (ns)": 27799791, "Max latency (ns)": 131605063, "Mean latency (ns)": 4252716, "Min duration satisfied": "Yes", "Min latency (ns)": 2743608, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 234.24, "QPS w/o loadgen overhead": 235.14, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 5.990814, "characteristics.90th_percentile_latency_ns": 5990814.0, "characteristics.90th_percentile_latency_s": 0.005990814, "characteristics.90th_percentile_latency_us": 5990.814, "characteristics.accuracy": 61.224, "characteristics.good": 30612, "characteristics.power": 0.10274510724709456, "characteristics.power.normalized_per_core": 0.01284313840588682, "characteristics.power.normalized_per_processor": 0.10274510724709456, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-96-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-1.0-96-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_1.0_96.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 166.667, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "44cf381c45d3b72f", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 1638246, "90.00 percentile latency (ns)": 2394116, "90th percentile latency (ns)": 2394116, "95.00 percentile latency (ns)": 2891867, "97.00 percentile latency (ns)": 3256167, "99.00 percentile latency (ns)": 4250924, "99.90 percentile latency (ns)": 13507713, "Max latency (ns)": 74718203, "Mean latency (ns)": 1834437, "Min duration satisfied": "Yes", "Min latency (ns)": 1275382, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 543.92, "QPS w/o loadgen overhead": 545.13, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 2.394116, "characteristics.90th_percentile_latency_ns": 2394116.0, "characteristics.90th_percentile_latency_s": 0.002394116, "characteristics.90th_percentile_latency_us": 2394.116, "characteristics.accuracy": 42.384, "characteristics.good": 21192, "characteristics.power": 0.03592407381191824, "characteristics.power.normalized_per_core": 0.00449050922648978, "characteristics.power.normalized_per_processor": 0.03592407381191824, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.25-128-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-0.25-128-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.25_128_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "45a1a2d3791d1eff", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 16724110, "90.00 percentile latency (ns)": 22841394, "90th percentile latency (ns)": 22841394, "95.00 percentile latency (ns)": 24206036, "97.00 percentile latency (ns)": 25484979, "99.00 percentile latency (ns)": 31510818, "99.90 percentile latency (ns)": 48167236, "Max latency (ns)": 144601871, "Mean latency (ns)": 18074075, "Min duration satisfied": "Yes", "Min latency (ns)": 13240963, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 55.26, "QPS w/o loadgen overhead": 55.33, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 22.841394, "characteristics.90th_percentile_latency_ns": 22841394.0, "characteristics.90th_percentile_latency_s": 0.022841394, "characteristics.90th_percentile_latency_us": 22841.394, "characteristics.accuracy": 75.012, "characteristics.good": 37506, "characteristics.power": 0.4732069239849046, "characteristics.power.normalized_per_core": 0.059150865498113075, "characteristics.power.normalized_per_processor": 0.4732069239849046, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.3-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-1.3-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_1.3_224.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 58.8235, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "ad4a4b8ced20715e", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 4900052, "90.00 percentile latency (ns)": 7167834, "90th percentile latency (ns)": 7167834, "95.00 percentile latency (ns)": 9021415, "97.00 percentile latency (ns)": 10341125, "99.00 percentile latency (ns)": 12514946, "99.90 percentile latency (ns)": 28193197, "Max latency (ns)": 84466521, "Mean latency (ns)": 5604654, "Min duration satisfied": "Yes", "Min latency (ns)": 4203000, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 178.12, "QPS w/o loadgen overhead": 178.42, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 7.167834, "characteristics.90th_percentile_latency_ns": 7167834.0, "characteristics.90th_percentile_latency_s": 0.007167834, "characteristics.90th_percentile_latency_us": 7167.834, "characteristics.accuracy": 64.486, "characteristics.good": 32243, "characteristics.power": 0.1175621714582994, "characteristics.power.normalized_per_core": 0.014695271432287426, "characteristics.power.normalized_per_processor": 0.1175621714582994, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-small_224_1.0_uint8", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v3-small_224_1.0_uint8", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-small_224_1.0_uint8.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 125, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "fe4e0da6818510aa", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 23141503, "90.00 percentile latency (ns)": 31213763, "90th percentile latency (ns)": 31213763, "95.00 percentile latency (ns)": 33347777, "97.00 percentile latency (ns)": 34967082, "99.00 percentile latency (ns)": 40400819, "99.90 percentile latency (ns)": 65093580, "Max latency (ns)": 159535848, "Mean latency (ns)": 24855275, "Min duration satisfied": "Yes", "Min latency (ns)": 19252331, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 40.2, "QPS w/o loadgen overhead": 40.23, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 31.213763, "characteristics.90th_percentile_latency_ns": 31213763.0, "characteristics.90th_percentile_latency_s": 0.031213763, "characteristics.90th_percentile_latency_us": 31213.763, "characteristics.accuracy": 77.542, "characteristics.good": 38771, "characteristics.power": 0.666459757385989, "characteristics.power.normalized_per_core": 0.08330746967324862, "characteristics.power.normalized_per_processor": 0.666459757385989, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite2-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "efficientnet-lite2-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite2.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 40, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "842f898b904795bf", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 2690970, "90.00 percentile latency (ns)": 3947089, "90th percentile latency (ns)": 3947089, "95.00 percentile latency (ns)": 4564684, "97.00 percentile latency (ns)": 5205895, "99.00 percentile latency (ns)": 7363082, "99.90 percentile latency (ns)": 19382632, "Max latency (ns)": 71899824, "Mean latency (ns)": 3054344, "Min duration satisfied": "Yes", "Min latency (ns)": 2348265, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 326.88, "QPS w/o loadgen overhead": 327.4, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 3.947089, "characteristics.90th_percentile_latency_ns": 3947089.0, "characteristics.90th_percentile_latency_s": 0.003947089, "characteristics.90th_percentile_latency_us": 3947.089, "characteristics.accuracy": 56.75, "characteristics.good": 28375, "characteristics.power": 0.06088628919427135, "characteristics.power.normalized_per_core": 0.007610786149283919, "characteristics.power.normalized_per_processor": 0.06088628919427135, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.5-128-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-0.5-128-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.5_128_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 200, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "f140c8a813a29404", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 3709031, "90.00 percentile latency (ns)": 5334928, "90th percentile latency (ns)": 5334928, "95.00 percentile latency (ns)": 6123919, "97.00 percentile latency (ns)": 7181475, "99.00 percentile latency (ns)": 10110403, "99.90 percentile latency (ns)": 23339836, "Max latency (ns)": 132130634, "Mean latency (ns)": 4216725, "Min duration satisfied": "Yes", "Min latency (ns)": 3105034, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 236.84, "QPS w/o loadgen overhead": 237.15, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 5.334928, "characteristics.90th_percentile_latency_ns": 5334928.0, "characteristics.90th_percentile_latency_s": 0.005334928, "characteristics.90th_percentile_latency_us": 5334.928, "characteristics.accuracy": 57.002, "characteristics.good": 28501, "characteristics.power": 0.08386246178790381, "characteristics.power.normalized_per_core": 0.010482807723487976, "characteristics.power.normalized_per_processor": 0.08386246178790381, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-96-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-0.75-96-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_96_75.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 166.667, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "2c17d8dbfb9470f9", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 15464923, "90.00 percentile latency (ns)": 21046135, "90th percentile latency (ns)": 21046135, "95.00 percentile latency (ns)": 22797987, "97.00 percentile latency (ns)": 24176162, "99.00 percentile latency (ns)": 29478900, "99.90 percentile latency (ns)": 53922267, "Max latency (ns)": 157541099, "Mean latency (ns)": 16572887, "Min duration satisfied": "Yes", "Min latency (ns)": 13119439, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 60.28, "QPS w/o loadgen overhead": 60.34, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 21.046135, "characteristics.90th_percentile_latency_ns": 21046135.0, "characteristics.90th_percentile_latency_s": 0.021046135, "characteristics.90th_percentile_latency_us": 21046.135, "characteristics.accuracy": 75.69, "characteristics.good": 37845, "characteristics.power": 0.44725892400905154, "characteristics.power.normalized_per_core": 0.05590736550113144, "characteristics.power.normalized_per_processor": 0.44725892400905154, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.4-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-1.4-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_1.4_224.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 58.8235, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "7ce2a44861915233", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 1961458, "90.00 percentile latency (ns)": 3135782, "90th percentile latency (ns)": 3135782, "95.00 percentile latency (ns)": 4015116, "97.00 percentile latency (ns)": 4495677, "99.00 percentile latency (ns)": 6743458, "99.90 percentile latency (ns)": 19423306, "Max latency (ns)": 108674570, "Mean latency (ns)": 2311563, "Min duration satisfied": "Yes", "Min latency (ns)": 1575392, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 430.61, "QPS w/o loadgen overhead": 432.61, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 3.135782, "characteristics.90th_percentile_latency_ns": 3135782.0, "characteristics.90th_percentile_latency_s": 0.003135782, "characteristics.90th_percentile_latency_us": 3135.782, "characteristics.accuracy": 52.446, "characteristics.good": 26223, "characteristics.power": 0.05309222300663546, "characteristics.power.normalized_per_core": 0.006636527875829432, "characteristics.power.normalized_per_processor": 0.05309222300663546, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-96-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-0.5-96-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.5_96.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 250, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "bddc65e8e2fd4cae", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 8329839, "90.00 percentile latency (ns)": 10870741, "90th percentile latency (ns)": 10870741, "95.00 percentile latency (ns)": 13082354, "97.00 percentile latency (ns)": 14579438, "99.00 percentile latency (ns)": 17455318, "99.90 percentile latency (ns)": 35811343, "Max latency (ns)": 116077835, "Mean latency (ns)": 9040099, "Min duration satisfied": "Yes", "Min latency (ns)": 7282705, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 110.41, "QPS w/o loadgen overhead": 110.62, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 10.870741, "characteristics.90th_percentile_latency_ns": 10870741.0, "characteristics.90th_percentile_latency_s": 0.010870741, "characteristics.90th_percentile_latency_us": 10870.741, "characteristics.accuracy": 73.724, "characteristics.good": 36862, "characteristics.power": 0.22525088761683926, "characteristics.power.normalized_per_core": 0.028156360952104907, "characteristics.power.normalized_per_processor": 0.22525088761683926, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-large_224_0.75_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v3-large_224_0.75_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-large_224_0.75_float.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 83.3333, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "3941858e66b2e472", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 4590835, "90.00 percentile latency (ns)": 6853820, "90th percentile latency (ns)": 6853820, "95.00 percentile latency (ns)": 8131926, "97.00 percentile latency (ns)": 9103555, "99.00 percentile latency (ns)": 11757852, "99.90 percentile latency (ns)": 29801438, "Max latency (ns)": 91455473, "Mean latency (ns)": 5295949, "Min duration satisfied": "Yes", "Min latency (ns)": 4040025, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 188.21, "QPS w/o loadgen overhead": 188.82, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 6.85382, "characteristics.90th_percentile_latency_ns": 6853820.0, "characteristics.90th_percentile_latency_s": 0.00685382, "characteristics.90th_percentile_latency_us": 6853.82, "characteristics.accuracy": 66.604, "characteristics.good": 33302, "characteristics.power": 0.14167277673286782, "characteristics.power.normalized_per_core": 0.017709097091608478, "characteristics.power.normalized_per_processor": 0.14167277673286782, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-1.0-128-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-1.0-128-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_1.0_128.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 166.667, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "95b5349818a46cb3", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 7536536, "90.00 percentile latency (ns)": 10020328, "90th percentile latency (ns)": 10020328, "95.00 percentile latency (ns)": 11864028, "97.00 percentile latency (ns)": 13036786, "99.00 percentile latency (ns)": 15834801, "99.90 percentile latency (ns)": 34042350, "Max latency (ns)": 81855822, "Mean latency (ns)": 8146372, "Min duration satisfied": "Yes", "Min latency (ns)": 6472263, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 122.46, "QPS w/o loadgen overhead": 122.75, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 10.020328, "characteristics.90th_percentile_latency_ns": 10020328.0, "characteristics.90th_percentile_latency_s": 0.010020328, "characteristics.90th_percentile_latency_us": 10020.328, "characteristics.accuracy": 69.106, "characteristics.good": 34553, "characteristics.power": 0.2151598292831635, "characteristics.power.normalized_per_core": 0.026894978660395436, "characteristics.power.normalized_per_processor": 0.2151598292831635, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-1.0-160-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-1.0-160-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_1.0_160.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 111.111, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "bc7f3104586beade", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 3129905, "90.00 percentile latency (ns)": 5096845, "90th percentile latency (ns)": 5096845, "95.00 percentile latency (ns)": 6165277, "97.00 percentile latency (ns)": 7178828, "99.00 percentile latency (ns)": 9902378, "99.90 percentile latency (ns)": 27056758, "Max latency (ns)": 118466272, "Mean latency (ns)": 3718475, "Min duration satisfied": "Yes", "Min latency (ns)": 2310763, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 267.97, "QPS w/o loadgen overhead": 268.93, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 5.096845, "characteristics.90th_percentile_latency_ns": 5096845.0, "characteristics.90th_percentile_latency_s": 0.005096845, "characteristics.90th_percentile_latency_us": 5096.845, "characteristics.accuracy": 59.822, "characteristics.good": 29911, "characteristics.power": 0.08515786651938599, "characteristics.power.normalized_per_core": 0.010644733314923249, "characteristics.power.normalized_per_processor": 0.08515786651938599, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-96-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-0.75-96-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.75_96.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 166.667, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "324dbad3641beb55", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 4726689, "90.00 percentile latency (ns)": 6070641, "90th percentile latency (ns)": 6070641, "95.00 percentile latency (ns)": 7117619, "97.00 percentile latency (ns)": 8207291, "99.00 percentile latency (ns)": 11350114, "99.90 percentile latency (ns)": 27219152, "Max latency (ns)": 122064324, "Mean latency (ns)": 5174687, "Min duration satisfied": "Yes", "Min latency (ns)": 4133674, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 192.67, "QPS w/o loadgen overhead": 193.25, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 6.070641, "characteristics.90th_percentile_latency_ns": 6070641.0, "characteristics.90th_percentile_latency_s": 0.006070641, "characteristics.90th_percentile_latency_us": 6070.641, "characteristics.accuracy": 68.336, "characteristics.good": 34168, "characteristics.power": 0.12228502325195159, "characteristics.power.normalized_per_core": 0.015285627906493949, "characteristics.power.normalized_per_processor": 0.12228502325195159, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-small_224_1.0_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v3-small_224_1.0_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-small_224_1.0_float.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 142.857, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "08af2a22a14371a6", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 7184235, "90.00 percentile latency (ns)": 11062079, "90th percentile latency (ns)": 11062079, "95.00 percentile latency (ns)": 12490657, "97.00 percentile latency (ns)": 13423082, "99.00 percentile latency (ns)": 16395381, "99.90 percentile latency (ns)": 34629373, "Max latency (ns)": 126881056, "Mean latency (ns)": 8071022, "Min duration satisfied": "Yes", "Min latency (ns)": 5572256, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 123.65, "QPS w/o loadgen overhead": 123.9, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 11.062079, "characteristics.90th_percentile_latency_ns": 11062079.0, "characteristics.90th_percentile_latency_s": 0.011062079, "characteristics.90th_percentile_latency_us": 11062.079, "characteristics.accuracy": 68.834, "characteristics.good": 34417, "characteristics.power": 0.20151882763975165, "characteristics.power.normalized_per_core": 0.025189853454968957, "characteristics.power.normalized_per_processor": 0.20151882763975165, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-192-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-0.75-192-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.75_192.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 100, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "afe41c19c99c1794", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 15548639, "90.00 percentile latency (ns)": 22814981, "90th percentile latency (ns)": 22814981, "95.00 percentile latency (ns)": 26046171, "97.00 percentile latency (ns)": 28580587, "99.00 percentile latency (ns)": 32060569, "99.90 percentile latency (ns)": 53223086, "Max latency (ns)": 116097645, "Mean latency (ns)": 17228375, "Min duration satisfied": "Yes", "Min latency (ns)": 12672201, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 57.99, "QPS w/o loadgen overhead": 58.04, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 22.814981, "characteristics.90th_percentile_latency_ns": 22814981.0, "characteristics.90th_percentile_latency_s": 0.022814981, "characteristics.90th_percentile_latency_us": 22814.981, "characteristics.accuracy": 71.19, "characteristics.good": 35595, "characteristics.power": 0.36032495861498115, "characteristics.power.normalized_per_core": 0.045040619826872644, "characteristics.power.normalized_per_processor": 0.36032495861498115, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite0-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "efficientnet-lite0-quantized", "input_data_types": "uint8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite0.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 52.6316, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "dae6bba263b0633f", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 37212736, "90.00 percentile latency (ns)": 47939220, "90th percentile latency (ns)": 47939220, "95.00 percentile latency (ns)": 50026309, "97.00 percentile latency (ns)": 51663493, "99.00 percentile latency (ns)": 59581559, "99.90 percentile latency (ns)": 112591195, "Max latency (ns)": 180817905, "Mean latency (ns)": 39322589, "Min duration satisfied": "Yes", "Min latency (ns)": 29585939, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 25.42, "QPS w/o loadgen overhead": 25.43, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 47.93922, "characteristics.90th_percentile_latency_ns": 47939220.0, "characteristics.90th_percentile_latency_s": 0.04793922, "characteristics.90th_percentile_latency_us": 47939.22, "characteristics.accuracy": 79.268, "characteristics.good": 39634, "characteristics.power": 1.0711029627764492, "characteristics.power.normalized_per_core": 0.13388787034705615, "characteristics.power.normalized_per_processor": 1.0711029627764492, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite3-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "efficientnet-lite3-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite3.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 28.5714, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "d1d4ca0b9474c930", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 4405241, "90.00 percentile latency (ns)": 5623270, "90th percentile latency (ns)": 5623270, "95.00 percentile latency (ns)": 6657477, "97.00 percentile latency (ns)": 7591962, "99.00 percentile latency (ns)": 10811891, "99.90 percentile latency (ns)": 26974855, "Max latency (ns)": 107788566, "Mean latency (ns)": 4837098, "Min duration satisfied": "Yes", "Min latency (ns)": 3874619, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 206.1, "QPS w/o loadgen overhead": 206.74, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 5.62327, "characteristics.90th_percentile_latency_ns": 5623270.0, "characteristics.90th_percentile_latency_s": 0.00562327, "characteristics.90th_percentile_latency_us": 5623.27, "characteristics.accuracy": 66.216, "characteristics.good": 33108, "characteristics.power": 0.11037303897784252, "characteristics.power.normalized_per_core": 0.013796629872230315, "characteristics.power.normalized_per_processor": 0.11037303897784252, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-small_224_0.75_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v3-small_224_0.75_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-small_224_0.75_float.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 142.857, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "f5a082d0af01c8c2", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 48000961, "90.00 percentile latency (ns)": 59108080, "90th percentile latency (ns)": 59108080, "95.00 percentile latency (ns)": 61944471, "97.00 percentile latency (ns)": 64115036, "99.00 percentile latency (ns)": 71086374, "99.90 percentile latency (ns)": 123854891, "Max latency (ns)": 169733581, "Mean latency (ns)": 49883475, "Min duration satisfied": "Yes", "Min latency (ns)": 39359594, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 20.04, "QPS w/o loadgen overhead": 20.05, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 59.10808, "characteristics.90th_percentile_latency_ns": 59108080.0, "characteristics.90th_percentile_latency_s": 0.05910808, "characteristics.90th_percentile_latency_us": 59108.08, "characteristics.accuracy": 76.344, "characteristics.good": 38172, "characteristics.power": 1.0463688922161536, "characteristics.power.normalized_per_core": 0.1307961115270192, "characteristics.power.normalized_per_processor": 1.0463688922161536, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite3-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "efficientnet-lite3-quantized", "input_data_types": "uint8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite3.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 20, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "3a6628ccc04729b9", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 3630537, "90.00 percentile latency (ns)": 5116846, "90th percentile latency (ns)": 5116846, "95.00 percentile latency (ns)": 5861774, "97.00 percentile latency (ns)": 7152139, "99.00 percentile latency (ns)": 10289950, "99.90 percentile latency (ns)": 22474325, "Max latency (ns)": 107298300, "Mean latency (ns)": 4095315, "Min duration satisfied": "Yes", "Min latency (ns)": 3041709, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 243.82, "QPS w/o loadgen overhead": 244.18, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 5.116846, "characteristics.90th_percentile_latency_ns": 5116846.0, "characteristics.90th_percentile_latency_s": 0.005116846, "characteristics.90th_percentile_latency_us": 5116.846, "characteristics.accuracy": 54.568, "characteristics.good": 27284, "characteristics.power": 0.0817724550898204, "characteristics.power.normalized_per_core": 0.01022155688622755, "characteristics.power.normalized_per_processor": 0.0817724550898204, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-160-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-0.35-160-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_160_35.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 142.857, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "09b6f7ec55ffcb71", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 2501413, "90.00 percentile latency (ns)": 3277252, "90th percentile latency (ns)": 3277252, "95.00 percentile latency (ns)": 3731992, "97.00 percentile latency (ns)": 4267656, "99.00 percentile latency (ns)": 5986151, "99.90 percentile latency (ns)": 17350855, "Max latency (ns)": 86733421, "Mean latency (ns)": 2730931, "Min duration satisfied": "Yes", "Min latency (ns)": 2120819, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 365.22, "QPS w/o loadgen overhead": 366.18, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 3.277252, "characteristics.90th_percentile_latency_ns": 3277252.0, "characteristics.90th_percentile_latency_s": 0.003277252, "characteristics.90th_percentile_latency_us": 3277.252, "characteristics.accuracy": 49.478, "characteristics.good": 24739, "characteristics.power": 0.061797771011651535, "characteristics.power.normalized_per_core": 0.007724721376456442, "characteristics.power.normalized_per_processor": 0.061797771011651535, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.25-192-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-0.25-192-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.25_192.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 250, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "d9c34a2a8f5add30", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 10585532, "90.00 percentile latency (ns)": 12770514, "90th percentile latency (ns)": 12770514, "95.00 percentile latency (ns)": 15206411, "97.00 percentile latency (ns)": 16584117, "99.00 percentile latency (ns)": 19307427, "99.90 percentile latency (ns)": 40651492, "Max latency (ns)": 92449624, "Mean latency (ns)": 11226998, "Min duration satisfied": "Yes", "Min latency (ns)": 9133625, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 88.99, "QPS w/o loadgen overhead": 89.07, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 12.770514, "characteristics.90th_percentile_latency_ns": 12770514.0, "characteristics.90th_percentile_latency_s": 0.012770514, "characteristics.90th_percentile_latency_us": 12770.514, "characteristics.accuracy": 68.126, "characteristics.good": 34063, "characteristics.power": 0.22981290378406552, "characteristics.power.normalized_per_core": 0.02872661297300819, "characteristics.power.normalized_per_processor": 0.22981290378406552, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.75-224-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-0.75-224-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.75_224_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 76.9231, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "5402761c341278f0", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 10797839, "90.00 percentile latency (ns)": 15940268, "90th percentile latency (ns)": 15940268, "95.00 percentile latency (ns)": 17383854, "97.00 percentile latency (ns)": 18298840, "99.00 percentile latency (ns)": 22575078, "99.90 percentile latency (ns)": 40797362, "Max latency (ns)": 142581766, "Mean latency (ns)": 11984913, "Min duration satisfied": "Yes", "Min latency (ns)": 8960269, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 83.32, "QPS w/o loadgen overhead": 83.44, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 15.940268, "characteristics.90th_percentile_latency_ns": 15940268.0, "characteristics.90th_percentile_latency_s": 0.015940268, "characteristics.90th_percentile_latency_us": 15940.268, "characteristics.accuracy": 75.76, "characteristics.good": 37880, "characteristics.power": 0.30112926675676444, "characteristics.power.normalized_per_core": 0.037641158344595554, "characteristics.power.normalized_per_processor": 0.30112926675676444, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-large_224_1.0_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v3-large_224_1.0_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-large_224_1.0_float.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 76.9231, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "14f6b900d0244ebc", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 5652875, "90.00 percentile latency (ns)": 7659301, "90th percentile latency (ns)": 7659301, "95.00 percentile latency (ns)": 9181394, "97.00 percentile latency (ns)": 10583316, "99.00 percentile latency (ns)": 13377745, "99.90 percentile latency (ns)": 29638953, "Max latency (ns)": 125500503, "Mean latency (ns)": 6267894, "Min duration satisfied": "Yes", "Min latency (ns)": 4845056, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 159.14, "QPS w/o loadgen overhead": 159.54, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 7.659301, "characteristics.90th_percentile_latency_ns": 7659301.0, "characteristics.90th_percentile_latency_s": 0.007659301, "characteristics.90th_percentile_latency_us": 7659.301, "characteristics.accuracy": 65.75, "characteristics.good": 32875, "characteristics.power": 0.15090590524545325, "characteristics.power.normalized_per_core": 0.018863238155681656, "characteristics.power.normalized_per_processor": 0.15090590524545325, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-0.5-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.5_224.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 142.857, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "c846f582c840d870", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 7005742, "90.00 percentile latency (ns)": 9184729, "90th percentile latency (ns)": 9184729, "95.00 percentile latency (ns)": 11226168, "97.00 percentile latency (ns)": 12639710, "99.00 percentile latency (ns)": 15337657, "99.90 percentile latency (ns)": 33539216, "Max latency (ns)": 79155877, "Mean latency (ns)": 7634506, "Min duration satisfied": "Yes", "Min latency (ns)": 5847607, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 130.79, "QPS w/o loadgen overhead": 130.98, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 9.184729, "characteristics.90th_percentile_latency_ns": 9184729.0, "characteristics.90th_percentile_latency_s": 0.009184729, "characteristics.90th_percentile_latency_us": 9184.729, "characteristics.accuracy": 64.768, "characteristics.good": 32384, "characteristics.power": 0.1556591633725064, "characteristics.power.normalized_per_core": 0.0194573954215633, "characteristics.power.normalized_per_processor": 0.1556591633725064, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-1.0-128-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-1.0-128-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_1.0_128_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 111.111, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "5284afd64c5bb131", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 9022807, "90.00 percentile latency (ns)": 13695322, "90th percentile latency (ns)": 13695322, "95.00 percentile latency (ns)": 15096466, "97.00 percentile latency (ns)": 15996122, "99.00 percentile latency (ns)": 20128454, "99.90 percentile latency (ns)": 37414771, "Max latency (ns)": 133446223, "Mean latency (ns)": 10139688, "Min duration satisfied": "Yes", "Min latency (ns)": 7265133, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 98.45, "QPS w/o loadgen overhead": 98.62, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 13.695322, "characteristics.90th_percentile_latency_ns": 13695322.0, "characteristics.90th_percentile_latency_s": 0.013695322, "characteristics.90th_percentile_latency_us": 13695.322, "characteristics.accuracy": 70.122, "characteristics.good": 35061, "characteristics.power": 0.25184860907402956, "characteristics.power.normalized_per_core": 0.031481076134253695, "characteristics.power.normalized_per_processor": 0.25184860907402956, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-0.75-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.75_224.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 90.9091, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "17b7049d89691b63", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 6292066, "90.00 percentile latency (ns)": 8373174, "90th percentile latency (ns)": 8373174, "95.00 percentile latency (ns)": 10259658, "97.00 percentile latency (ns)": 11653292, "99.00 percentile latency (ns)": 13798485, "99.90 percentile latency (ns)": 29061929, "Max latency (ns)": 74114720, "Mean latency (ns)": 6968849, "Min duration satisfied": "Yes", "Min latency (ns)": 5517718, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 143.32, "QPS w/o loadgen overhead": 143.5, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 8.373174, "characteristics.90th_percentile_latency_ns": 8373174.0, "characteristics.90th_percentile_latency_s": 0.008373174, "characteristics.90th_percentile_latency_us": 8373.174, "characteristics.accuracy": 64.08, "characteristics.good": 32040, "characteristics.power": 0.1415159697559593, "characteristics.power.normalized_per_core": 0.01768949621949491, "characteristics.power.normalized_per_processor": 0.1415159697559593, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.75-160-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-0.75-160-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.75_160_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 111.111, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "2614e8db213118d4", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 5041484, "90.00 percentile latency (ns)": 7466022, "90th percentile latency (ns)": 7466022, "95.00 percentile latency (ns)": 8867814, "97.00 percentile latency (ns)": 9945465, "99.00 percentile latency (ns)": 12317130, "99.90 percentile latency (ns)": 29017584, "Max latency (ns)": 117524865, "Mean latency (ns)": 5673049, "Min duration satisfied": "Yes", "Min latency (ns)": 4022145, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 175.85, "QPS w/o loadgen overhead": 176.27, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 7.466022, "characteristics.90th_percentile_latency_ns": 7466022.0, "characteristics.90th_percentile_latency_s": 0.007466022, "characteristics.90th_percentile_latency_us": 7466.022, "characteristics.accuracy": 64.282, "characteristics.good": 32141, "characteristics.power": 0.13143557693765826, "characteristics.power.normalized_per_core": 0.016429447117207282, "characteristics.power.normalized_per_processor": 0.13143557693765826, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-192-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-0.5-192-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.5_192.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 142.857, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "35e93647f2979d97", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 8724291, "90.00 percentile latency (ns)": 13120734, "90th percentile latency (ns)": 13120734, "95.00 percentile latency (ns)": 14638053, "97.00 percentile latency (ns)": 15580947, "99.00 percentile latency (ns)": 19400276, "99.90 percentile latency (ns)": 37184911, "Max latency (ns)": 134644753, "Mean latency (ns)": 9739318, "Min duration satisfied": "Yes", "Min latency (ns)": 7056600, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 102.49, "QPS w/o loadgen overhead": 102.68, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 13.120734, "characteristics.90th_percentile_latency_ns": 13120734.0, "characteristics.90th_percentile_latency_s": 0.013120734, "characteristics.90th_percentile_latency_us": 13120.734, "characteristics.accuracy": 72.678, "characteristics.good": 36339, "characteristics.power": 0.24285021986313823, "characteristics.power.normalized_per_core": 0.03035627748289228, "characteristics.power.normalized_per_processor": 0.24285021986313823, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-large-minimalistic_224_1.0_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v3-large-minimalistic_224_1.0_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-large-minimalistic_224_1.0_float.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 90.9091, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "f94a2427a89e1af7", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 6705487, "90.00 percentile latency (ns)": 10261327, "90th percentile latency (ns)": 10261327, "95.00 percentile latency (ns)": 12765666, "97.00 percentile latency (ns)": 13826000, "99.00 percentile latency (ns)": 15787880, "99.90 percentile latency (ns)": 32885455, "Max latency (ns)": 125173117, "Mean latency (ns)": 7633632, "Min duration satisfied": "Yes", "Min latency (ns)": 5751780, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 130.83, "QPS w/o loadgen overhead": 131.0, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 10.261327, "characteristics.90th_percentile_latency_ns": 10261327.0, "characteristics.90th_percentile_latency_s": 0.010261327, "characteristics.90th_percentile_latency_us": 10261.327, "characteristics.accuracy": 64.972, "characteristics.good": 32486, "characteristics.power": 0.15442211317735852, "characteristics.power.normalized_per_core": 0.019302764147169815, "characteristics.power.normalized_per_processor": 0.15442211317735852, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-160-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-0.75-160-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_160_75.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 100, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "3e2144e1f82716c6", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 11425473, "90.00 percentile latency (ns)": 16676588, "90th percentile latency (ns)": 16676588, "95.00 percentile latency (ns)": 18071019, "97.00 percentile latency (ns)": 19099161, "99.00 percentile latency (ns)": 23715208, "99.90 percentile latency (ns)": 48870165, "Max latency (ns)": 168200761, "Mean latency (ns)": 12604965, "Min duration satisfied": "Yes", "Min latency (ns)": 8956146, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 79.21, "QPS w/o loadgen overhead": 79.33, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 16.676588, "characteristics.90th_percentile_latency_ns": 16676588.0, "characteristics.90th_percentile_latency_s": 0.016676588, "characteristics.90th_percentile_latency_us": 16676.588, "characteristics.accuracy": 71.77, "characteristics.good": 35885, "characteristics.power": 0.3230559697080259, "characteristics.power.normalized_per_core": 0.04038199621350324, "characteristics.power.normalized_per_processor": 0.3230559697080259, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-1.0-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_1.0_224.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 90.9091, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "f746e58f5ebbdb3a", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 5342410, "90.00 percentile latency (ns)": 8618986, "90th percentile latency (ns)": 8618986, "95.00 percentile latency (ns)": 10212894, "97.00 percentile latency (ns)": 11343877, "99.00 percentile latency (ns)": 13594420, "99.90 percentile latency (ns)": 31036232, "Max latency (ns)": 130546550, "Mean latency (ns)": 6256980, "Min duration satisfied": "Yes", "Min latency (ns)": 4293604, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 159.39, "QPS w/o loadgen overhead": 159.82, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 8.618986, "characteristics.90th_percentile_latency_ns": 8618986.0, "characteristics.90th_percentile_latency_s": 0.008618986, "characteristics.90th_percentile_latency_us": 8618.986, "characteristics.accuracy": 66.75, "characteristics.good": 33375, "characteristics.power": 0.15159491484307025, "characteristics.power.normalized_per_core": 0.01894936435538378, "characteristics.power.normalized_per_processor": 0.15159491484307025, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-160-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-0.75-160-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.75_160.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 125, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "b684259b0c1903b2", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 1773711, "90.00 percentile latency (ns)": 2650712, "90th percentile latency (ns)": 2650712, "95.00 percentile latency (ns)": 3560000, "97.00 percentile latency (ns)": 3873199, "99.00 percentile latency (ns)": 5433365, "99.90 percentile latency (ns)": 18785197, "Max latency (ns)": 89497696, "Mean latency (ns)": 2034427, "Min duration satisfied": "Yes", "Min latency (ns)": 1345853, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 489.57, "QPS w/o loadgen overhead": 491.54, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 2.650712, "characteristics.90th_percentile_latency_ns": 2650712.0, "characteristics.90th_percentile_latency_s": 0.002650712, "characteristics.90th_percentile_latency_us": 2650.712, "characteristics.accuracy": 47.14, "characteristics.good": 23570, "characteristics.power": 0.04308407972901672, "characteristics.power.normalized_per_core": 0.00538550996612709, "characteristics.power.normalized_per_processor": 0.04308407972901672, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-96-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-0.35-96-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.35_96.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 250, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "e2f28b1a49978070", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 2956035, "90.00 percentile latency (ns)": 4418372, "90th percentile latency (ns)": 4418372, "95.00 percentile latency (ns)": 5054113, "97.00 percentile latency (ns)": 5663004, "99.00 percentile latency (ns)": 8560222, "99.90 percentile latency (ns)": 23244069, "Max latency (ns)": 103654710, "Mean latency (ns)": 3353959, "Min duration satisfied": "Yes", "Min latency (ns)": 2416011, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 296.99, "QPS w/o loadgen overhead": 298.16, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 4.418372, "characteristics.90th_percentile_latency_ns": 4418372.0, "characteristics.90th_percentile_latency_s": 0.004418372, "characteristics.90th_percentile_latency_us": 4418.372, "characteristics.accuracy": 56.988, "characteristics.good": 28494, "characteristics.power": 0.07696243981278829, "characteristics.power.normalized_per_core": 0.009620304976598536, "characteristics.power.normalized_per_processor": 0.07696243981278829, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-160-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-0.35-160-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.35_160.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 200, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "7b98196e47bb8287", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 3633383, "90.00 percentile latency (ns)": 5577377, "90th percentile latency (ns)": 5577377, "95.00 percentile latency (ns)": 6650802, "97.00 percentile latency (ns)": 7561692, "99.00 percentile latency (ns)": 9975435, "99.90 percentile latency (ns)": 26043727, "Max latency (ns)": 73759585, "Mean latency (ns)": 4235892, "Min duration satisfied": "Yes", "Min latency (ns)": 3121776, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 235.16, "QPS w/o loadgen overhead": 236.08, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 5.577377, "characteristics.90th_percentile_latency_ns": 5577377.0, "characteristics.90th_percentile_latency_s": 0.005577377, "characteristics.90th_percentile_latency_us": 5577.377, "characteristics.accuracy": 63.716, "characteristics.good": 31858, "characteristics.power": 0.10851625843397397, "characteristics.power.normalized_per_core": 0.013564532304246747, "characteristics.power.normalized_per_processor": 0.10851625843397397, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.75-128-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-0.75-128-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.75_128.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 166.667, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "879870cb74f6d984", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 3368697, "90.00 percentile latency (ns)": 4727221, "90th percentile latency (ns)": 4727221, "95.00 percentile latency (ns)": 5263181, "97.00 percentile latency (ns)": 5827690, "99.00 percentile latency (ns)": 8678150, "99.90 percentile latency (ns)": 22506781, "Max latency (ns)": 117154503, "Mean latency (ns)": 3757035, "Min duration satisfied": "Yes", "Min latency (ns)": 2794846, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 265.7, "QPS w/o loadgen overhead": 266.17, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 4.727221, "characteristics.90th_percentile_latency_ns": 4727221.0, "characteristics.90th_percentile_latency_s": 0.004727221, "characteristics.90th_percentile_latency_us": 4727.221, "characteristics.accuracy": 55.54, "characteristics.good": 27770, "characteristics.power": 0.07446426241519126, "characteristics.power.normalized_per_core": 0.009308032801898907, "characteristics.power.normalized_per_processor": 0.07446426241519126, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-128-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-0.5-128-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_128_50.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 166.667, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "93f909fc433f4bb5", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 3849786, "90.00 percentile latency (ns)": 5387489, "90th percentile latency (ns)": 5387489, "95.00 percentile latency (ns)": 6406485, "97.00 percentile latency (ns)": 7427270, "99.00 percentile latency (ns)": 10357904, "99.90 percentile latency (ns)": 25522997, "Max latency (ns)": 136669675, "Mean latency (ns)": 4344322, "Min duration satisfied": "Yes", "Min latency (ns)": 3260443, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 229.44, "QPS w/o loadgen overhead": 230.19, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 5.387489, "characteristics.90th_percentile_latency_ns": 5387489.0, "characteristics.90th_percentile_latency_s": 0.005387489, "characteristics.90th_percentile_latency_us": 5387.489, "characteristics.accuracy": 59.322, "characteristics.good": 29661, "characteristics.power": 0.09920712094004426, "characteristics.power.normalized_per_core": 0.012400890117505533, "characteristics.power.normalized_per_processor": 0.09920712094004426, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-192-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-0.35-192-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.35_192.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 166.667, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "aea666e4a3f9223b", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 30469794, "90.00 percentile latency (ns)": 104486530, "90th percentile latency (ns)": 104486530, "95.00 percentile latency (ns)": 120078260, "97.00 percentile latency (ns)": 124319548, "99.00 percentile latency (ns)": 131195289, "99.90 percentile latency (ns)": 140987109, "Max latency (ns)": 157011839, "Mean latency (ns)": 45263185, "Min duration satisfied": "Yes", "Min latency (ns)": 29046462, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 22.07, "QPS w/o loadgen overhead": 22.09, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 104.48653, "characteristics.90th_percentile_latency_ns": 104486530.0, "characteristics.90th_percentile_latency_s": 0.10448653, "characteristics.90th_percentile_latency_us": 104486.53, "characteristics.accuracy": 68.242, "characteristics.good": 34121, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.75-192-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.75-192-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.75_192.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 18.5185, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "2184a528397f0cfd", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 40567550, "90.00 percentile latency (ns)": 136545072, "90th percentile latency (ns)": 136545072, "95.00 percentile latency (ns)": 193013373, "97.00 percentile latency (ns)": 202012504, "99.00 percentile latency (ns)": 210668304, "99.90 percentile latency (ns)": 220430705, "Max latency (ns)": 227976863, "Mean latency (ns)": 61607395, "Min duration satisfied": "Yes", "Min latency (ns)": 37231459, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 16.23, "QPS w/o loadgen overhead": 16.23, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 136.545072, "characteristics.90th_percentile_latency_ns": 136545072.0, "characteristics.90th_percentile_latency_s": 0.136545072, "characteristics.90th_percentile_latency_us": 136545.072, "characteristics.accuracy": 70.738, "characteristics.good": 35369, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-192-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-1.0-192-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_1.0_192.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 14.2857, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "ffdf44c3a89679e8", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 324260412, "90.00 percentile latency (ns)": 416209128, "90th percentile latency (ns)": 416209128, "95.00 percentile latency (ns)": 433856470, "97.00 percentile latency (ns)": 440011178, "99.00 percentile latency (ns)": 455279870, "99.90 percentile latency (ns)": 473264667, "Max latency (ns)": 476895076, "Mean latency (ns)": 305669961, "Min duration satisfied": "Yes", "Min latency (ns)": 178695293, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 3.27, "QPS w/o loadgen overhead": 3.27, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 416.209128, "characteristics.90th_percentile_latency_ns": 416209128.0, "characteristics.90th_percentile_latency_s": 0.416209128, "characteristics.90th_percentile_latency_us": 416209.128, "characteristics.accuracy": 78.514, "characteristics.good": 39257, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite4-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "efficientnet-lite4-quantized", "input_data_types": "uint8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite4.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 3.3557, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "bdf467480c1f41a4", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 13528391, "90.00 percentile latency (ns)": 19582815, "90th percentile latency (ns)": 19582815, "95.00 percentile latency (ns)": 35533208, "97.00 percentile latency (ns)": 54296231, "99.00 percentile latency (ns)": 149126253, "99.90 percentile latency (ns)": 185098806, "Max latency (ns)": 202497228, "Mean latency (ns)": 18015005, "Min duration satisfied": "Yes", "Min latency (ns)": 13010682, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 55.37, "QPS w/o loadgen overhead": 55.51, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 19.582815, "characteristics.90th_percentile_latency_ns": 19582815.0, "characteristics.90th_percentile_latency_s": 0.019582815, "characteristics.90th_percentile_latency_us": 19582.815, "characteristics.accuracy": 63.542, "characteristics.good": 31771, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-224-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.5-224-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_224_50.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 38.4615, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "1b6bfb13e4dc98a3", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 10213005, "90.00 percentile latency (ns)": 71072321, "90th percentile latency (ns)": 71072321, "95.00 percentile latency (ns)": 122850958, "97.00 percentile latency (ns)": 149072712, "99.00 percentile latency (ns)": 165629398, "99.90 percentile latency (ns)": 178656305, "Max latency (ns)": 204399481, "Mean latency (ns)": 24784573, "Min duration satisfied": "Yes", "Min latency (ns)": 8405253, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 40.28, "QPS w/o loadgen overhead": 40.35, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 71.072321, "characteristics.90th_percentile_latency_ns": 71072321.0, "characteristics.90th_percentile_latency_s": 0.071072321, "characteristics.90th_percentile_latency_us": 71072.321, "characteristics.accuracy": 52.172, "characteristics.good": 26086, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-128-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.35-128-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.35_128.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 38.4615, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "44b3846c0750b0aa", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 19576646, "90.00 percentile latency (ns)": 152375822, "90th percentile latency (ns)": 152375822, "95.00 percentile latency (ns)": 168325695, "97.00 percentile latency (ns)": 173458124, "99.00 percentile latency (ns)": 180401950, "99.90 percentile latency (ns)": 193479425, "Max latency (ns)": 207864628, "Mean latency (ns)": 50274458, "Min duration satisfied": "Yes", "Min latency (ns)": 10450992, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 19.87, "QPS w/o loadgen overhead": 19.89, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 152.375822, "characteristics.90th_percentile_latency_ns": 152375822.0, "characteristics.90th_percentile_latency_s": 0.152375822, "characteristics.90th_percentile_latency_us": 152375.822, "characteristics.accuracy": 58.402, "characteristics.good": 29201, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-128-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.5-128-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.5_128.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 16.3934, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "17871704d54a01b6", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 21261351, "90.00 percentile latency (ns)": 118634059, "90th percentile latency (ns)": 118634059, "95.00 percentile latency (ns)": 172336421, "97.00 percentile latency (ns)": 180496403, "99.00 percentile latency (ns)": 188827033, "99.90 percentile latency (ns)": 199542401, "Max latency (ns)": 209096039, "Mean latency (ns)": 42982582, "Min duration satisfied": "Yes", "Min latency (ns)": 19823441, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 23.25, "QPS w/o loadgen overhead": 23.27, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 118.634059, "characteristics.90th_percentile_latency_ns": 118634059.0, "characteristics.90th_percentile_latency_s": 0.118634059, "characteristics.90th_percentile_latency_us": 118634.059, "characteristics.accuracy": 60.976, "characteristics.good": 30488, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.35-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.35_224.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 15.873, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "44f12afaab8fc416", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 4947540, "90.00 percentile latency (ns)": 5219082, "90th percentile latency (ns)": 5219082, "95.00 percentile latency (ns)": 6182164, "97.00 percentile latency (ns)": 7044331, "99.00 percentile latency (ns)": 29754655, "99.90 percentile latency (ns)": 92626258, "Max latency (ns)": 107109913, "Mean latency (ns)": 5504405, "Min duration satisfied": "Yes", "Min latency (ns)": 3904832, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 180.71, "QPS w/o loadgen overhead": 181.67, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 5.219082, "characteristics.90th_percentile_latency_ns": 5219082.0, "characteristics.90th_percentile_latency_s": 0.005219082, "characteristics.90th_percentile_latency_us": 5219.082, "characteristics.accuracy": 48.162, "characteristics.good": 24081, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.25-192-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.25-192-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.25_192_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 200, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "b114674a8b4261ac", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 74152147, "90.00 percentile latency (ns)": 149194463, "90th percentile latency (ns)": 149194463, "95.00 percentile latency (ns)": 196076656, "97.00 percentile latency (ns)": 205041062, "99.00 percentile latency (ns)": 214697846, "99.90 percentile latency (ns)": 223914862, "Max latency (ns)": 228916589, "Mean latency (ns)": 87843985, "Min duration satisfied": "Yes", "Min latency (ns)": 63649237, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 11.38, "QPS w/o loadgen overhead": 11.38, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 149.194463, "characteristics.90th_percentile_latency_ns": 149194463.0, "characteristics.90th_percentile_latency_s": 0.149194463, "characteristics.90th_percentile_latency_us": 149194.463, "characteristics.accuracy": 75.068, "characteristics.good": 37534, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite0-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "efficientnet-lite0-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite0.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 10.8696, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "a4cec8fc1293ee28", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 5445188, "90.00 percentile latency (ns)": 6685614, "90th percentile latency (ns)": 6685614, "95.00 percentile latency (ns)": 9236543, "97.00 percentile latency (ns)": 22088027, "99.00 percentile latency (ns)": 80195437, "99.90 percentile latency (ns)": 98101453, "Max latency (ns)": 110506728, "Mean latency (ns)": 7363468, "Min duration satisfied": "Yes", "Min latency (ns)": 4988116, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 135.23, "QPS w/o loadgen overhead": 135.81, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 6.685614, "characteristics.90th_percentile_latency_ns": 6685614.0, "characteristics.90th_percentile_latency_s": 0.006685614, "characteristics.90th_percentile_latency_us": 6685.614, "characteristics.accuracy": 50.242, "characteristics.good": 25121, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.25-224-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.25-224-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.25_224_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 142.857, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "d8540eca3f1a1e95", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 19889070, "90.00 percentile latency (ns)": 100591482, "90th percentile latency (ns)": 100591482, "95.00 percentile latency (ns)": 104656294, "97.00 percentile latency (ns)": 106799125, "99.00 percentile latency (ns)": 110147798, "99.90 percentile latency (ns)": 116380992, "Max latency (ns)": 121208672, "Mean latency (ns)": 40383670, "Min duration satisfied": "Yes", "Min latency (ns)": 12801268, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 24.73, "QPS w/o loadgen overhead": 24.76, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 100.591482, "characteristics.90th_percentile_latency_ns": 100591482.0, "characteristics.90th_percentile_latency_s": 0.100591482, "characteristics.90th_percentile_latency_us": 100591.482, "characteristics.accuracy": 60.842, "characteristics.good": 30421, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.5-160-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.5-160-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.5_160.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 18.8679, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "7849024f66b83abe", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 29477284, "90.00 percentile latency (ns)": 112832957, "90th percentile latency (ns)": 112832957, "95.00 percentile latency (ns)": 179696685, "97.00 percentile latency (ns)": 192010920, "99.00 percentile latency (ns)": 202799284, "99.90 percentile latency (ns)": 211760180, "Max latency (ns)": 218109470, "Mean latency (ns)": 49641921, "Min duration satisfied": "Yes", "Min latency (ns)": 28520618, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 20.13, "QPS w/o loadgen overhead": 20.14, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 112.832957, "characteristics.90th_percentile_latency_ns": 112832957.0, "characteristics.90th_percentile_latency_s": 0.112832957, "characteristics.90th_percentile_latency_us": 112832.957, "characteristics.accuracy": 69.016, "characteristics.good": 34508, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-160-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-1.0-160-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_1.0_160.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 20.4082, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "67b9c38f7e5ffc7f", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 58536162, "90.00 percentile latency (ns)": 100737892, "90th percentile latency (ns)": 100737892, "95.00 percentile latency (ns)": 168624029, "97.00 percentile latency (ns)": 212149782, "99.00 percentile latency (ns)": 242464318, "99.90 percentile latency (ns)": 265273246, "Max latency (ns)": 282413735, "Mean latency (ns)": 72438353, "Min duration satisfied": "Yes", "Min latency (ns)": 53482196, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 13.8, "QPS w/o loadgen overhead": 13.8, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 100.737892, "characteristics.90th_percentile_latency_ns": 100737892.0, "characteristics.90th_percentile_latency_s": 0.100737892, "characteristics.90th_percentile_latency_us": 100737.892, "characteristics.accuracy": 74.098, "characteristics.good": 37049, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite1-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "efficientnet-lite1-quantized", "input_data_types": "uint8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite1.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 12.987, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "72ba12410ebf80f0", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 11609135, "90.00 percentile latency (ns)": 13368499, "90th percentile latency (ns)": 13368499, "95.00 percentile latency (ns)": 22314571, "97.00 percentile latency (ns)": 33863360, "99.00 percentile latency (ns)": 97990265, "99.90 percentile latency (ns)": 182462430, "Max latency (ns)": 202069877, "Mean latency (ns)": 13921083, "Min duration satisfied": "Yes", "Min latency (ns)": 10051966, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 71.65, "QPS w/o loadgen overhead": 71.83, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 13.368499, "characteristics.90th_percentile_latency_ns": 13368499.0, "characteristics.90th_percentile_latency_s": 0.013368499, "characteristics.90th_percentile_latency_us": 13368.499, "characteristics.accuracy": 61.924, "characteristics.good": 30962, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-192-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.5-192-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_192_50.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 66.6667, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "9159703f47d22912", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 10826962, "90.00 percentile latency (ns)": 16691362, "90th percentile latency (ns)": 16691362, "95.00 percentile latency (ns)": 34728431, "97.00 percentile latency (ns)": 75910651, "99.00 percentile latency (ns)": 102874204, "99.90 percentile latency (ns)": 112973233, "Max latency (ns)": 122977561, "Mean latency (ns)": 15088005, "Min duration satisfied": "Yes", "Min latency (ns)": 10338047, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 66.03, "QPS w/o loadgen overhead": 66.28, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 16.691362, "characteristics.90th_percentile_latency_ns": 16691362.0, "characteristics.90th_percentile_latency_s": 0.016691362, "characteristics.90th_percentile_latency_us": 16691.362, "characteristics.accuracy": 62.298, "characteristics.good": 31149, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.5-224-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.5-224-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.5_224_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 62.5, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "5a35ae86e81e2a8e", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 5205994, "90.00 percentile latency (ns)": 5548734, "90th percentile latency (ns)": 5548734, "95.00 percentile latency (ns)": 6875236, "97.00 percentile latency (ns)": 7661844, "99.00 percentile latency (ns)": 27438555, "99.90 percentile latency (ns)": 139583853, "Max latency (ns)": 189544897, "Mean latency (ns)": 5910820, "Min duration satisfied": "Yes", "Min latency (ns)": 4503670, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 168.24, "QPS w/o loadgen overhead": 169.18, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 5.548734, "characteristics.90th_percentile_latency_ns": 5548734.0, "characteristics.90th_percentile_latency_s": 0.005548734, "characteristics.90th_percentile_latency_us": 5548.734, "characteristics.accuracy": 49.12, "characteristics.good": 24560, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-128-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.35-128-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_128_35.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 142.857, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "82494c306f7518b9", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 40968398, "90.00 percentile latency (ns)": 69597610, "90th percentile latency (ns)": 69597610, "95.00 percentile latency (ns)": 123156810, "97.00 percentile latency (ns)": 173083050, "99.00 percentile latency (ns)": 210164310, "99.90 percentile latency (ns)": 229219462, "Max latency (ns)": 254823430, "Mean latency (ns)": 52952633, "Min duration satisfied": "Yes", "Min latency (ns)": 39743381, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 18.87, "QPS w/o loadgen overhead": 18.88, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 69.59761, "characteristics.90th_percentile_latency_ns": 69597610.0, "characteristics.90th_percentile_latency_s": 0.06959761, "characteristics.90th_percentile_latency_us": 69597.61, "characteristics.accuracy": 73.584, "characteristics.good": 36792, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.4-224-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-1.4-224-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_224_140.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 18.1818, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "d4a4477f916d7e46", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 29471510, "90.00 percentile latency (ns)": 59180448, "90th percentile latency (ns)": 59180448, "95.00 percentile latency (ns)": 111633316, "97.00 percentile latency (ns)": 120648137, "99.00 percentile latency (ns)": 127563838, "99.90 percentile latency (ns)": 138155778, "Max latency (ns)": 144373010, "Mean latency (ns)": 38957607, "Min duration satisfied": "Yes", "Min latency (ns)": 28517759, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 25.62, "QPS w/o loadgen overhead": 25.67, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 59.180448, "characteristics.90th_percentile_latency_ns": 59180448.0, "characteristics.90th_percentile_latency_s": 0.059180448, "characteristics.90th_percentile_latency_us": 59180.448, "characteristics.accuracy": 70.772, "characteristics.good": 35386, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-1.0-224-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-1.0-224-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_1.0_224_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 24.3902, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "8ba26f7190e90ce6", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 10213590, "90.00 percentile latency (ns)": 78457510, "90th percentile latency (ns)": 78457510, "95.00 percentile latency (ns)": 87635098, "97.00 percentile latency (ns)": 90668724, "99.00 percentile latency (ns)": 95825396, "99.90 percentile latency (ns)": 103955319, "Max latency (ns)": 116438366, "Mean latency (ns)": 25448126, "Min duration satisfied": "Yes", "Min latency (ns)": 6526921, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 39.2, "QPS w/o loadgen overhead": 39.3, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 78.45751, "characteristics.90th_percentile_latency_ns": 78457510.0, "characteristics.90th_percentile_latency_s": 0.07845751, "characteristics.90th_percentile_latency_us": 78457.51, "characteristics.accuracy": 47.808, "characteristics.good": 23904, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.25-160-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.25-160-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.25_160.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 37.037, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "81559b02b38a4b82", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 28009350, "90.00 percentile latency (ns)": 163724531, "90th percentile latency (ns)": 163724531, "95.00 percentile latency (ns)": 176483828, "97.00 percentile latency (ns)": 181654451, "99.00 percentile latency (ns)": 188445082, "99.90 percentile latency (ns)": 197133799, "Max latency (ns)": 204222224, "Mean latency (ns)": 58102036, "Min duration satisfied": "Yes", "Min latency (ns)": 16093297, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 17.2, "QPS w/o loadgen overhead": 17.21, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 163.724531, "characteristics.90th_percentile_latency_ns": 163724531.0, "characteristics.90th_percentile_latency_s": 0.163724531, "characteristics.90th_percentile_latency_us": 163724.531, "characteristics.accuracy": 64.038, "characteristics.good": 32019, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-128-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.75-128-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.75_128.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 12.5, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "b9eae56d6938f8b5", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 15285732, "90.00 percentile latency (ns)": 66472346, "90th percentile latency (ns)": 66472346, "95.00 percentile latency (ns)": 90631699, "97.00 percentile latency (ns)": 95329269, "99.00 percentile latency (ns)": 100950435, "99.90 percentile latency (ns)": 110517228, "Max latency (ns)": 127731957, "Mean latency (ns)": 26353731, "Min duration satisfied": "Yes", "Min latency (ns)": 11648032, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 37.88, "QPS w/o loadgen overhead": 37.95, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 66.472346, "characteristics.90th_percentile_latency_ns": 66472346.0, "characteristics.90th_percentile_latency_s": 0.066472346, "characteristics.90th_percentile_latency_us": 66472.346, "characteristics.accuracy": 51.848, "characteristics.good": 25924, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.25-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.25-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.25_224.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 21.2766, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "2c482a9e5492de0f", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 8706610, "90.00 percentile latency (ns)": 9571626, "90th percentile latency (ns)": 9571626, "95.00 percentile latency (ns)": 11733853, "97.00 percentile latency (ns)": 20562377, "99.00 percentile latency (ns)": 50446793, "99.90 percentile latency (ns)": 172257479, "Max latency (ns)": 196912385, "Mean latency (ns)": 10222979, "Min duration satisfied": "Yes", "Min latency (ns)": 7546065, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 97.51, "QPS w/o loadgen overhead": 97.82, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 9.571626, "characteristics.90th_percentile_latency_ns": 9571626.0, "characteristics.90th_percentile_latency_s": 0.009571626, "characteristics.90th_percentile_latency_us": 9571.626, "characteristics.accuracy": 59.226, "characteristics.good": 29613, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-160-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.5-160-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_160_50.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 100, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "8d983db08fa4cc70", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 16706711, "90.00 percentile latency (ns)": 20832059, "90th percentile latency (ns)": 20832059, "95.00 percentile latency (ns)": 34428515, "97.00 percentile latency (ns)": 45665545, "99.00 percentile latency (ns)": 98353047, "99.90 percentile latency (ns)": 116337492, "Max latency (ns)": 134855826, "Mean latency (ns)": 19576610, "Min duration satisfied": "Yes", "Min latency (ns)": 15677421, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 50.99, "QPS w/o loadgen overhead": 51.08, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 20.832059, "characteristics.90th_percentile_latency_ns": 20832059.0, "characteristics.90th_percentile_latency_s": 0.020832059, "characteristics.90th_percentile_latency_us": 20832.059, "characteristics.accuracy": 68.248, "characteristics.good": 34124, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-1.0-160-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-1.0-160-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_1.0_160_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 47.619, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "0dd76f8948e590a2", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 7517471, "90.00 percentile latency (ns)": 8377548, "90th percentile latency (ns)": 8377548, "95.00 percentile latency (ns)": 10177424, "97.00 percentile latency (ns)": 16899539, "99.00 percentile latency (ns)": 43189895, "99.90 percentile latency (ns)": 164456911, "Max latency (ns)": 194712795, "Mean latency (ns)": 8889307, "Min duration satisfied": "Yes", "Min latency (ns)": 6826489, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 112.08, "QPS w/o loadgen overhead": 112.49, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 8.377548, "characteristics.90th_percentile_latency_ns": 8377548.0, "characteristics.90th_percentile_latency_s": 0.008377548, "characteristics.90th_percentile_latency_us": 8377.548, "characteristics.accuracy": 59.12, "characteristics.good": 29560, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-96-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-1.0-96-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_96_100.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 100, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "604d64b071453080", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 7930698, "90.00 percentile latency (ns)": 9282319, "90th percentile latency (ns)": 9282319, "95.00 percentile latency (ns)": 11159779, "97.00 percentile latency (ns)": 21056606, "99.00 percentile latency (ns)": 63261785, "99.90 percentile latency (ns)": 103318463, "Max latency (ns)": 117994734, "Mean latency (ns)": 9471033, "Min duration satisfied": "Yes", "Min latency (ns)": 7117856, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 105.2, "QPS w/o loadgen overhead": 105.59, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 9.282319, "characteristics.90th_percentile_latency_ns": 9282319.0, "characteristics.90th_percentile_latency_s": 0.009282319, "characteristics.90th_percentile_latency_us": 9282.319, "characteristics.accuracy": 58.46, "characteristics.good": 29230, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.75-128-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.75-128-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.75_128_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 90.9091, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "d4724856b1fa8d7b", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 28343272, "90.00 percentile latency (ns)": 54925460, "90th percentile latency (ns)": 54925460, "95.00 percentile latency (ns)": 105130884, "97.00 percentile latency (ns)": 156958972, "99.00 percentile latency (ns)": 185274709, "99.90 percentile latency (ns)": 199068777, "Max latency (ns)": 206972320, "Mean latency (ns)": 39074021, "Min duration satisfied": "Yes", "Min latency (ns)": 27387188, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 25.56, "QPS w/o loadgen overhead": 25.59, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 54.92546, "characteristics.90th_percentile_latency_ns": 54925460.0, "characteristics.90th_percentile_latency_s": 0.05492546, "characteristics.90th_percentile_latency_us": 54925.46, "characteristics.accuracy": 72.91, "characteristics.good": 36455, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-large_224_1.0_uint8", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v3-large_224_1.0_uint8", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-large_224_1.0_uint8.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 27.027, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "c4fbfa720b58961b", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 26494628, "90.00 percentile latency (ns)": 49034181, "90th percentile latency (ns)": 49034181, "95.00 percentile latency (ns)": 92485159, "97.00 percentile latency (ns)": 155239706, "99.00 percentile latency (ns)": 194591374, "99.90 percentile latency (ns)": 208654179, "Max latency (ns)": 222012130, "Mean latency (ns)": 36554990, "Min duration satisfied": "Yes", "Min latency (ns)": 25653508, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 27.32, "QPS w/o loadgen overhead": 27.36, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 49.034181, "characteristics.90th_percentile_latency_ns": 49034181.0, "characteristics.90th_percentile_latency_s": 0.049034181, "characteristics.90th_percentile_latency_us": 49034.181, "characteristics.accuracy": 70.542, "characteristics.good": 35271, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-224-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-1.0-224-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_224_100.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 25.641, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "2224b4ae9978a9f5", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 9210561, "90.00 percentile latency (ns)": 10080606, "90th percentile latency (ns)": 10080606, "95.00 percentile latency (ns)": 12425320, "97.00 percentile latency (ns)": 22780588, "99.00 percentile latency (ns)": 65421873, "99.90 percentile latency (ns)": 174927510, "Max latency (ns)": 205106634, "Mean latency (ns)": 10804334, "Min duration satisfied": "Yes", "Min latency (ns)": 7813474, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 92.25, "QPS w/o loadgen overhead": 92.56, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 10.080606, "characteristics.90th_percentile_latency_ns": 10080606.0, "characteristics.90th_percentile_latency_s": 0.010080606, "characteristics.90th_percentile_latency_us": 10080.606, "characteristics.accuracy": 56.594, "characteristics.good": 28297, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-192-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.35-192-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_192_35.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 83.3333, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "ffa4f64925db41f8", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 16382042, "90.00 percentile latency (ns)": 20234668, "90th percentile latency (ns)": 20234668, "95.00 percentile latency (ns)": 35495210, "97.00 percentile latency (ns)": 50017293, "99.00 percentile latency (ns)": 129623381, "99.90 percentile latency (ns)": 191492889, "Max latency (ns)": 209920090, "Mean latency (ns)": 19882047, "Min duration satisfied": "Yes", "Min latency (ns)": 14825709, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 50.19, "QPS w/o loadgen overhead": 50.3, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 20.234668, "characteristics.90th_percentile_latency_ns": 20234668.0, "characteristics.90th_percentile_latency_s": 0.020234668, "characteristics.90th_percentile_latency_us": 20234.668, "characteristics.accuracy": 67.82, "characteristics.good": 33910, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-160-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-1.0-160-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_160_100.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 50, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "f84acf81bd9ac13b", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 4868214, "90.00 percentile latency (ns)": 35494840, "90th percentile latency (ns)": 35494840, "95.00 percentile latency (ns)": 64486175, "97.00 percentile latency (ns)": 76170783, "99.00 percentile latency (ns)": 85462701, "99.90 percentile latency (ns)": 96201139, "Max latency (ns)": 108830150, "Mean latency (ns)": 12620822, "Min duration satisfied": "Yes", "Min latency (ns)": 4572172, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 78.93, "QPS w/o loadgen overhead": 79.23, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 35.49484, "characteristics.90th_percentile_latency_ns": 35494840.0, "characteristics.90th_percentile_latency_s": 0.03549484, "characteristics.90th_percentile_latency_us": 35494.84, "characteristics.accuracy": 44.116, "characteristics.good": 22058, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.25-128-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.25-128-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.25_128.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 66.6667, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "6b4e2cb9a50b436c", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 3958506, "90.00 percentile latency (ns)": 4203799, "90th percentile latency (ns)": 4203799, "95.00 percentile latency (ns)": 5117884, "97.00 percentile latency (ns)": 5860760, "99.00 percentile latency (ns)": 20880161, "99.90 percentile latency (ns)": 82237296, "Max latency (ns)": 105842499, "Mean latency (ns)": 4395911, "Min duration satisfied": "Yes", "Min latency (ns)": 3143880, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 225.98, "QPS w/o loadgen overhead": 227.48, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 4.203799, "characteristics.90th_percentile_latency_ns": 4203799.0, "characteristics.90th_percentile_latency_s": 0.004203799, "characteristics.90th_percentile_latency_us": 4203.799, "characteristics.accuracy": 45.494, "characteristics.good": 22747, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.25-160-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.25-160-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.25_160_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 200, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "49b39497dacfd6d7", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 47220940, "90.00 percentile latency (ns)": 99206589, "90th percentile latency (ns)": 99206589, "95.00 percentile latency (ns)": 130194464, "97.00 percentile latency (ns)": 136852304, "99.00 percentile latency (ns)": 146423124, "99.90 percentile latency (ns)": 156444489, "Max latency (ns)": 168851599, "Mean latency (ns)": 59568211, "Min duration satisfied": "Yes", "Min latency (ns)": 44499111, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 16.78, "QPS w/o loadgen overhead": 16.79, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 99.206589, "characteristics.90th_percentile_latency_ns": 99206589.0, "characteristics.90th_percentile_latency_s": 0.099206589, "characteristics.90th_percentile_latency_us": 99206.589, "characteristics.accuracy": 70.626, "characteristics.good": 35313, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-1.0-192-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-1.0-192-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_1.0_192.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 15.625, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "77fc07979c1b4ca0", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 11149264, "90.00 percentile latency (ns)": 13011557, "90th percentile latency (ns)": 13011557, "95.00 percentile latency (ns)": 21248080, "97.00 percentile latency (ns)": 30889896, "99.00 percentile latency (ns)": 76446098, "99.90 percentile latency (ns)": 178062297, "Max latency (ns)": 198543587, "Mean latency (ns)": 13432322, "Min duration satisfied": "Yes", "Min latency (ns)": 10083519, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 74.25, "QPS w/o loadgen overhead": 74.45, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 13.011557, "characteristics.90th_percentile_latency_ns": 13011557.0, "characteristics.90th_percentile_latency_s": 0.013011557, "characteristics.90th_percentile_latency_us": 13011.557, "characteristics.accuracy": 63.454, "characteristics.good": 31727, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-128-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-1.0-128-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_128_100.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 66.6667, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "1423c9f5918502da", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 22883863, "90.00 percentile latency (ns)": 31358527, "90th percentile latency (ns)": 31358527, "95.00 percentile latency (ns)": 46005227, "97.00 percentile latency (ns)": 62535262, "99.00 percentile latency (ns)": 112243495, "99.90 percentile latency (ns)": 125623398, "Max latency (ns)": 135226530, "Mean latency (ns)": 26546330, "Min duration satisfied": "Yes", "Min latency (ns)": 21253238, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 37.61, "QPS w/o loadgen overhead": 37.67, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 31.358527, "characteristics.90th_percentile_latency_ns": 31358527.0, "characteristics.90th_percentile_latency_s": 0.031358527, "characteristics.90th_percentile_latency_us": 31358.527, "characteristics.accuracy": 70.04, "characteristics.good": 35020, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-1.0-192-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-1.0-192-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_1.0_192_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 37.037, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "1ed9aa8cf84e2c95", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 82084321, "90.00 percentile latency (ns)": 218946291, "90th percentile latency (ns)": 218946291, "95.00 percentile latency (ns)": 240552618, "97.00 percentile latency (ns)": 253173361, "99.00 percentile latency (ns)": 264615158, "99.90 percentile latency (ns)": 280148174, "Max latency (ns)": 299587688, "Mean latency (ns)": 115944873, "Min duration satisfied": "Yes", "Min latency (ns)": 71941036, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 8.62, "QPS w/o loadgen overhead": 8.62, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 218.946291, "characteristics.90th_percentile_latency_ns": 218946291.0, "characteristics.90th_percentile_latency_s": 0.218946291, "characteristics.90th_percentile_latency_us": 218946.291, "characteristics.accuracy": 74.124, "characteristics.good": 37062, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite2-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "efficientnet-lite2-quantized", "input_data_types": "uint8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite2.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 9.25926, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "62ea425f956ab57b", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 6887138, "90.00 percentile latency (ns)": 7588599, "90th percentile latency (ns)": 7588599, "95.00 percentile latency (ns)": 9032935, "97.00 percentile latency (ns)": 13319692, "99.00 percentile latency (ns)": 45967515, "99.90 percentile latency (ns)": 99540194, "Max latency (ns)": 111103213, "Mean latency (ns)": 8016714, "Min duration satisfied": "Yes", "Min latency (ns)": 6044803, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 124.25, "QPS w/o loadgen overhead": 124.74, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 7.588599, "characteristics.90th_percentile_latency_ns": 7588599.0, "characteristics.90th_percentile_latency_s": 0.007588599, "characteristics.90th_percentile_latency_us": 7588.599, "characteristics.accuracy": 59.444, "characteristics.good": 29722, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.5-160-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.5-160-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.5_160_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 71.4286, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "ce620fd1242aaa45", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 8911875, "90.00 percentile latency (ns)": 9939708, "90th percentile latency (ns)": 9939708, "95.00 percentile latency (ns)": 12300745, "97.00 percentile latency (ns)": 22090457, "99.00 percentile latency (ns)": 63948113, "99.90 percentile latency (ns)": 103096118, "Max latency (ns)": 117359647, "Mean latency (ns)": 10254123, "Min duration satisfied": "Yes", "Min latency (ns)": 7831250, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 97.22, "QPS w/o loadgen overhead": 97.52, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 9.939708, "characteristics.90th_percentile_latency_ns": 9939708.0, "characteristics.90th_percentile_latency_s": 0.009939708, "characteristics.90th_percentile_latency_us": 9939.708, "characteristics.accuracy": 61.456, "characteristics.good": 30728, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.5-192-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.5-192-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.5_192_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 83.3333, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "94b0587162ee22ec", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 10464424, "90.00 percentile latency (ns)": 13550840, "90th percentile latency (ns)": 13550840, "95.00 percentile latency (ns)": 24924679, "97.00 percentile latency (ns)": 39612849, "99.00 percentile latency (ns)": 144004531, "99.90 percentile latency (ns)": 182001982, "Max latency (ns)": 197312885, "Mean latency (ns)": 14159493, "Min duration satisfied": "Yes", "Min latency (ns)": 10007963, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 70.41, "QPS w/o loadgen overhead": 70.62, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 13.55084, "characteristics.90th_percentile_latency_ns": 13550840.0, "characteristics.90th_percentile_latency_s": 0.01355084, "characteristics.90th_percentile_latency_us": 13550.84, "characteristics.accuracy": 58.528, "characteristics.good": 29264, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-224-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.35-224-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_224_35.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 62.5, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "af5fc9f79f4323b7", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 26512340, "90.00 percentile latency (ns)": 169755088, "90th percentile latency (ns)": 169755088, "95.00 percentile latency (ns)": 183360654, "97.00 percentile latency (ns)": 188454435, "99.00 percentile latency (ns)": 195369950, "99.90 percentile latency (ns)": 205849329, "Max latency (ns)": 216695538, "Mean latency (ns)": 58189980, "Min duration satisfied": "Yes", "Min latency (ns)": 19906298, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 17.17, "QPS w/o loadgen overhead": 17.19, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 169.755088, "characteristics.90th_percentile_latency_ns": 169755088.0, "characteristics.90th_percentile_latency_s": 0.169755088, "characteristics.90th_percentile_latency_us": 169755.088, "characteristics.accuracy": 66.036, "characteristics.good": 33018, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-128-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-1.0-128-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_1.0_128.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 15.1515, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "4c7e94927a647a7e", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 106646431, "90.00 percentile latency (ns)": 188719818, "90th percentile latency (ns)": 188719818, "95.00 percentile latency (ns)": 251657516, "97.00 percentile latency (ns)": 269446840, "99.00 percentile latency (ns)": 285280972, "99.90 percentile latency (ns)": 298914223, "Max latency (ns)": 318689039, "Mean latency (ns)": 122777928, "Min duration satisfied": "Yes", "Min latency (ns)": 92435266, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 8.14, "QPS w/o loadgen overhead": 8.14, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 188.719818, "characteristics.90th_percentile_latency_ns": 188719818.0, "characteristics.90th_percentile_latency_s": 0.188719818, "characteristics.90th_percentile_latency_us": 188719.818, "characteristics.accuracy": 76.642, "characteristics.good": 38321, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite1-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "efficientnet-lite1-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite1.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 7.69231, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "99fdb46e14443bf2", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 21975023, "90.00 percentile latency (ns)": 29024868, "90th percentile latency (ns)": 29024868, "95.00 percentile latency (ns)": 44865639, "97.00 percentile latency (ns)": 61585670, "99.00 percentile latency (ns)": 148401649, "99.90 percentile latency (ns)": 196581733, "Max latency (ns)": 219009179, "Mean latency (ns)": 25987340, "Min duration satisfied": "Yes", "Min latency (ns)": 19767113, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 38.42, "QPS w/o loadgen overhead": 38.48, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 29.024868, "characteristics.90th_percentile_latency_ns": 29024868.0, "characteristics.90th_percentile_latency_s": 0.029024868, "characteristics.90th_percentile_latency_us": 29024.868, "characteristics.accuracy": 69.604, "characteristics.good": 34802, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-192-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-1.0-192-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_192_100.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 35.7143, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "674fd681f4a68a88", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 42093860, "90.00 percentile latency (ns)": 103966946, "90th percentile latency (ns)": 103966946, "95.00 percentile latency (ns)": 126031913, "97.00 percentile latency (ns)": 130761700, "99.00 percentile latency (ns)": 137410859, "99.90 percentile latency (ns)": 147584181, "Max latency (ns)": 153754085, "Mean latency (ns)": 55490086, "Min duration satisfied": "Yes", "Min latency (ns)": 39601280, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 18.01, "QPS w/o loadgen overhead": 18.02, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 103.966946, "characteristics.90th_percentile_latency_ns": 103966946.0, "characteristics.90th_percentile_latency_s": 0.103966946, "characteristics.90th_percentile_latency_us": 103966.946, "characteristics.accuracy": 69.262, "characteristics.good": 34631, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.75-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.75-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.75_224.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 16.129, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "af8cb3f40eda73c7", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 21574324, "90.00 percentile latency (ns)": 36915725, "90th percentile latency (ns)": 36915725, "95.00 percentile latency (ns)": 57276216, "97.00 percentile latency (ns)": 108585630, "99.00 percentile latency (ns)": 179276399, "99.90 percentile latency (ns)": 198989599, "Max latency (ns)": 215087503, "Mean latency (ns)": 28822997, "Min duration satisfied": "Yes", "Min latency (ns)": 20932366, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 34.64, "QPS w/o loadgen overhead": 34.69, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 36.915725, "characteristics.90th_percentile_latency_ns": 36915725.0, "characteristics.90th_percentile_latency_s": 0.036915725, "characteristics.90th_percentile_latency_us": 36915.725, "characteristics.accuracy": 68.734, "characteristics.good": 34367, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-224-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.75-224-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_224_75.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 27.7778, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "90f17a443db9f1c0", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 22166363, "90.00 percentile latency (ns)": 118090833, "90th percentile latency (ns)": 118090833, "95.00 percentile latency (ns)": 125432297, "97.00 percentile latency (ns)": 128582941, "99.00 percentile latency (ns)": 133061336, "99.90 percentile latency (ns)": 141411892, "Max latency (ns)": 151787647, "Mean latency (ns)": 43672034, "Min duration satisfied": "Yes", "Min latency (ns)": 15316868, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 22.88, "QPS w/o loadgen overhead": 22.9, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 118.090833, "characteristics.90th_percentile_latency_ns": 118090833.0, "characteristics.90th_percentile_latency_s": 0.118090833, "characteristics.90th_percentile_latency_us": 118090.833, "characteristics.accuracy": 63.33, "characteristics.good": 31665, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-small-minimalistic_224_1.0_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v3-small-minimalistic_224_1.0_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-small-minimalistic_224_1.0_float.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 15.1515, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "57588e5031dbf7d7", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 10253257, "90.00 percentile latency (ns)": 78455495, "90th percentile latency (ns)": 78455495, "95.00 percentile latency (ns)": 93172117, "97.00 percentile latency (ns)": 96517047, "99.00 percentile latency (ns)": 101052684, "99.90 percentile latency (ns)": 108020001, "Max latency (ns)": 115166725, "Mean latency (ns)": 23420636, "Min duration satisfied": "Yes", "Min latency (ns)": 8704214, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 42.58, "QPS w/o loadgen overhead": 42.7, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 78.455495, "characteristics.90th_percentile_latency_ns": 78455495.0, "characteristics.90th_percentile_latency_s": 0.078455495, "characteristics.90th_percentile_latency_us": 78455.495, "characteristics.accuracy": 57.918, "characteristics.good": 28959, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.5-128-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.5-128-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.5_128.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 40, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "d198f7f75a43c183", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 67113534, "90.00 percentile latency (ns)": 112243387, "90th percentile latency (ns)": 112243387, "95.00 percentile latency (ns)": 140090271, "97.00 percentile latency (ns)": 147007330, "99.00 percentile latency (ns)": 154845317, "99.90 percentile latency (ns)": 164764637, "Max latency (ns)": 173258843, "Mean latency (ns)": 75139987, "Min duration satisfied": "Yes", "Min latency (ns)": 58561334, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 13.3, "QPS w/o loadgen overhead": 13.31, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 112.243387, "characteristics.90th_percentile_latency_ns": 112243387.0, "characteristics.90th_percentile_latency_s": 0.112243387, "characteristics.90th_percentile_latency_us": 112243.387, "characteristics.accuracy": 71.676, "characteristics.good": 35838, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-1.0-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-1.0-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_1.0_224.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 12.987, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "846cdb136e37b408", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 3665669, "90.00 percentile latency (ns)": 3910669, "90th percentile latency (ns)": 3910669, "95.00 percentile latency (ns)": 4677169, "97.00 percentile latency (ns)": 5617795, "99.00 percentile latency (ns)": 18406510, "99.90 percentile latency (ns)": 106049478, "Max latency (ns)": 168409023, "Mean latency (ns)": 4138556, "Min duration satisfied": "Yes", "Min latency (ns)": 3153794, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 239.27, "QPS w/o loadgen overhead": 241.63, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 3.910669, "characteristics.90th_percentile_latency_ns": 3910669.0, "characteristics.90th_percentile_latency_s": 0.003910669, "characteristics.90th_percentile_latency_us": 3910.669, "characteristics.accuracy": 43.468, "characteristics.good": 21734, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-96-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.35-96-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_96_35.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 166.667, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "48a4ca88d5a15e47", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 493166225, "90.00 percentile latency (ns)": 545062465, "90th percentile latency (ns)": 545062465, "95.00 percentile latency (ns)": 558331316, "97.00 percentile latency (ns)": 563402405, "99.00 percentile latency (ns)": 578899309, "99.90 percentile latency (ns)": 603919584, "Max latency (ns)": 606813127, "Mean latency (ns)": 486407759, "Min duration satisfied": "Yes", "Min latency (ns)": 317799355, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 2.06, "QPS w/o loadgen overhead": 2.06, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 545.062465, "characteristics.90th_percentile_latency_ns": 545062465.0, "characteristics.90th_percentile_latency_s": 0.545062465, "characteristics.90th_percentile_latency_us": 545062.465, "characteristics.accuracy": 80.676, "characteristics.good": 40338, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite4-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "efficientnet-lite4-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite4.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 2.04082, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "237952b68714db67", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 20320465, "90.00 percentile latency (ns)": 37608561, "90th percentile latency (ns)": 37608561, "95.00 percentile latency (ns)": 62329245, "97.00 percentile latency (ns)": 113245349, "99.00 percentile latency (ns)": 171833717, "99.90 percentile latency (ns)": 186307213, "Max latency (ns)": 204630543, "Mean latency (ns)": 27927407, "Min duration satisfied": "Yes", "Min latency (ns)": 19294991, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 35.75, "QPS w/o loadgen overhead": 35.81, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 37.608561, "characteristics.90th_percentile_latency_ns": 37608561.0, "characteristics.90th_percentile_latency_s": 0.037608561, "characteristics.90th_percentile_latency_us": 37608.561, "characteristics.accuracy": 70.43, "characteristics.good": 35215, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-large-minimalistic_224_1.0_uint8", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v3-large-minimalistic_224_1.0_uint8", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-large-minimalistic_224_1.0_uint8.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 31.25, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "53700d4b759939b5", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 17615222, "90.00 percentile latency (ns)": 22136642, "90th percentile latency (ns)": 22136642, "95.00 percentile latency (ns)": 38915758, "97.00 percentile latency (ns)": 56554938, "99.00 percentile latency (ns)": 152838474, "99.90 percentile latency (ns)": 195292286, "Max latency (ns)": 207265853, "Mean latency (ns)": 21510970, "Min duration satisfied": "Yes", "Min latency (ns)": 15719395, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 46.39, "QPS w/o loadgen overhead": 46.49, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 22.136642, "characteristics.90th_percentile_latency_ns": 22136642.0, "characteristics.90th_percentile_latency_s": 0.022136642, "characteristics.90th_percentile_latency_us": 22136.642, "characteristics.accuracy": 67.474, "characteristics.good": 33737, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-192-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.75-192-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_192_75.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 40, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "0f3fbd4a6bacd801", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 14653339, "90.00 percentile latency (ns)": 18213715, "90th percentile latency (ns)": 18213715, "95.00 percentile latency (ns)": 32555846, "97.00 percentile latency (ns)": 44771434, "99.00 percentile latency (ns)": 99529581, "99.90 percentile latency (ns)": 116789545, "Max latency (ns)": 137581845, "Mean latency (ns)": 17458367, "Min duration satisfied": "Yes", "Min latency (ns)": 13464214, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 57.15, "QPS w/o loadgen overhead": 57.28, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 18.213715, "characteristics.90th_percentile_latency_ns": 18213715.0, "characteristics.90th_percentile_latency_s": 0.018213715, "characteristics.90th_percentile_latency_us": 18213.715, "characteristics.accuracy": 67.24, "characteristics.good": 33620, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.75-192-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.75-192-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.75_192_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 55.5556, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "6f3e1e50f88419ea", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 29050615, "90.00 percentile latency (ns)": 111500635, "90th percentile latency (ns)": 111500635, "95.00 percentile latency (ns)": 116039769, "97.00 percentile latency (ns)": 118585473, "99.00 percentile latency (ns)": 124206417, "99.90 percentile latency (ns)": 132168918, "Max latency (ns)": 141832409, "Mean latency (ns)": 48846160, "Min duration satisfied": "Yes", "Min latency (ns)": 22974915, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 20.45, "QPS w/o loadgen overhead": 20.47, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 111.500635, "characteristics.90th_percentile_latency_ns": 111500635.0, "characteristics.90th_percentile_latency_s": 0.111500635, "characteristics.90th_percentile_latency_us": 111500.635, "characteristics.accuracy": 64.348, "characteristics.good": 32174, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.5-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.5-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.5_224.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 12.6582, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "8782bb391a0245b6", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 24845427, "90.00 percentile latency (ns)": 106397406, "90th percentile latency (ns)": 106397406, "95.00 percentile latency (ns)": 110835831, "97.00 percentile latency (ns)": 113210040, "99.00 percentile latency (ns)": 118383452, "99.90 percentile latency (ns)": 126807003, "Max latency (ns)": 133033629, "Mean latency (ns)": 46232417, "Min duration satisfied": "Yes", "Min latency (ns)": 16990535, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 21.6, "QPS w/o loadgen overhead": 21.63, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 106.397406, "characteristics.90th_percentile_latency_ns": 106397406.0, "characteristics.90th_percentile_latency_s": 0.106397406, "characteristics.90th_percentile_latency_us": 106397.406, "characteristics.accuracy": 63.246, "characteristics.good": 31623, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.5-192-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.5-192-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.5_192.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 16.9492, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "e3484cbcede11ef4", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 20302919, "90.00 percentile latency (ns)": 149681596, "90th percentile latency (ns)": 149681596, "95.00 percentile latency (ns)": 171478140, "97.00 percentile latency (ns)": 177026518, "99.00 percentile latency (ns)": 185637602, "99.90 percentile latency (ns)": 199486606, "Max latency (ns)": 209828482, "Mean latency (ns)": 48166814, "Min duration satisfied": "Yes", "Min latency (ns)": 14214377, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 20.74, "QPS w/o loadgen overhead": 20.76, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 149.681596, "characteristics.90th_percentile_latency_ns": 149681596.0, "characteristics.90th_percentile_latency_s": 0.149681596, "characteristics.90th_percentile_latency_us": 149681.596, "characteristics.accuracy": 61.668, "characteristics.good": 30834, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-160-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.5-160-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.5_160.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 14.9254, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "9a70259e3a467980", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 27680589, "90.00 percentile latency (ns)": 111265732, "90th percentile latency (ns)": 111265732, "95.00 percentile latency (ns)": 116376725, "97.00 percentile latency (ns)": 118541431, "99.00 percentile latency (ns)": 122734634, "99.90 percentile latency (ns)": 131910456, "Max latency (ns)": 170061947, "Mean latency (ns)": 47738250, "Min duration satisfied": "Yes", "Min latency (ns)": 23015678, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 20.92, "QPS w/o loadgen overhead": 20.95, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 111.265732, "characteristics.90th_percentile_latency_ns": 111265732.0, "characteristics.90th_percentile_latency_s": 0.111265732, "characteristics.90th_percentile_latency_us": 111265.732, "characteristics.accuracy": 66.384, "characteristics.good": 33192, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.75-160-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.75-160-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.75_160.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 21.2766, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "3b1d456983b01c2b", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 4536301, "90.00 percentile latency (ns)": 4827087, "90th percentile latency (ns)": 4827087, "95.00 percentile latency (ns)": 5834796, "97.00 percentile latency (ns)": 7165379, "99.00 percentile latency (ns)": 25497262, "99.90 percentile latency (ns)": 129616094, "Max latency (ns)": 177859017, "Mean latency (ns)": 5248003, "Min duration satisfied": "Yes", "Min latency (ns)": 4066717, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 189.23, "QPS w/o loadgen overhead": 190.55, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 4.827087, "characteristics.90th_percentile_latency_ns": 4827087.0, "characteristics.90th_percentile_latency_s": 0.004827087, "characteristics.90th_percentile_latency_us": 4827.087, "characteristics.accuracy": 49.11, "characteristics.good": 24555, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-96-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.5-96-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_96_50.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 166.667, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "d4e7ab62080fb2cd", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 9345883, "90.00 percentile latency (ns)": 10262592, "90th percentile latency (ns)": 10262592, "95.00 percentile latency (ns)": 13389261, "97.00 percentile latency (ns)": 23671271, "99.00 percentile latency (ns)": 52784919, "99.90 percentile latency (ns)": 169222984, "Max latency (ns)": 190353819, "Mean latency (ns)": 11014115, "Min duration satisfied": "Yes", "Min latency (ns)": 8397382, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 90.52, "QPS w/o loadgen overhead": 90.79, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 10.262592, "characteristics.90th_percentile_latency_ns": 10262592.0, "characteristics.90th_percentile_latency_s": 0.010262592, "characteristics.90th_percentile_latency_us": 10262.592, "characteristics.accuracy": 62.07, "characteristics.good": 31035, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-128-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.75-128-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_128_75.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 83.3333, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "4e699c697cd94048", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 22491892, "90.00 percentile latency (ns)": 159527287, "90th percentile latency (ns)": 159527287, "95.00 percentile latency (ns)": 175158210, "97.00 percentile latency (ns)": 180113523, "99.00 percentile latency (ns)": 186679424, "99.90 percentile latency (ns)": 196358300, "Max latency (ns)": 207891714, "Mean latency (ns)": 52277473, "Min duration satisfied": "Yes", "Min latency (ns)": 14357010, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 19.11, "QPS w/o loadgen overhead": 19.13, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 159.527287, "characteristics.90th_percentile_latency_ns": 159527287.0, "characteristics.90th_percentile_latency_s": 0.159527287, "characteristics.90th_percentile_latency_us": 159527.287, "characteristics.accuracy": 61.224, "characteristics.good": 30612, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-96-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-1.0-96-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_1.0_96.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 14.0845, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "355f9b44a692fa68", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 2730588, "90.00 percentile latency (ns)": 2926880, "90th percentile latency (ns)": 2926880, "95.00 percentile latency (ns)": 3304880, "97.00 percentile latency (ns)": 4201173, "99.00 percentile latency (ns)": 10234308, "99.90 percentile latency (ns)": 76645992, "Max latency (ns)": 97319692, "Mean latency (ns)": 3024682, "Min duration satisfied": "Yes", "Min latency (ns)": 2192462, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 326.77, "QPS w/o loadgen overhead": 330.61, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 2.92688, "characteristics.90th_percentile_latency_ns": 2926880.0, "characteristics.90th_percentile_latency_s": 0.00292688, "characteristics.90th_percentile_latency_us": 2926.88, "characteristics.accuracy": 42.384, "characteristics.good": 21192, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.25-128-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.25-128-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.25_128_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 250, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "5171580ff0440396", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 90824085, "90.00 percentile latency (ns)": 214439020, "90th percentile latency (ns)": 214439020, "95.00 percentile latency (ns)": 231803674, "97.00 percentile latency (ns)": 237869912, "99.00 percentile latency (ns)": 246492457, "99.90 percentile latency (ns)": 258797746, "Max latency (ns)": 265246279, "Mean latency (ns)": 115129795, "Min duration satisfied": "Yes", "Min latency (ns)": 75316119, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 8.68, "QPS w/o loadgen overhead": 8.69, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 214.43902, "characteristics.90th_percentile_latency_ns": 214439020.0, "characteristics.90th_percentile_latency_s": 0.21443902, "characteristics.90th_percentile_latency_us": 214439.02, "characteristics.accuracy": 75.012, "characteristics.good": 37506, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.3-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-1.3-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_1.3_224.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 7.46269, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "7931e41cb42c48bb", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 12214715, "90.00 percentile latency (ns)": 20767838, "90th percentile latency (ns)": 20767838, "95.00 percentile latency (ns)": 37794467, "97.00 percentile latency (ns)": 75555898, "99.00 percentile latency (ns)": 120644553, "99.90 percentile latency (ns)": 133118886, "Max latency (ns)": 145581929, "Mean latency (ns)": 17070558, "Min duration satisfied": "Yes", "Min latency (ns)": 11446458, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 58.37, "QPS w/o loadgen overhead": 58.58, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 20.767838, "characteristics.90th_percentile_latency_ns": 20767838.0, "characteristics.90th_percentile_latency_s": 0.020767838, "characteristics.90th_percentile_latency_us": 20767.838, "characteristics.accuracy": 64.486, "characteristics.good": 32243, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-small_224_1.0_uint8", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v3-small_224_1.0_uint8", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-small_224_1.0_uint8.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 41.6667, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "44f82ad39c9f39cc", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 235354940, "90.00 percentile latency (ns)": 293672880, "90th percentile latency (ns)": 293672880, "95.00 percentile latency (ns)": 303602443, "97.00 percentile latency (ns)": 309512456, "99.00 percentile latency (ns)": 317951459, "99.90 percentile latency (ns)": 341667413, "Max latency (ns)": 448119929, "Mean latency (ns)": 226369438, "Min duration satisfied": "Yes", "Min latency (ns)": 123688929, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 4.42, "QPS w/o loadgen overhead": 4.42, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 293.67288, "characteristics.90th_percentile_latency_ns": 293672880.0, "characteristics.90th_percentile_latency_s": 0.29367288, "characteristics.90th_percentile_latency_us": 293672.88, "characteristics.accuracy": 77.542, "characteristics.good": 38771, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite2-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "efficientnet-lite2-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite2.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 4.1841, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "32aa7f02fda0d9e7", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 4758237, "90.00 percentile latency (ns)": 5070901, "90th percentile latency (ns)": 5070901, "95.00 percentile latency (ns)": 6425106, "97.00 percentile latency (ns)": 7324606, "99.00 percentile latency (ns)": 30748539, "99.90 percentile latency (ns)": 92909809, "Max latency (ns)": 110418255, "Mean latency (ns)": 5556298, "Min duration satisfied": "Yes", "Min latency (ns)": 4188612, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 178.91, "QPS w/o loadgen overhead": 179.98, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 5.070901, "characteristics.90th_percentile_latency_ns": 5070901.0, "characteristics.90th_percentile_latency_s": 0.005070901, "characteristics.90th_percentile_latency_us": 5070.901, "characteristics.accuracy": 56.75, "characteristics.good": 28375, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.5-128-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.5-128-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.5_128_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 142.857, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "e012c413193d750b", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 6363308, "90.00 percentile latency (ns)": 6912225, "90th percentile latency (ns)": 6912225, "95.00 percentile latency (ns)": 8768984, "97.00 percentile latency (ns)": 12195198, "99.00 percentile latency (ns)": 35451960, "99.90 percentile latency (ns)": 160676373, "Max latency (ns)": 190830690, "Mean latency (ns)": 7541181, "Min duration satisfied": "Yes", "Min latency (ns)": 5678180, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 131.99, "QPS w/o loadgen overhead": 132.61, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 6.912225, "characteristics.90th_percentile_latency_ns": 6912225.0, "characteristics.90th_percentile_latency_s": 0.006912225, "characteristics.90th_percentile_latency_us": 6912.225, "characteristics.accuracy": 57.002, "characteristics.good": 28501, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-96-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.75-96-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_96_75.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 125, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "d44edaf1402a3f31", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 97122266, "90.00 percentile latency (ns)": 224166652, "90th percentile latency (ns)": 224166652, "95.00 percentile latency (ns)": 239890229, "97.00 percentile latency (ns)": 245796986, "99.00 percentile latency (ns)": 254903706, "99.90 percentile latency (ns)": 269859817, "Max latency (ns)": 302025508, "Mean latency (ns)": 122297193, "Min duration satisfied": "Yes", "Min latency (ns)": 80872906, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 8.17, "QPS w/o loadgen overhead": 8.18, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 224.166652, "characteristics.90th_percentile_latency_ns": 224166652.0, "characteristics.90th_percentile_latency_s": 0.224166652, "characteristics.90th_percentile_latency_us": 224166.652, "characteristics.accuracy": 75.69, "characteristics.good": 37845, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.4-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-1.4-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_1.4_224.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 7.8125, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "3a5374dc145f9980", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 12780032, "90.00 percentile latency (ns)": 87989630, "90th percentile latency (ns)": 87989630, "95.00 percentile latency (ns)": 128423714, "97.00 percentile latency (ns)": 146326964, "99.00 percentile latency (ns)": 161816515, "99.90 percentile latency (ns)": 175251622, "Max latency (ns)": 221374888, "Mean latency (ns)": 32478406, "Min duration satisfied": "Yes", "Min latency (ns)": 7508101, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 30.74, "QPS w/o loadgen overhead": 30.79, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 87.98963, "characteristics.90th_percentile_latency_ns": 87989630.0, "characteristics.90th_percentile_latency_s": 0.08798963, "characteristics.90th_percentile_latency_us": 87989.63, "characteristics.accuracy": 52.446, "characteristics.good": 26223, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-96-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.5-96-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.5_96.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 23.2558, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "34a22d254fbc227d", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 40724219, "90.00 percentile latency (ns)": 142885348, "90th percentile latency (ns)": 142885348, "95.00 percentile latency (ns)": 178986945, "97.00 percentile latency (ns)": 184916233, "99.00 percentile latency (ns)": 192241144, "99.90 percentile latency (ns)": 203334135, "Max latency (ns)": 211794462, "Mean latency (ns)": 62287004, "Min duration satisfied": "Yes", "Min latency (ns)": 36586638, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 16.05, "QPS w/o loadgen overhead": 16.05, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 142.885348, "characteristics.90th_percentile_latency_ns": 142885348.0, "characteristics.90th_percentile_latency_s": 0.142885348, "characteristics.90th_percentile_latency_us": 142885.348, "characteristics.accuracy": 73.724, "characteristics.good": 36862, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-large_224_0.75_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v3-large_224_0.75_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-large_224_0.75_float.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 12.0482, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "4a64a599ec2ac354", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 32019478, "90.00 percentile latency (ns)": 112981237, "90th percentile latency (ns)": 112981237, "95.00 percentile latency (ns)": 117429446, "97.00 percentile latency (ns)": 119822574, "99.00 percentile latency (ns)": 124209659, "99.90 percentile latency (ns)": 132818665, "Max latency (ns)": 191395578, "Mean latency (ns)": 52205445, "Min duration satisfied": "Yes", "Min latency (ns)": 23986389, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 19.13, "QPS w/o loadgen overhead": 19.16, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 112.981237, "characteristics.90th_percentile_latency_ns": 112981237.0, "characteristics.90th_percentile_latency_s": 0.112981237, "characteristics.90th_percentile_latency_us": 112981.237, "characteristics.accuracy": 66.604, "characteristics.good": 33302, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-1.0-128-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-1.0-128-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_1.0_128.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 15.873, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "a9ce84ff4e96b502", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 36871071, "90.00 percentile latency (ns)": 109830506, "90th percentile latency (ns)": 109830506, "95.00 percentile latency (ns)": 123202720, "97.00 percentile latency (ns)": 126797048, "99.00 percentile latency (ns)": 133317612, "99.90 percentile latency (ns)": 142310702, "Max latency (ns)": 190740268, "Mean latency (ns)": 52429974, "Min duration satisfied": "Yes", "Min latency (ns)": 34244324, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 19.06, "QPS w/o loadgen overhead": 19.07, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 109.830506, "characteristics.90th_percentile_latency_ns": 109830506.0, "characteristics.90th_percentile_latency_s": 0.109830506, "characteristics.90th_percentile_latency_us": 109830.506, "characteristics.accuracy": 69.106, "characteristics.good": 34553, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-1.0-160-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-1.0-160-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_1.0_160.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 16.9492, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "2ac2fc4e1d108984", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 19473532, "90.00 percentile latency (ns)": 144222804, "90th percentile latency (ns)": 144222804, "95.00 percentile latency (ns)": 165272168, "97.00 percentile latency (ns)": 170697082, "99.00 percentile latency (ns)": 178262160, "99.90 percentile latency (ns)": 191207190, "Max latency (ns)": 220197485, "Mean latency (ns)": 46844565, "Min duration satisfied": "Yes", "Min latency (ns)": 11443613, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 21.33, "QPS w/o loadgen overhead": 21.35, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 144.222804, "characteristics.90th_percentile_latency_ns": 144222804.0, "characteristics.90th_percentile_latency_s": 0.144222804, "characteristics.90th_percentile_latency_us": 144222.804, "characteristics.accuracy": 59.822, "characteristics.good": 29911, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-96-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.75-96-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.75_96.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 14.7059, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "aad0cbee40c00ba7", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 20471162, "90.00 percentile latency (ns)": 90984416, "90th percentile latency (ns)": 90984416, "95.00 percentile latency (ns)": 126942960, "97.00 percentile latency (ns)": 131793943, "99.00 percentile latency (ns)": 137545287, "99.90 percentile latency (ns)": 146154368, "Max latency (ns)": 153606213, "Mean latency (ns)": 34993742, "Min duration satisfied": "Yes", "Min latency (ns)": 19234206, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 28.55, "QPS w/o loadgen overhead": 28.58, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 90.984416, "characteristics.90th_percentile_latency_ns": 90984416.0, "characteristics.90th_percentile_latency_s": 0.090984416, "characteristics.90th_percentile_latency_us": 90984.416, "characteristics.accuracy": 68.336, "characteristics.good": 34168, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-small_224_1.0_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v3-small_224_1.0_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-small_224_1.0_float.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 19.6078, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "3ac3d129cc4efb91", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 30922372, "90.00 percentile latency (ns)": 100687698, "90th percentile latency (ns)": 100687698, "95.00 percentile latency (ns)": 166090576, "97.00 percentile latency (ns)": 183803355, "99.00 percentile latency (ns)": 195721928, "99.90 percentile latency (ns)": 208600006, "Max latency (ns)": 222734699, "Mean latency (ns)": 49149669, "Min duration satisfied": "Yes", "Min latency (ns)": 29720316, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 20.33, "QPS w/o loadgen overhead": 20.35, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 100.687698, "characteristics.90th_percentile_latency_ns": 100687698.0, "characteristics.90th_percentile_latency_s": 0.100687698, "characteristics.90th_percentile_latency_us": 100687.698, "characteristics.accuracy": 68.834, "characteristics.good": 34417, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-192-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.75-192-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.75_192.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 13.8889, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "d8fe094df1870eb2", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 37430736, "90.00 percentile latency (ns)": 76605925, "90th percentile latency (ns)": 76605925, "95.00 percentile latency (ns)": 139227907, "97.00 percentile latency (ns)": 168307146, "99.00 percentile latency (ns)": 186914303, "99.90 percentile latency (ns)": 201449122, "Max latency (ns)": 213005614, "Mean latency (ns)": 49984386, "Min duration satisfied": "Yes", "Min latency (ns)": 34854737, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 19.98, "QPS w/o loadgen overhead": 20.01, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 76.605925, "characteristics.90th_percentile_latency_ns": 76605925.0, "characteristics.90th_percentile_latency_s": 0.076605925, "characteristics.90th_percentile_latency_us": 76605.925, "characteristics.accuracy": 71.19, "characteristics.good": 35595, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite0-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "efficientnet-lite0-quantized", "input_data_types": "uint8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite0.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 18.5185, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "86e5694b0b9d2063", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 328586430, "90.00 percentile latency (ns)": 380736463, "90th percentile latency (ns)": 380736463, "95.00 percentile latency (ns)": 390845357, "97.00 percentile latency (ns)": 396542383, "99.00 percentile latency (ns)": 409008172, "99.90 percentile latency (ns)": 430273817, "Max latency (ns)": 436923714, "Mean latency (ns)": 324454976, "Min duration satisfied": "Yes", "Min latency (ns)": 183151052, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 3.08, "QPS w/o loadgen overhead": 3.08, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 380.736463, "characteristics.90th_percentile_latency_ns": 380736463.0, "characteristics.90th_percentile_latency_s": 0.380736463, "characteristics.90th_percentile_latency_us": 380736.463, "characteristics.accuracy": 79.268, "characteristics.good": 39634, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite3-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "efficientnet-lite3-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite3.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 3.0581, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "10f1e4614a808101", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 20941283, "90.00 percentile latency (ns)": 120124191, "90th percentile latency (ns)": 120124191, "95.00 percentile latency (ns)": 128274408, "97.00 percentile latency (ns)": 131334281, "99.00 percentile latency (ns)": 136386437, "99.90 percentile latency (ns)": 143850135, "Max latency (ns)": 148640802, "Mean latency (ns)": 42570811, "Min duration satisfied": "Yes", "Min latency (ns)": 16920487, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 23.47, "QPS w/o loadgen overhead": 23.49, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 120.124191, "characteristics.90th_percentile_latency_ns": 120124191.0, "characteristics.90th_percentile_latency_s": 0.120124191, "characteristics.90th_percentile_latency_us": 120124.191, "characteristics.accuracy": 66.216, "characteristics.good": 33108, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-small_224_0.75_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v3-small_224_0.75_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-small_224_0.75_float.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 15.3846, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "289a9b5c326428c4", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 115874378, "90.00 percentile latency (ns)": 269592209, "90th percentile latency (ns)": 269592209, "95.00 percentile latency (ns)": 300265842, "97.00 percentile latency (ns)": 312628754, "99.00 percentile latency (ns)": 325390025, "99.90 percentile latency (ns)": 345693816, "Max latency (ns)": 365999025, "Mean latency (ns)": 150988597, "Min duration satisfied": "Yes", "Min latency (ns)": 104186136, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 6.62, "QPS w/o loadgen overhead": 6.62, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 269.592209, "characteristics.90th_percentile_latency_ns": 269592209.0, "characteristics.90th_percentile_latency_s": 0.269592209, "characteristics.90th_percentile_latency_us": 269592.209, "characteristics.accuracy": 76.344, "characteristics.good": 38172, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite3-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "efficientnet-lite3-quantized", "input_data_types": "uint8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite3.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 6.09756, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "75c8cbb8351c5a2a", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 7051358, "90.00 percentile latency (ns)": 7642861, "90th percentile latency (ns)": 7642861, "95.00 percentile latency (ns)": 9089813, "97.00 percentile latency (ns)": 11290455, "99.00 percentile latency (ns)": 36475044, "99.90 percentile latency (ns)": 159079489, "Max latency (ns)": 183746471, "Mean latency (ns)": 8050293, "Min duration satisfied": "Yes", "Min latency (ns)": 6052109, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 123.73, "QPS w/o loadgen overhead": 124.22, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 7.642861, "characteristics.90th_percentile_latency_ns": 7642861.0, "characteristics.90th_percentile_latency_s": 0.007642861, "characteristics.90th_percentile_latency_us": 7642.861, "characteristics.accuracy": 54.568, "characteristics.good": 27284, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-160-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.35-160-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_160_35.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 125, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "c9d42dfbe4df6807", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 9956947, "90.00 percentile latency (ns)": 22275246, "90th percentile latency (ns)": 22275246, "95.00 percentile latency (ns)": 45031125, "97.00 percentile latency (ns)": 67555777, "99.00 percentile latency (ns)": 89787574, "99.90 percentile latency (ns)": 100707019, "Max latency (ns)": 112317832, "Mean latency (ns)": 14560577, "Min duration satisfied": "Yes", "Min latency (ns)": 8737199, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 68.47, "QPS w/o loadgen overhead": 68.68, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 22.275246, "characteristics.90th_percentile_latency_ns": 22275246.0, "characteristics.90th_percentile_latency_s": 0.022275246, "characteristics.90th_percentile_latency_us": 22275.246, "characteristics.accuracy": 49.478, "characteristics.good": 24739, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.25-192-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.25-192-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.25_192.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 71.4286, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "8d52da74fea85a54", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 19178790, "90.00 percentile latency (ns)": 38852916, "90th percentile latency (ns)": 38852916, "95.00 percentile latency (ns)": 83031837, "97.00 percentile latency (ns)": 104816710, "99.00 percentile latency (ns)": 113668641, "99.90 percentile latency (ns)": 122058297, "Max latency (ns)": 128536070, "Mean latency (ns)": 26270045, "Min duration satisfied": "Yes", "Min latency (ns)": 18471522, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 37.96, "QPS w/o loadgen overhead": 38.07, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 38.852916, "characteristics.90th_percentile_latency_ns": 38852916.0, "characteristics.90th_percentile_latency_s": 0.038852916, "characteristics.90th_percentile_latency_us": 38852.916, "characteristics.accuracy": 68.126, "characteristics.good": 34063, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.75-224-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.75-224-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.75_224_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 43.4783, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "8647548a4c852958", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 47920505, "90.00 percentile latency (ns)": 148144554, "90th percentile latency (ns)": 148144554, "95.00 percentile latency (ns)": 187204362, "97.00 percentile latency (ns)": 195508978, "99.00 percentile latency (ns)": 204716307, "99.90 percentile latency (ns)": 216698547, "Max latency (ns)": 230300413, "Mean latency (ns)": 71103859, "Min duration satisfied": "Yes", "Min latency (ns)": 46066091, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 14.06, "QPS w/o loadgen overhead": 14.06, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 148.144554, "characteristics.90th_percentile_latency_ns": 148144554.0, "characteristics.90th_percentile_latency_s": 0.148144554, "characteristics.90th_percentile_latency_us": 148144.554, "characteristics.accuracy": 75.76, "characteristics.good": 37880, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-large_224_1.0_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v3-large_224_1.0_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-large_224_1.0_float.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 13.3333, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "db651a74da1a4956", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 36431825, "90.00 percentile latency (ns)": 175026999, "90th percentile latency (ns)": 175026999, "95.00 percentile latency (ns)": 187267887, "97.00 percentile latency (ns)": 191344378, "99.00 percentile latency (ns)": 197712879, "99.90 percentile latency (ns)": 210563221, "Max latency (ns)": 223541360, "Mean latency (ns)": 65653870, "Min duration satisfied": "Yes", "Min latency (ns)": 25452903, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 15.22, "QPS w/o loadgen overhead": 15.23, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 175.026999, "characteristics.90th_percentile_latency_ns": 175026999.0, "characteristics.90th_percentile_latency_s": 0.175026999, "characteristics.90th_percentile_latency_us": 175026.999, "characteristics.accuracy": 65.75, "characteristics.good": 32875, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.5-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.5_224.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 14.2857, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "d42c6a80dc112fd1", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 11452855, "90.00 percentile latency (ns)": 13839854, "90th percentile latency (ns)": 13839854, "95.00 percentile latency (ns)": 21852507, "97.00 percentile latency (ns)": 32943390, "99.00 percentile latency (ns)": 82594100, "99.90 percentile latency (ns)": 108376746, "Max latency (ns)": 121321486, "Mean latency (ns)": 13625916, "Min duration satisfied": "Yes", "Min latency (ns)": 10658358, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 73.18, "QPS w/o loadgen overhead": 73.39, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 13.839854, "characteristics.90th_percentile_latency_ns": 13839854.0, "characteristics.90th_percentile_latency_s": 0.013839854, "characteristics.90th_percentile_latency_us": 13839.854, "characteristics.accuracy": 64.768, "characteristics.good": 32384, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-1.0-128-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-1.0-128-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_1.0_128_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 66.6667, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "7ad9c9ee38376716", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 44642272, "90.00 percentile latency (ns)": 147897162, "90th percentile latency (ns)": 147897162, "95.00 percentile latency (ns)": 192843801, "97.00 percentile latency (ns)": 201030289, "99.00 percentile latency (ns)": 209919503, "99.90 percentile latency (ns)": 221491487, "Max latency (ns)": 229554586, "Mean latency (ns)": 66022015, "Min duration satisfied": "Yes", "Min latency (ns)": 40152632, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 15.14, "QPS w/o loadgen overhead": 15.15, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 147.897162, "characteristics.90th_percentile_latency_ns": 147897162.0, "characteristics.90th_percentile_latency_s": 0.147897162, "characteristics.90th_percentile_latency_us": 147897.162, "characteristics.accuracy": 70.122, "characteristics.good": 35061, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.75-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.75_224.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 14.7059, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "13440b96b9a145cb", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 11227419, "90.00 percentile latency (ns)": 13519919, "90th percentile latency (ns)": 13519919, "95.00 percentile latency (ns)": 21320382, "97.00 percentile latency (ns)": 32095176, "99.00 percentile latency (ns)": 84510013, "99.90 percentile latency (ns)": 107174909, "Max latency (ns)": 121204556, "Mean latency (ns)": 13308576, "Min duration satisfied": "Yes", "Min latency (ns)": 10308968, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 74.95, "QPS w/o loadgen overhead": 75.14, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 13.519919, "characteristics.90th_percentile_latency_ns": 13519919.0, "characteristics.90th_percentile_latency_s": 0.013519919, "characteristics.90th_percentile_latency_us": 13519.919, "characteristics.accuracy": 64.08, "characteristics.good": 32040, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.75-160-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.75-160-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.75_160_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 66.6667, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "774392270a44eda5", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 20220711, "90.00 percentile latency (ns)": 88496231, "90th percentile latency (ns)": 88496231, "95.00 percentile latency (ns)": 159634421, "97.00 percentile latency (ns)": 174246441, "99.00 percentile latency (ns)": 184792827, "99.90 percentile latency (ns)": 197817499, "Max latency (ns)": 217539693, "Mean latency (ns)": 37623406, "Min duration satisfied": "Yes", "Min latency (ns)": 18862706, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 26.55, "QPS w/o loadgen overhead": 26.58, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 88.496231, "characteristics.90th_percentile_latency_ns": 88496231.0, "characteristics.90th_percentile_latency_s": 0.088496231, "characteristics.90th_percentile_latency_us": 88496.231, "characteristics.accuracy": 64.282, "characteristics.good": 32141, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-192-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.5-192-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.5_192.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 25.641, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "490b9b25e4250ca8", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 40584579, "90.00 percentile latency (ns)": 136763448, "90th percentile latency (ns)": 136763448, "95.00 percentile latency (ns)": 178781212, "97.00 percentile latency (ns)": 185917151, "99.00 percentile latency (ns)": 194406141, "99.90 percentile latency (ns)": 206307694, "Max latency (ns)": 212562703, "Mean latency (ns)": 61550240, "Min duration satisfied": "Yes", "Min latency (ns)": 37729919, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 16.24, "QPS w/o loadgen overhead": 16.25, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 136.763448, "characteristics.90th_percentile_latency_ns": 136763448.0, "characteristics.90th_percentile_latency_s": 0.136763448, "characteristics.90th_percentile_latency_us": 136763.448, "characteristics.accuracy": 72.678, "characteristics.good": 36339, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-large-minimalistic_224_1.0_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v3-large-minimalistic_224_1.0_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-large-minimalistic_224_1.0_float.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 13.5135, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "1f4d1928f4e48a29", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 13515873, "90.00 percentile latency (ns)": 15632213, "90th percentile latency (ns)": 15632213, "95.00 percentile latency (ns)": 26927257, "97.00 percentile latency (ns)": 38393193, "99.00 percentile latency (ns)": 78908592, "99.90 percentile latency (ns)": 182317462, "Max latency (ns)": 200299919, "Mean latency (ns)": 15952584, "Min duration satisfied": "Yes", "Min latency (ns)": 12071554, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 62.56, "QPS w/o loadgen overhead": 62.69, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 15.632213, "characteristics.90th_percentile_latency_ns": 15632213.0, "characteristics.90th_percentile_latency_s": 0.015632213, "characteristics.90th_percentile_latency_us": 15632.213, "characteristics.accuracy": 64.972, "characteristics.good": 32486, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-160-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.75-160-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_160_75.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 41.6667, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "4096a56d3372ece1", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 55579410, "90.00 percentile latency (ns)": 130705422, "90th percentile latency (ns)": 130705422, "95.00 percentile latency (ns)": 194662733, "97.00 percentile latency (ns)": 209757384, "99.00 percentile latency (ns)": 221322568, "99.90 percentile latency (ns)": 231422724, "Max latency (ns)": 241701021, "Mean latency (ns)": 72978069, "Min duration satisfied": "Yes", "Min latency (ns)": 50042207, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 13.7, "QPS w/o loadgen overhead": 13.7, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 130.705422, "characteristics.90th_percentile_latency_ns": 130705422.0, "characteristics.90th_percentile_latency_s": 0.130705422, "characteristics.90th_percentile_latency_us": 130705.422, "characteristics.accuracy": 71.77, "characteristics.good": 35885, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-1.0-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_1.0_224.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 11.4943, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "f8624f4f979376bf", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 28104014, "90.00 percentile latency (ns)": 167782405, "90th percentile latency (ns)": 167782405, "95.00 percentile latency (ns)": 184891050, "97.00 percentile latency (ns)": 189879478, "99.00 percentile latency (ns)": 196898045, "99.90 percentile latency (ns)": 207462820, "Max latency (ns)": 224065580, "Mean latency (ns)": 57069109, "Min duration satisfied": "Yes", "Min latency (ns)": 22335162, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 17.51, "QPS w/o loadgen overhead": 17.52, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 167.782405, "characteristics.90th_percentile_latency_ns": 167782405.0, "characteristics.90th_percentile_latency_s": 0.167782405, "characteristics.90th_percentile_latency_us": 167782.405, "characteristics.accuracy": 66.75, "characteristics.good": 33375, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-160-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.75-160-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.75_160.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 21.2766, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "0a193b23917ab66f", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 10114420, "90.00 percentile latency (ns)": 74626215, "90th percentile latency (ns)": 74626215, "95.00 percentile latency (ns)": 100134153, "97.00 percentile latency (ns)": 119094772, "99.00 percentile latency (ns)": 140332201, "99.90 percentile latency (ns)": 159598885, "Max latency (ns)": 174876717, "Mean latency (ns)": 25676260, "Min duration satisfied": "Yes", "Min latency (ns)": 6165537, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 38.86, "QPS w/o loadgen overhead": 38.95, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 74.626215, "characteristics.90th_percentile_latency_ns": 74626215.0, "characteristics.90th_percentile_latency_s": 0.074626215, "characteristics.90th_percentile_latency_us": 74626.215, "characteristics.accuracy": 47.14, "characteristics.good": 23570, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-96-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.35-96-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.35_96.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 71.4286, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "9845c9824d666dae", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 18858132, "90.00 percentile latency (ns)": 146217739, "90th percentile latency (ns)": 146217739, "95.00 percentile latency (ns)": 163071607, "97.00 percentile latency (ns)": 169737105, "99.00 percentile latency (ns)": 178508725, "99.90 percentile latency (ns)": 191660267, "Max latency (ns)": 239562484, "Mean latency (ns)": 46976665, "Min duration satisfied": "Yes", "Min latency (ns)": 11400664, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 21.26, "QPS w/o loadgen overhead": 21.29, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 146.217739, "characteristics.90th_percentile_latency_ns": 146217739.0, "characteristics.90th_percentile_latency_s": 0.146217739, "characteristics.90th_percentile_latency_us": 146217.739, "characteristics.accuracy": 56.988, "characteristics.good": 28494, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-160-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.35-160-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.35_160.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 18.5185, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "1e9a40da94c22bfc", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 31269880, "90.00 percentile latency (ns)": 105890323, "90th percentile latency (ns)": 105890323, "95.00 percentile latency (ns)": 109653984, "97.00 percentile latency (ns)": 111758649, "99.00 percentile latency (ns)": 115922671, "99.90 percentile latency (ns)": 124626965, "Max latency (ns)": 141015695, "Mean latency (ns)": 50104368, "Min duration satisfied": "Yes", "Min latency (ns)": 15566977, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 19.93, "QPS w/o loadgen overhead": 19.96, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 105.890323, "characteristics.90th_percentile_latency_ns": 105890323.0, "characteristics.90th_percentile_latency_s": 0.105890323, "characteristics.90th_percentile_latency_us": 105890.323, "characteristics.accuracy": 63.716, "characteristics.good": 31858, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.75-128-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.75-128-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.75_128.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 17.2414, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "47d2b5a2664ade75", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 6553749, "90.00 percentile latency (ns)": 7134169, "90th percentile latency (ns)": 7134169, "95.00 percentile latency (ns)": 8682334, "97.00 percentile latency (ns)": 10252375, "99.00 percentile latency (ns)": 34875174, "99.90 percentile latency (ns)": 164025206, "Max latency (ns)": 192250966, "Mean latency (ns)": 7629007, "Min duration satisfied": "Yes", "Min latency (ns)": 5639085, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 130.49, "QPS w/o loadgen overhead": 131.08, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 7.134169, "characteristics.90th_percentile_latency_ns": 7134169.0, "characteristics.90th_percentile_latency_s": 0.007134169, "characteristics.90th_percentile_latency_us": 7134.169, "characteristics.accuracy": 55.54, "characteristics.good": 27770, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-128-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.5-128-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_128_50.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 125, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "6eefb664482a3a5f", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 21515470, "90.00 percentile latency (ns)": 148947822, "90th percentile latency (ns)": 148947822, "95.00 percentile latency (ns)": 168945597, "97.00 percentile latency (ns)": 174662026, "99.00 percentile latency (ns)": 181346891, "99.90 percentile latency (ns)": 192841867, "Max latency (ns)": 203763581, "Mean latency (ns)": 49312902, "Min duration satisfied": "Yes", "Min latency (ns)": 14944785, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 20.26, "QPS w/o loadgen overhead": 20.28, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 148.947822, "characteristics.90th_percentile_latency_ns": 148947822.0, "characteristics.90th_percentile_latency_s": 0.148947822, "characteristics.90th_percentile_latency_us": 148947.822, "characteristics.accuracy": 59.322, "characteristics.good": 29661, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-192-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.35-192-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.35_192.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 15.625, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "3c9d89f66f3dbbf6", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 34575341, "90.00 percentile latency (ns)": 35067145, "90th percentile latency (ns)": 35067145, "95.00 percentile latency (ns)": 36570177, "97.00 percentile latency (ns)": 46531923, "99.00 percentile latency (ns)": 60195429, "99.90 percentile latency (ns)": 109382166, "Max latency (ns)": 124320023, "Mean latency (ns)": 35460325, "Min duration satisfied": "Yes", "Min latency (ns)": 33674769, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 28.18, "QPS w/o loadgen overhead": 28.2, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 35.067145, "characteristics.90th_percentile_latency_ns": 35067145.0, "characteristics.90th_percentile_latency_s": 0.035067145, "characteristics.90th_percentile_latency_us": 35067.145, "characteristics.accuracy": 68.242, "characteristics.good": 34121, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.75-192-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.75-192-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.75_192.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 27.027, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "03aff81349405e7d", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 41990312, "90.00 percentile latency (ns)": 42502252, "90th percentile latency (ns)": 42502252, "95.00 percentile latency (ns)": 44559768, "97.00 percentile latency (ns)": 60733015, "99.00 percentile latency (ns)": 71329224, "99.90 percentile latency (ns)": 156436018, "Max latency (ns)": 169781847, "Mean latency (ns)": 43189394, "Min duration satisfied": "Yes", "Min latency (ns)": 41064835, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 23.14, "QPS w/o loadgen overhead": 23.15, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 42.502252, "characteristics.90th_percentile_latency_ns": 42502252.0, "characteristics.90th_percentile_latency_s": 0.042502252, "characteristics.90th_percentile_latency_us": 42502.252, "characteristics.accuracy": 70.738, "characteristics.good": 35369, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-192-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-1.0-192-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_1.0_192.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 22.2222, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "2247e2a2bc750c69", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 162092451, "90.00 percentile latency (ns)": 182694593, "90th percentile latency (ns)": 182694593, "95.00 percentile latency (ns)": 185520236, "97.00 percentile latency (ns)": 187028054, "99.00 percentile latency (ns)": 196597234, "99.90 percentile latency (ns)": 299178325, "Max latency (ns)": 307633662, "Mean latency (ns)": 165746355, "Min duration satisfied": "Yes", "Min latency (ns)": 160430275, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 6.03, "QPS w/o loadgen overhead": 6.03, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 182.694593, "characteristics.90th_percentile_latency_ns": 182694593.0, "characteristics.90th_percentile_latency_s": 0.182694593, "characteristics.90th_percentile_latency_us": 182694.593, "characteristics.accuracy": 78.514, "characteristics.good": 39257, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite4-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "efficientnet-lite4-quantized", "input_data_types": "uint8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite4.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 5.91716, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "b14516b9630a939c", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 12042603, "90.00 percentile latency (ns)": 12822551, "90th percentile latency (ns)": 12822551, "95.00 percentile latency (ns)": 13038380, "97.00 percentile latency (ns)": 13163692, "99.00 percentile latency (ns)": 29963640, "99.90 percentile latency (ns)": 47836677, "Max latency (ns)": 129364113, "Mean latency (ns)": 12546515, "Min duration satisfied": "Yes", "Min latency (ns)": 11146085, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 79.5, "QPS w/o loadgen overhead": 79.7, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 12.822551, "characteristics.90th_percentile_latency_ns": 12822551.0, "characteristics.90th_percentile_latency_s": 0.012822551, "characteristics.90th_percentile_latency_us": 12822.551, "characteristics.accuracy": 63.542, "characteristics.good": 31771, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-224-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.5-224-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_224_50.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 76.9231, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "c108b9502704c409", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 8427168, "90.00 percentile latency (ns)": 8959461, "90th percentile latency (ns)": 8959461, "95.00 percentile latency (ns)": 9105531, "97.00 percentile latency (ns)": 9241173, "99.00 percentile latency (ns)": 12785740, "99.90 percentile latency (ns)": 44216719, "Max latency (ns)": 121545854, "Mean latency (ns)": 8737590, "Min duration satisfied": "Yes", "Min latency (ns)": 7565002, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 113.88, "QPS w/o loadgen overhead": 114.45, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 8.959461, "characteristics.90th_percentile_latency_ns": 8959461.0, "characteristics.90th_percentile_latency_s": 0.008959461, "characteristics.90th_percentile_latency_us": 8959.461, "characteristics.accuracy": 52.172, "characteristics.good": 26086, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-128-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.35-128-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.35_128.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 111.111, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "b01db0f5ca5e4173", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 10233682, "90.00 percentile latency (ns)": 10890783, "90th percentile latency (ns)": 10890783, "95.00 percentile latency (ns)": 11004552, "97.00 percentile latency (ns)": 11090738, "99.00 percentile latency (ns)": 18851660, "99.90 percentile latency (ns)": 49247363, "Max latency (ns)": 127791980, "Mean latency (ns)": 10655567, "Min duration satisfied": "Yes", "Min latency (ns)": 9430542, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 93.56, "QPS w/o loadgen overhead": 93.85, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 10.890783, "characteristics.90th_percentile_latency_ns": 10890783.0, "characteristics.90th_percentile_latency_s": 0.010890783, "characteristics.90th_percentile_latency_us": 10890.783, "characteristics.accuracy": 58.402, "characteristics.good": 29201, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-128-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.5-128-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.5_128.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 90.9091, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "9ed3246f2942aae6", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 21720922, "90.00 percentile latency (ns)": 22050171, "90th percentile latency (ns)": 22050171, "95.00 percentile latency (ns)": 22268965, "97.00 percentile latency (ns)": 23652768, "99.00 percentile latency (ns)": 50511591, "99.90 percentile latency (ns)": 95245518, "Max latency (ns)": 149496854, "Mean latency (ns)": 22385494, "Min duration satisfied": "Yes", "Min latency (ns)": 21079696, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 44.63, "QPS w/o loadgen overhead": 44.67, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 22.050171, "characteristics.90th_percentile_latency_ns": 22050171.0, "characteristics.90th_percentile_latency_s": 0.022050171, "characteristics.90th_percentile_latency_us": 22050.171, "characteristics.accuracy": 60.976, "characteristics.good": 30488, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.35-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.35_224.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 43.4783, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "03644b8936bd1266", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 3974564, "90.00 percentile latency (ns)": 4691901, "90th percentile latency (ns)": 4691901, "95.00 percentile latency (ns)": 4863156, "97.00 percentile latency (ns)": 4949507, "99.00 percentile latency (ns)": 5169205, "99.90 percentile latency (ns)": 36868462, "Max latency (ns)": 77357768, "Mean latency (ns)": 4222208, "Min duration satisfied": "Yes", "Min latency (ns)": 3406576, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 234.76, "QPS w/o loadgen overhead": 236.84, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 4.691901, "characteristics.90th_percentile_latency_ns": 4691901.0, "characteristics.90th_percentile_latency_s": 0.004691901, "characteristics.90th_percentile_latency_us": 4691.901, "characteristics.accuracy": 48.162, "characteristics.good": 24081, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.25-192-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.25-192-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.25_192_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 250, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "ff496ae5be180e7e", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 67664091, "90.00 percentile latency (ns)": 68728100, "90th percentile latency (ns)": 68728100, "95.00 percentile latency (ns)": 82694627, "97.00 percentile latency (ns)": 92542461, "99.00 percentile latency (ns)": 96499362, "99.90 percentile latency (ns)": 184719690, "Max latency (ns)": 192401399, "Mean latency (ns)": 69408019, "Min duration satisfied": "Yes", "Min latency (ns)": 66203908, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 14.4, "QPS w/o loadgen overhead": 14.41, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 68.7281, "characteristics.90th_percentile_latency_ns": 68728100.0, "characteristics.90th_percentile_latency_s": 0.0687281, "characteristics.90th_percentile_latency_us": 68728.1, "characteristics.accuracy": 75.068, "characteristics.good": 37534, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite0-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "efficientnet-lite0-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite0.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 14.2857, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "3dfcf56442eacecc", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 5170703, "90.00 percentile latency (ns)": 5760347, "90th percentile latency (ns)": 5760347, "95.00 percentile latency (ns)": 5845417, "97.00 percentile latency (ns)": 5987713, "99.00 percentile latency (ns)": 6366979, "99.90 percentile latency (ns)": 38316674, "Max latency (ns)": 81320842, "Mean latency (ns)": 5420017, "Min duration satisfied": "Yes", "Min latency (ns)": 4491685, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 182.93, "QPS w/o loadgen overhead": 184.5, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 5.760347, "characteristics.90th_percentile_latency_ns": 5760347.0, "characteristics.90th_percentile_latency_s": 0.005760347, "characteristics.90th_percentile_latency_us": 5760.347, "characteristics.accuracy": 50.242, "characteristics.good": 25121, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.25-224-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.25-224-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.25_224_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 142.857, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "cec4c4db0b00a5b1", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 14559803, "90.00 percentile latency (ns)": 14886336, "90th percentile latency (ns)": 14886336, "95.00 percentile latency (ns)": 15050347, "97.00 percentile latency (ns)": 15399911, "99.00 percentile latency (ns)": 36829958, "99.90 percentile latency (ns)": 72604231, "Max latency (ns)": 98686002, "Mean latency (ns)": 14981959, "Min duration satisfied": "Yes", "Min latency (ns)": 13866986, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 66.65, "QPS w/o loadgen overhead": 66.75, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 14.886336, "characteristics.90th_percentile_latency_ns": 14886336.0, "characteristics.90th_percentile_latency_s": 0.014886336, "characteristics.90th_percentile_latency_us": 14886.336, "characteristics.accuracy": 60.842, "characteristics.good": 30421, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.5-160-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.5-160-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.5_160.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 66.6667, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "f5ff888cc4483d96", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 31831370, "90.00 percentile latency (ns)": 32344671, "90th percentile latency (ns)": 32344671, "95.00 percentile latency (ns)": 32948824, "97.00 percentile latency (ns)": 42498263, "99.00 percentile latency (ns)": 61671090, "99.90 percentile latency (ns)": 132842784, "Max latency (ns)": 166811257, "Mean latency (ns)": 32789503, "Min duration satisfied": "Yes", "Min latency (ns)": 31003200, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 30.48, "QPS w/o loadgen overhead": 30.5, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 32.344671, "characteristics.90th_percentile_latency_ns": 32344671.0, "characteristics.90th_percentile_latency_s": 0.032344671, "characteristics.90th_percentile_latency_us": 32344.671, "characteristics.accuracy": 69.016, "characteristics.good": 34508, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-160-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-1.0-160-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_1.0_160.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 28.5714, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "2305946999f68a32", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 46756209, "90.00 percentile latency (ns)": 47387771, "90th percentile latency (ns)": 47387771, "95.00 percentile latency (ns)": 50937863, "97.00 percentile latency (ns)": 72091760, "99.00 percentile latency (ns)": 76413065, "99.90 percentile latency (ns)": 164039828, "Max latency (ns)": 196242063, "Mean latency (ns)": 48023536, "Min duration satisfied": "Yes", "Min latency (ns)": 45416955, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 20.81, "QPS w/o loadgen overhead": 20.82, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 47.387771, "characteristics.90th_percentile_latency_ns": 47387771.0, "characteristics.90th_percentile_latency_s": 0.047387771, "characteristics.90th_percentile_latency_us": 47387.771, "characteristics.accuracy": 74.098, "characteristics.good": 37049, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite1-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "efficientnet-lite1-quantized", "input_data_types": "uint8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite1.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 20.4082, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "a4be69403c86f081", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 9300569, "90.00 percentile latency (ns)": 9839735, "90th percentile latency (ns)": 9839735, "95.00 percentile latency (ns)": 9986101, "97.00 percentile latency (ns)": 10103655, "99.00 percentile latency (ns)": 15433810, "99.90 percentile latency (ns)": 45212863, "Max latency (ns)": 129642837, "Mean latency (ns)": 9677034, "Min duration satisfied": "Yes", "Min latency (ns)": 8551982, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 103.06, "QPS w/o loadgen overhead": 103.34, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 9.839735, "characteristics.90th_percentile_latency_ns": 9839735.0, "characteristics.90th_percentile_latency_s": 0.009839735, "characteristics.90th_percentile_latency_us": 9839.735, "characteristics.accuracy": 61.924, "characteristics.good": 30962, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-192-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.5-192-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_192_50.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 90.9091, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "75b44388988c730e", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 10450859, "90.00 percentile latency (ns)": 11085027, "90th percentile latency (ns)": 11085027, "95.00 percentile latency (ns)": 11202529, "97.00 percentile latency (ns)": 11436019, "99.00 percentile latency (ns)": 23366240, "99.90 percentile latency (ns)": 50006687, "Max latency (ns)": 92572933, "Mean latency (ns)": 10865066, "Min duration satisfied": "Yes", "Min latency (ns)": 9721962, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 91.76, "QPS w/o loadgen overhead": 92.04, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 11.085027, "characteristics.90th_percentile_latency_ns": 11085027.0, "characteristics.90th_percentile_latency_s": 0.011085027, "characteristics.90th_percentile_latency_us": 11085.027, "characteristics.accuracy": 62.298, "characteristics.good": 31149, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.5-224-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.5-224-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.5_224_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 76.9231, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "dbed5c8f42c4a5f4", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 4164915, "90.00 percentile latency (ns)": 4799920, "90th percentile latency (ns)": 4799920, "95.00 percentile latency (ns)": 4964637, "97.00 percentile latency (ns)": 5107283, "99.00 percentile latency (ns)": 5385924, "99.90 percentile latency (ns)": 37704345, "Max latency (ns)": 118063193, "Mean latency (ns)": 4423729, "Min duration satisfied": "Yes", "Min latency (ns)": 3733480, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 223.93, "QPS w/o loadgen overhead": 226.05, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 4.79992, "characteristics.90th_percentile_latency_ns": 4799920.0, "characteristics.90th_percentile_latency_s": 0.00479992, "characteristics.90th_percentile_latency_us": 4799.92, "characteristics.accuracy": 49.12, "characteristics.good": 24560, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-128-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.35-128-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_128_35.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 200, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "b411d468995cf37e", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 39569493, "90.00 percentile latency (ns)": 40158040, "90th percentile latency (ns)": 40158040, "95.00 percentile latency (ns)": 40961886, "97.00 percentile latency (ns)": 57958025, "99.00 percentile latency (ns)": 67856257, "99.90 percentile latency (ns)": 133270824, "Max latency (ns)": 169298856, "Mean latency (ns)": 40634399, "Min duration satisfied": "Yes", "Min latency (ns)": 38249700, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 24.59, "QPS w/o loadgen overhead": 24.61, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 40.15804, "characteristics.90th_percentile_latency_ns": 40158040.0, "characteristics.90th_percentile_latency_s": 0.04015804, "characteristics.90th_percentile_latency_us": 40158.04, "characteristics.accuracy": 73.584, "characteristics.good": 36792, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.4-224-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-1.4-224-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_224_140.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 24.3902, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "61619306487e8277", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 28523266, "90.00 percentile latency (ns)": 29170159, "90th percentile latency (ns)": 29170159, "95.00 percentile latency (ns)": 29445384, "97.00 percentile latency (ns)": 36745900, "99.00 percentile latency (ns)": 54293374, "99.90 percentile latency (ns)": 100987466, "Max latency (ns)": 129260598, "Mean latency (ns)": 29323948, "Min duration satisfied": "Yes", "Min latency (ns)": 27540484, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 34.07, "QPS w/o loadgen overhead": 34.1, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 29.170159, "characteristics.90th_percentile_latency_ns": 29170159.0, "characteristics.90th_percentile_latency_s": 0.029170159, "characteristics.90th_percentile_latency_us": 29170.159, "characteristics.accuracy": 70.772, "characteristics.good": 35386, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-1.0-224-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-1.0-224-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_1.0_224_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 32.2581, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "584d71405458c975", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 7198060, "90.00 percentile latency (ns)": 7441224, "90th percentile latency (ns)": 7441224, "95.00 percentile latency (ns)": 7528257, "97.00 percentile latency (ns)": 7596182, "99.00 percentile latency (ns)": 8960806, "99.90 percentile latency (ns)": 41811556, "Max latency (ns)": 81812146, "Mean latency (ns)": 7422100, "Min duration satisfied": "Yes", "Min latency (ns)": 6579164, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 134.39, "QPS w/o loadgen overhead": 134.73, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 7.441224, "characteristics.90th_percentile_latency_ns": 7441224.0, "characteristics.90th_percentile_latency_s": 0.007441224, "characteristics.90th_percentile_latency_us": 7441.224, "characteristics.accuracy": 47.808, "characteristics.good": 23904, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.25-160-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.25-160-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.25_160.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 125, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "4dd5bb84d313bef0", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 16766070, "90.00 percentile latency (ns)": 17421359, "90th percentile latency (ns)": 17421359, "95.00 percentile latency (ns)": 17622700, "97.00 percentile latency (ns)": 18065109, "99.00 percentile latency (ns)": 42251845, "99.90 percentile latency (ns)": 76600673, "Max latency (ns)": 150810689, "Mean latency (ns)": 17346805, "Min duration satisfied": "Yes", "Min latency (ns)": 15801037, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 57.53, "QPS w/o loadgen overhead": 57.65, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 17.421359, "characteristics.90th_percentile_latency_ns": 17421359.0, "characteristics.90th_percentile_latency_s": 0.017421359, "characteristics.90th_percentile_latency_us": 17421.359, "characteristics.accuracy": 64.038, "characteristics.good": 32019, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-128-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.75-128-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.75_128.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 55.5556, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "2ca2713d516593d7", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 13421761, "90.00 percentile latency (ns)": 13698625, "90th percentile latency (ns)": 13698625, "95.00 percentile latency (ns)": 13804327, "97.00 percentile latency (ns)": 14021989, "99.00 percentile latency (ns)": 35096555, "99.90 percentile latency (ns)": 67775585, "Max latency (ns)": 97925574, "Mean latency (ns)": 13829230, "Min duration satisfied": "Yes", "Min latency (ns)": 12819050, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 72.2, "QPS w/o loadgen overhead": 72.31, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 13.698625, "characteristics.90th_percentile_latency_ns": 13698625.0, "characteristics.90th_percentile_latency_s": 0.013698625, "characteristics.90th_percentile_latency_us": 13698.625, "characteristics.accuracy": 51.848, "characteristics.good": 25924, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.25-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.25-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.25_224.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 71.4286, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "b2e9a919c2e5f006", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 7328832, "90.00 percentile latency (ns)": 7960636, "90th percentile latency (ns)": 7960636, "95.00 percentile latency (ns)": 8134555, "97.00 percentile latency (ns)": 8260674, "99.00 percentile latency (ns)": 9970528, "99.90 percentile latency (ns)": 40666120, "Max latency (ns)": 118481831, "Mean latency (ns)": 7646349, "Min duration satisfied": "Yes", "Min latency (ns)": 6610371, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 130.24, "QPS w/o loadgen overhead": 130.78, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 7.960636, "characteristics.90th_percentile_latency_ns": 7960636.0, "characteristics.90th_percentile_latency_s": 0.007960636, "characteristics.90th_percentile_latency_us": 7960.636, "characteristics.accuracy": 59.226, "characteristics.good": 29613, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-160-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.5-160-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_160_50.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 125, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "f887ca2f69f7eabd", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 15872213, "90.00 percentile latency (ns)": 16442220, "90th percentile latency (ns)": 16442220, "95.00 percentile latency (ns)": 16640545, "97.00 percentile latency (ns)": 16966543, "99.00 percentile latency (ns)": 38451482, "99.90 percentile latency (ns)": 74839651, "Max latency (ns)": 90416649, "Mean latency (ns)": 16395777, "Min duration satisfied": "Yes", "Min latency (ns)": 15057858, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 60.89, "QPS w/o loadgen overhead": 60.99, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 16.44222, "characteristics.90th_percentile_latency_ns": 16442220.0, "characteristics.90th_percentile_latency_s": 0.01644222, "characteristics.90th_percentile_latency_us": 16442.22, "characteristics.accuracy": 68.248, "characteristics.good": 34124, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-1.0-160-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-1.0-160-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_1.0_160_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 55.5556, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "48f6ba87b5ebccbd", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 6415153, "90.00 percentile latency (ns)": 7121232, "90th percentile latency (ns)": 7121232, "95.00 percentile latency (ns)": 7270980, "97.00 percentile latency (ns)": 7406394, "99.00 percentile latency (ns)": 8449677, "99.90 percentile latency (ns)": 40466557, "Max latency (ns)": 122506380, "Mean latency (ns)": 6763174, "Min duration satisfied": "Yes", "Min latency (ns)": 5856571, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 147.04, "QPS w/o loadgen overhead": 147.86, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 7.121232, "characteristics.90th_percentile_latency_ns": 7121232.0, "characteristics.90th_percentile_latency_s": 0.007121232, "characteristics.90th_percentile_latency_us": 7121.232, "characteristics.accuracy": 59.12, "characteristics.good": 29560, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-96-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-1.0-96-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_96_100.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 142.857, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "feb9026432bb06d0", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 7014627, "90.00 percentile latency (ns)": 7665856, "90th percentile latency (ns)": 7665856, "95.00 percentile latency (ns)": 7795516, "97.00 percentile latency (ns)": 7934297, "99.00 percentile latency (ns)": 11482872, "99.90 percentile latency (ns)": 40186819, "Max latency (ns)": 85614421, "Mean latency (ns)": 7342133, "Min duration satisfied": "Yes", "Min latency (ns)": 6463637, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 135.54, "QPS w/o loadgen overhead": 136.2, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 7.665856, "characteristics.90th_percentile_latency_ns": 7665856.0, "characteristics.90th_percentile_latency_s": 0.007665856, "characteristics.90th_percentile_latency_us": 7665.856, "characteristics.accuracy": 58.46, "characteristics.good": 29230, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.75-128-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.75-128-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.75_128_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 125, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "33d324e8a80460a6", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 26387339, "90.00 percentile latency (ns)": 27060358, "90th percentile latency (ns)": 27060358, "95.00 percentile latency (ns)": 27372410, "97.00 percentile latency (ns)": 31150265, "99.00 percentile latency (ns)": 54631213, "99.90 percentile latency (ns)": 107314416, "Max latency (ns)": 148023456, "Mean latency (ns)": 27203248, "Min duration satisfied": "Yes", "Min latency (ns)": 25360967, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 36.71, "QPS w/o loadgen overhead": 36.76, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 27.060358, "characteristics.90th_percentile_latency_ns": 27060358.0, "characteristics.90th_percentile_latency_s": 0.027060358, "characteristics.90th_percentile_latency_us": 27060.358, "characteristics.accuracy": 72.91, "characteristics.good": 36455, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-large_224_1.0_uint8", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v3-large_224_1.0_uint8", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-large_224_1.0_uint8.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 35.7143, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "48f91523c14e3694", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 24031350, "90.00 percentile latency (ns)": 24679691, "90th percentile latency (ns)": 24679691, "95.00 percentile latency (ns)": 25015696, "97.00 percentile latency (ns)": 27186625, "99.00 percentile latency (ns)": 52576458, "99.90 percentile latency (ns)": 102878653, "Max latency (ns)": 156155783, "Mean latency (ns)": 24821674, "Min duration satisfied": "Yes", "Min latency (ns)": 23307981, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 40.23, "QPS w/o loadgen overhead": 40.29, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 24.679691, "characteristics.90th_percentile_latency_ns": 24679691.0, "characteristics.90th_percentile_latency_s": 0.024679691, "characteristics.90th_percentile_latency_us": 24679.691, "characteristics.accuracy": 70.542, "characteristics.good": 35271, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-224-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-1.0-224-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_224_100.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 38.4615, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "723742ce475fa7be", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 7443421, "90.00 percentile latency (ns)": 7991429, "90th percentile latency (ns)": 7991429, "95.00 percentile latency (ns)": 8106403, "97.00 percentile latency (ns)": 8232666, "99.00 percentile latency (ns)": 10562265, "99.90 percentile latency (ns)": 41953602, "Max latency (ns)": 123320932, "Mean latency (ns)": 7757026, "Min duration satisfied": "Yes", "Min latency (ns)": 6706114, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 128.36, "QPS w/o loadgen overhead": 128.92, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 7.991429, "characteristics.90th_percentile_latency_ns": 7991429.0, "characteristics.90th_percentile_latency_s": 0.007991429, "characteristics.90th_percentile_latency_us": 7991.429, "characteristics.accuracy": 56.594, "characteristics.good": 28297, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-192-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.35-192-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_192_35.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 111.111, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "63c8b861a6408fa0", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 13599398, "90.00 percentile latency (ns)": 14252029, "90th percentile latency (ns)": 14252029, "95.00 percentile latency (ns)": 14472820, "97.00 percentile latency (ns)": 14626802, "99.00 percentile latency (ns)": 36730180, "99.90 percentile latency (ns)": 52897911, "Max latency (ns)": 137741048, "Mean latency (ns)": 14112140, "Min duration satisfied": "Yes", "Min latency (ns)": 12747671, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 70.72, "QPS w/o loadgen overhead": 70.86, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 14.252029, "characteristics.90th_percentile_latency_ns": 14252029.0, "characteristics.90th_percentile_latency_s": 0.014252029, "characteristics.90th_percentile_latency_us": 14252.029, "characteristics.accuracy": 67.82, "characteristics.good": 33910, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-160-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-1.0-160-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_160_100.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 66.6667, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "6f31dd4c4fa5ae91", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 4710108, "90.00 percentile latency (ns)": 5222671, "90th percentile latency (ns)": 5222671, "95.00 percentile latency (ns)": 5438481, "97.00 percentile latency (ns)": 5551312, "99.00 percentile latency (ns)": 6221706, "99.90 percentile latency (ns)": 39752852, "Max latency (ns)": 82402588, "Mean latency (ns)": 4922644, "Min duration satisfied": "Yes", "Min latency (ns)": 4096213, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 201.52, "QPS w/o loadgen overhead": 203.14, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 5.222671, "characteristics.90th_percentile_latency_ns": 5222671.0, "characteristics.90th_percentile_latency_s": 0.005222671, "characteristics.90th_percentile_latency_us": 5222.671, "characteristics.accuracy": 44.116, "characteristics.good": 22058, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.25-128-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.25-128-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.25_128.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 200, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "67aa4e3a8e8e45c5", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 2984470, "90.00 percentile latency (ns)": 3590441, "90th percentile latency (ns)": 3590441, "95.00 percentile latency (ns)": 3745604, "97.00 percentile latency (ns)": 3935710, "99.00 percentile latency (ns)": 4146539, "99.90 percentile latency (ns)": 35560513, "Max latency (ns)": 72447002, "Mean latency (ns)": 3173152, "Min duration satisfied": "Yes", "Min latency (ns)": 2506276, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 311.24, "QPS w/o loadgen overhead": 315.14, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 3.590441, "characteristics.90th_percentile_latency_ns": 3590441.0, "characteristics.90th_percentile_latency_s": 0.003590441, "characteristics.90th_percentile_latency_us": 3590.441, "characteristics.accuracy": 45.494, "characteristics.good": 22747, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.25-160-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.25-160-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.25_160_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 250, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "f71b0e2ae4e91aac", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 52569062, "90.00 percentile latency (ns)": 53315044, "90th percentile latency (ns)": 53315044, "95.00 percentile latency (ns)": 61573380, "97.00 percentile latency (ns)": 69989332, "99.00 percentile latency (ns)": 78454509, "99.90 percentile latency (ns)": 132094300, "Max latency (ns)": 153030446, "Mean latency (ns)": 53791603, "Min duration satisfied": "Yes", "Min latency (ns)": 51267942, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 18.58, "QPS w/o loadgen overhead": 18.59, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 53.315044, "characteristics.90th_percentile_latency_ns": 53315044.0, "characteristics.90th_percentile_latency_s": 0.053315044, "characteristics.90th_percentile_latency_us": 53315.044, "characteristics.accuracy": 70.626, "characteristics.good": 35313, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-1.0-192-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-1.0-192-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_1.0_192.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 17.8571, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "5abaf1f07ff49f8a", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 9338868, "90.00 percentile latency (ns)": 9898754, "90th percentile latency (ns)": 9898754, "95.00 percentile latency (ns)": 10043472, "97.00 percentile latency (ns)": 10165187, "99.00 percentile latency (ns)": 16680091, "99.90 percentile latency (ns)": 45878728, "Max latency (ns)": 142598327, "Mean latency (ns)": 9724423, "Min duration satisfied": "Yes", "Min latency (ns)": 8629957, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 102.52, "QPS w/o loadgen overhead": 102.83, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 9.898754, "characteristics.90th_percentile_latency_ns": 9898754.0, "characteristics.90th_percentile_latency_s": 0.009898754, "characteristics.90th_percentile_latency_us": 9898.754, "characteristics.accuracy": 63.454, "characteristics.good": 31727, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-128-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-1.0-128-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_128_100.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 90.9091, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "6f35ae4104804a95", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 21434494, "90.00 percentile latency (ns)": 22059354, "90th percentile latency (ns)": 22059354, "95.00 percentile latency (ns)": 22327123, "97.00 percentile latency (ns)": 23871663, "99.00 percentile latency (ns)": 47152124, "99.90 percentile latency (ns)": 82661789, "Max latency (ns)": 112760963, "Mean latency (ns)": 22069422, "Min duration satisfied": "Yes", "Min latency (ns)": 20505149, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 45.2, "QPS w/o loadgen overhead": 45.31, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 22.059354, "characteristics.90th_percentile_latency_ns": 22059354.0, "characteristics.90th_percentile_latency_s": 0.022059354, "characteristics.90th_percentile_latency_us": 22059.354, "characteristics.accuracy": 70.04, "characteristics.good": 35020, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-1.0-192-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-1.0-192-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_1.0_192_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 43.4783, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "417db323bba91d3a", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 63829267, "90.00 percentile latency (ns)": 64608132, "90th percentile latency (ns)": 64608132, "95.00 percentile latency (ns)": 81285867, "97.00 percentile latency (ns)": 88853366, "99.00 percentile latency (ns)": 91467600, "99.90 percentile latency (ns)": 184169896, "Max latency (ns)": 214979046, "Mean latency (ns)": 65449195, "Min duration satisfied": "Yes", "Min latency (ns)": 62406231, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 15.27, "QPS w/o loadgen overhead": 15.28, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 64.608132, "characteristics.90th_percentile_latency_ns": 64608132.0, "characteristics.90th_percentile_latency_s": 0.064608132, "characteristics.90th_percentile_latency_us": 64608.132, "characteristics.accuracy": 74.124, "characteristics.good": 37062, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite2-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "efficientnet-lite2-quantized", "input_data_types": "uint8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite2.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 14.9254, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "1daf368f7c4c9690", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 5990726, "90.00 percentile latency (ns)": 6638291, "90th percentile latency (ns)": 6638291, "95.00 percentile latency (ns)": 6757048, "97.00 percentile latency (ns)": 6882059, "99.00 percentile latency (ns)": 7858596, "99.90 percentile latency (ns)": 39165756, "Max latency (ns)": 79187662, "Mean latency (ns)": 6278313, "Min duration satisfied": "Yes", "Min latency (ns)": 5434438, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 158.36, "QPS w/o loadgen overhead": 159.28, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 6.638291, "characteristics.90th_percentile_latency_ns": 6638291.0, "characteristics.90th_percentile_latency_s": 0.006638291, "characteristics.90th_percentile_latency_us": 6638.291, "characteristics.accuracy": 59.444, "characteristics.good": 29722, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.5-160-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.5-160-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.5_160_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 142.857, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "2adc115d893a4cfe", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 8056815, "90.00 percentile latency (ns)": 8755910, "90th percentile latency (ns)": 8755910, "95.00 percentile latency (ns)": 8900888, "97.00 percentile latency (ns)": 8998942, "99.00 percentile latency (ns)": 13753866, "99.90 percentile latency (ns)": 41350696, "Max latency (ns)": 86070410, "Mean latency (ns)": 8419986, "Min duration satisfied": "Yes", "Min latency (ns)": 7341608, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 118.38, "QPS w/o loadgen overhead": 118.77, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 8.75591, "characteristics.90th_percentile_latency_ns": 8755910.0, "characteristics.90th_percentile_latency_s": 0.00875591, "characteristics.90th_percentile_latency_us": 8755.91, "characteristics.accuracy": 61.456, "characteristics.good": 30728, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.5-192-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.5-192-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.5_192_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 111.111, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "cc8a74c4b82bbaa9", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 9595900, "90.00 percentile latency (ns)": 10214761, "90th percentile latency (ns)": 10214761, "95.00 percentile latency (ns)": 10401645, "97.00 percentile latency (ns)": 10509902, "99.00 percentile latency (ns)": 15822954, "99.90 percentile latency (ns)": 45006282, "Max latency (ns)": 151492909, "Mean latency (ns)": 10000702, "Min duration satisfied": "Yes", "Min latency (ns)": 8760051, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 99.72, "QPS w/o loadgen overhead": 99.99, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 10.214761, "characteristics.90th_percentile_latency_ns": 10214761.0, "characteristics.90th_percentile_latency_s": 0.010214761, "characteristics.90th_percentile_latency_us": 10214.761, "characteristics.accuracy": 58.528, "characteristics.good": 29264, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-224-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.35-224-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_224_35.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 90.9091, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "39e4c17747e1a05c", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 21965984, "90.00 percentile latency (ns)": 22641562, "90th percentile latency (ns)": 22641562, "95.00 percentile latency (ns)": 22974334, "97.00 percentile latency (ns)": 26597594, "99.00 percentile latency (ns)": 52437351, "99.90 percentile latency (ns)": 136752654, "Max latency (ns)": 151250797, "Mean latency (ns)": 22923624, "Min duration satisfied": "Yes", "Min latency (ns)": 21027633, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 43.55, "QPS w/o loadgen overhead": 43.62, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 22.641562, "characteristics.90th_percentile_latency_ns": 22641562.0, "characteristics.90th_percentile_latency_s": 0.022641562, "characteristics.90th_percentile_latency_us": 22641.562, "characteristics.accuracy": 66.036, "characteristics.good": 33018, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-128-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-1.0-128-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_1.0_128.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 43.4783, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "82bc3096461cb5d9", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 95420062, "90.00 percentile latency (ns)": 98668026, "90th percentile latency (ns)": 98668026, "95.00 percentile latency (ns)": 117257676, "97.00 percentile latency (ns)": 120272644, "99.00 percentile latency (ns)": 124676952, "99.90 percentile latency (ns)": 249585139, "Max latency (ns)": 260516940, "Mean latency (ns)": 97737335, "Min duration satisfied": "Yes", "Min latency (ns)": 93680137, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 10.23, "QPS w/o loadgen overhead": 10.23, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 98.668026, "characteristics.90th_percentile_latency_ns": 98668026.0, "characteristics.90th_percentile_latency_s": 0.098668026, "characteristics.90th_percentile_latency_us": 98668.026, "characteristics.accuracy": 76.642, "characteristics.good": 38321, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite1-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "efficientnet-lite1-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite1.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 10.101, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "298578838c02e32e", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 18379194, "90.00 percentile latency (ns)": 19049235, "90th percentile latency (ns)": 19049235, "95.00 percentile latency (ns)": 19269281, "97.00 percentile latency (ns)": 19602645, "99.00 percentile latency (ns)": 46625847, "99.90 percentile latency (ns)": 82746696, "Max latency (ns)": 155697083, "Mean latency (ns)": 19019574, "Min duration satisfied": "Yes", "Min latency (ns)": 17569183, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 52.44, "QPS w/o loadgen overhead": 52.58, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 19.049235, "characteristics.90th_percentile_latency_ns": 19049235.0, "characteristics.90th_percentile_latency_s": 0.019049235, "characteristics.90th_percentile_latency_us": 19049.235, "characteristics.accuracy": 69.604, "characteristics.good": 34802, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-192-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-1.0-192-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_192_100.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 52.6316, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "df039a91e411593d", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 45935552, "90.00 percentile latency (ns)": 46474513, "90th percentile latency (ns)": 46474513, "95.00 percentile latency (ns)": 51214695, "97.00 percentile latency (ns)": 63174585, "99.00 percentile latency (ns)": 71406537, "99.90 percentile latency (ns)": 122483644, "Max latency (ns)": 135690018, "Mean latency (ns)": 47042807, "Min duration satisfied": "Yes", "Min latency (ns)": 44988500, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 21.25, "QPS w/o loadgen overhead": 21.26, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 46.474513, "characteristics.90th_percentile_latency_ns": 46474513.0, "characteristics.90th_percentile_latency_s": 0.046474513, "characteristics.90th_percentile_latency_us": 46474.513, "characteristics.accuracy": 69.262, "characteristics.good": 34631, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.75-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.75-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.75_224.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 20, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "a146b08d68991ccf", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 19981489, "90.00 percentile latency (ns)": 20466345, "90th percentile latency (ns)": 20466345, "95.00 percentile latency (ns)": 20751726, "97.00 percentile latency (ns)": 21154509, "99.00 percentile latency (ns)": 48718113, "99.90 percentile latency (ns)": 79722247, "Max latency (ns)": 149265924, "Mean latency (ns)": 20628925, "Min duration satisfied": "Yes", "Min latency (ns)": 19110480, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 48.35, "QPS w/o loadgen overhead": 48.48, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 20.466345, "characteristics.90th_percentile_latency_ns": 20466345.0, "characteristics.90th_percentile_latency_s": 0.020466345, "characteristics.90th_percentile_latency_us": 20466.345, "characteristics.accuracy": 68.734, "characteristics.good": 34367, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-224-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.75-224-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_224_75.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 47.619, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "92b6d28fcf6e494d", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 16432399, "90.00 percentile latency (ns)": 16714764, "90th percentile latency (ns)": 16714764, "95.00 percentile latency (ns)": 16914779, "97.00 percentile latency (ns)": 17295641, "99.00 percentile latency (ns)": 39525974, "99.90 percentile latency (ns)": 89558419, "Max latency (ns)": 112846419, "Mean latency (ns)": 16923876, "Min duration satisfied": "Yes", "Min latency (ns)": 15871949, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 59.01, "QPS w/o loadgen overhead": 59.09, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 16.714764, "characteristics.90th_percentile_latency_ns": 16714764.0, "characteristics.90th_percentile_latency_s": 0.016714764, "characteristics.90th_percentile_latency_us": 16714.764, "characteristics.accuracy": 63.33, "characteristics.good": 31665, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-small-minimalistic_224_1.0_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v3-small-minimalistic_224_1.0_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-small-minimalistic_224_1.0_float.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 58.8235, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "8dca4ed6b957808c", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 9557442, "90.00 percentile latency (ns)": 10106448, "90th percentile latency (ns)": 10106448, "95.00 percentile latency (ns)": 10241705, "97.00 percentile latency (ns)": 10371102, "99.00 percentile latency (ns)": 18982589, "99.90 percentile latency (ns)": 54680545, "Max latency (ns)": 91177085, "Mean latency (ns)": 9910146, "Min duration satisfied": "Yes", "Min latency (ns)": 8684363, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 100.51, "QPS w/o loadgen overhead": 100.91, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 10.106448, "characteristics.90th_percentile_latency_ns": 10106448.0, "characteristics.90th_percentile_latency_s": 0.010106448, "characteristics.90th_percentile_latency_us": 10106.448, "characteristics.accuracy": 57.918, "characteristics.good": 28959, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.5-128-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.5-128-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.5_128.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 100, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "f91f0714cda940b5", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 68427325, "90.00 percentile latency (ns)": 69552097, "90th percentile latency (ns)": 69552097, "95.00 percentile latency (ns)": 82122609, "97.00 percentile latency (ns)": 89516212, "99.00 percentile latency (ns)": 93838674, "99.90 percentile latency (ns)": 159916364, "Max latency (ns)": 176765064, "Mean latency (ns)": 69911091, "Min duration satisfied": "Yes", "Min latency (ns)": 66086986, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 14.3, "QPS w/o loadgen overhead": 14.3, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 69.552097, "characteristics.90th_percentile_latency_ns": 69552097.0, "characteristics.90th_percentile_latency_s": 0.069552097, "characteristics.90th_percentile_latency_us": 69552.097, "characteristics.accuracy": 71.676, "characteristics.good": 35838, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-1.0-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-1.0-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_1.0_224.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 14.0845, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "f8f8ca0870982b05", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 3070046, "90.00 percentile latency (ns)": 3559850, "90th percentile latency (ns)": 3559850, "95.00 percentile latency (ns)": 3698866, "97.00 percentile latency (ns)": 3780327, "99.00 percentile latency (ns)": 4052617, "99.90 percentile latency (ns)": 36065807, "Max latency (ns)": 111121191, "Mean latency (ns)": 3242272, "Min duration satisfied": "Yes", "Min latency (ns)": 2484448, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 305.12, "QPS w/o loadgen overhead": 308.43, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 3.55985, "characteristics.90th_percentile_latency_ns": 3559850.0, "characteristics.90th_percentile_latency_s": 0.00355985, "characteristics.90th_percentile_latency_us": 3559.85, "characteristics.accuracy": 43.468, "characteristics.good": 21734, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-96-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.35-96-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_96_35.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 250, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "890c9144cdb879f7", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 330079270, "90.00 percentile latency (ns)": 350427079, "90th percentile latency (ns)": 350427079, "95.00 percentile latency (ns)": 353426040, "97.00 percentile latency (ns)": 357431632, "99.00 percentile latency (ns)": 429357518, "99.90 percentile latency (ns)": 474229017, "Max latency (ns)": 482662101, "Mean latency (ns)": 336223383, "Min duration satisfied": "Yes", "Min latency (ns)": 326448781, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 2.97, "QPS w/o loadgen overhead": 2.97, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 350.427079, "characteristics.90th_percentile_latency_ns": 350427079.0, "characteristics.90th_percentile_latency_s": 0.350427079, "characteristics.90th_percentile_latency_us": 350427.079, "characteristics.accuracy": 80.676, "characteristics.good": 40338, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite4-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "efficientnet-lite4-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite4.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 2.92398, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "d84c1cf52925237c", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 18894790, "90.00 percentile latency (ns)": 19465112, "90th percentile latency (ns)": 19465112, "95.00 percentile latency (ns)": 19722347, "97.00 percentile latency (ns)": 20044822, "99.00 percentile latency (ns)": 47347197, "99.90 percentile latency (ns)": 80132253, "Max latency (ns)": 140914622, "Mean latency (ns)": 19533076, "Min duration satisfied": "Yes", "Min latency (ns)": 18179358, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 51.06, "QPS w/o loadgen overhead": 51.2, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 19.465112, "characteristics.90th_percentile_latency_ns": 19465112.0, "characteristics.90th_percentile_latency_s": 0.019465112, "characteristics.90th_percentile_latency_us": 19465.112, "characteristics.accuracy": 70.43, "characteristics.good": 35215, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-large-minimalistic_224_1.0_uint8", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v3-large-minimalistic_224_1.0_uint8", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-large-minimalistic_224_1.0_uint8.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 50, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "e9eeb0882c9a2626", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 15256829, "90.00 percentile latency (ns)": 15910566, "90th percentile latency (ns)": 15910566, "95.00 percentile latency (ns)": 16094666, "97.00 percentile latency (ns)": 16249330, "99.00 percentile latency (ns)": 42332926, "99.90 percentile latency (ns)": 87900753, "Max latency (ns)": 148539955, "Mean latency (ns)": 15835616, "Min duration satisfied": "Yes", "Min latency (ns)": 14397372, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 63.02, "QPS w/o loadgen overhead": 63.15, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 15.910566, "characteristics.90th_percentile_latency_ns": 15910566.0, "characteristics.90th_percentile_latency_s": 0.015910566, "characteristics.90th_percentile_latency_us": 15910.566, "characteristics.accuracy": 67.474, "characteristics.good": 33737, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-192-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.75-192-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_192_75.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 62.5, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "477ca0bbd1dafa82", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 13668701, "90.00 percentile latency (ns)": 14394435, "90th percentile latency (ns)": 14394435, "95.00 percentile latency (ns)": 14557471, "97.00 percentile latency (ns)": 14717121, "99.00 percentile latency (ns)": 35523322, "99.90 percentile latency (ns)": 63682258, "Max latency (ns)": 98666412, "Mean latency (ns)": 14233795, "Min duration satisfied": "Yes", "Min latency (ns)": 12960931, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 70.11, "QPS w/o loadgen overhead": 70.26, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 14.394435, "characteristics.90th_percentile_latency_ns": 14394435.0, "characteristics.90th_percentile_latency_s": 0.014394435, "characteristics.90th_percentile_latency_us": 14394.435, "characteristics.accuracy": 67.24, "characteristics.good": 33620, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.75-192-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.75-192-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.75_192_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 66.6667, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "e4e56bf4b77242d9", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 26168277, "90.00 percentile latency (ns)": 26620914, "90th percentile latency (ns)": 26620914, "95.00 percentile latency (ns)": 27045092, "97.00 percentile latency (ns)": 30618763, "99.00 percentile latency (ns)": 52579949, "99.90 percentile latency (ns)": 89425149, "Max latency (ns)": 103197620, "Mean latency (ns)": 26880241, "Min duration satisfied": "Yes", "Min latency (ns)": 25486157, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 37.17, "QPS w/o loadgen overhead": 37.2, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 26.620914, "characteristics.90th_percentile_latency_ns": 26620914.0, "characteristics.90th_percentile_latency_s": 0.026620914, "characteristics.90th_percentile_latency_us": 26620.914, "characteristics.accuracy": 64.348, "characteristics.good": 32174, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.5-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.5-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.5_224.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 35.7143, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "c3ad9e2e35e2b8b9", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 19227164, "90.00 percentile latency (ns)": 19637300, "90th percentile latency (ns)": 19637300, "95.00 percentile latency (ns)": 19874902, "97.00 percentile latency (ns)": 20611335, "99.00 percentile latency (ns)": 44813237, "99.90 percentile latency (ns)": 80380695, "Max latency (ns)": 108718551, "Mean latency (ns)": 19799138, "Min duration satisfied": "Yes", "Min latency (ns)": 18658056, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 50.43, "QPS w/o loadgen overhead": 50.51, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 19.6373, "characteristics.90th_percentile_latency_ns": 19637300.0, "characteristics.90th_percentile_latency_s": 0.0196373, "characteristics.90th_percentile_latency_us": 19637.3, "characteristics.accuracy": 63.246, "characteristics.good": 31623, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.5-192-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.5-192-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.5_192.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 47.619, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "c341ad3ad632434e", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 15245960, "90.00 percentile latency (ns)": 15653747, "90th percentile latency (ns)": 15653747, "95.00 percentile latency (ns)": 15992302, "97.00 percentile latency (ns)": 16236844, "99.00 percentile latency (ns)": 39295594, "99.90 percentile latency (ns)": 73318723, "Max latency (ns)": 138368876, "Mean latency (ns)": 15764963, "Min duration satisfied": "Yes", "Min latency (ns)": 14587256, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 63.34, "QPS w/o loadgen overhead": 63.43, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 15.653747, "characteristics.90th_percentile_latency_ns": 15653747.0, "characteristics.90th_percentile_latency_s": 0.015653747, "characteristics.90th_percentile_latency_us": 15653.747, "characteristics.accuracy": 61.668, "characteristics.good": 30834, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-160-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.5-160-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.5_160.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 62.5, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "4f648e79c5bc45c0", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 26042473, "90.00 percentile latency (ns)": 26499408, "90th percentile latency (ns)": 26499408, "95.00 percentile latency (ns)": 26980581, "97.00 percentile latency (ns)": 32779201, "99.00 percentile latency (ns)": 53528211, "99.90 percentile latency (ns)": 97700102, "Max latency (ns)": 112756157, "Mean latency (ns)": 26826970, "Min duration satisfied": "Yes", "Min latency (ns)": 24819924, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 37.25, "QPS w/o loadgen overhead": 37.28, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 26.499408, "characteristics.90th_percentile_latency_ns": 26499408.0, "characteristics.90th_percentile_latency_s": 0.026499408, "characteristics.90th_percentile_latency_us": 26499.408, "characteristics.accuracy": 66.384, "characteristics.good": 33192, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.75-160-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.75-160-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.75_160.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 34.4828, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "2086d8ad804154ba", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 3656164, "90.00 percentile latency (ns)": 4201463, "90th percentile latency (ns)": 4201463, "95.00 percentile latency (ns)": 4410809, "97.00 percentile latency (ns)": 4515673, "99.00 percentile latency (ns)": 4727734, "99.90 percentile latency (ns)": 36335888, "Max latency (ns)": 121167060, "Mean latency (ns)": 3854363, "Min duration satisfied": "Yes", "Min latency (ns)": 3065173, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 257.34, "QPS w/o loadgen overhead": 259.45, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 4.201463, "characteristics.90th_percentile_latency_ns": 4201463.0, "characteristics.90th_percentile_latency_s": 0.004201463, "characteristics.90th_percentile_latency_us": 4201.463, "characteristics.accuracy": 49.11, "characteristics.good": 24555, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-96-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.5-96-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_96_50.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 250, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "6356f9b3284c50b2", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 7844752, "90.00 percentile latency (ns)": 8443447, "90th percentile latency (ns)": 8443447, "95.00 percentile latency (ns)": 8545668, "97.00 percentile latency (ns)": 8648277, "99.00 percentile latency (ns)": 11244444, "99.90 percentile latency (ns)": 42064909, "Max latency (ns)": 139771299, "Mean latency (ns)": 8185469, "Min duration satisfied": "Yes", "Min latency (ns)": 7140973, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 121.77, "QPS w/o loadgen overhead": 122.17, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 8.443447, "characteristics.90th_percentile_latency_ns": 8443447.0, "characteristics.90th_percentile_latency_s": 0.008443447, "characteristics.90th_percentile_latency_us": 8443.447, "characteristics.accuracy": 62.07, "characteristics.good": 31035, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-128-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.75-128-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_128_75.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 111.111, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "18fbeab27fb4e7aa", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 15713543, "90.00 percentile latency (ns)": 16392021, "90th percentile latency (ns)": 16392021, "95.00 percentile latency (ns)": 16643609, "97.00 percentile latency (ns)": 17042405, "99.00 percentile latency (ns)": 37723399, "99.90 percentile latency (ns)": 81375224, "Max latency (ns)": 139775124, "Mean latency (ns)": 16305375, "Min duration satisfied": "Yes", "Min latency (ns)": 14690904, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 61.23, "QPS w/o loadgen overhead": 61.33, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 16.392021, "characteristics.90th_percentile_latency_ns": 16392021.0, "characteristics.90th_percentile_latency_s": 0.016392021, "characteristics.90th_percentile_latency_us": 16392.021, "characteristics.accuracy": 61.224, "characteristics.good": 30612, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-96-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-1.0-96-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_1.0_96.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 58.8235, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "ff31c6a4b3cae1bb", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 2152567, "90.00 percentile latency (ns)": 2850664, "90th percentile latency (ns)": 2850664, "95.00 percentile latency (ns)": 2952921, "97.00 percentile latency (ns)": 3047345, "99.00 percentile latency (ns)": 3228156, "99.90 percentile latency (ns)": 34381533, "Max latency (ns)": 81181014, "Mean latency (ns)": 2366757, "Min duration satisfied": "Yes", "Min latency (ns)": 1662725, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 416.57, "QPS w/o loadgen overhead": 422.52, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 2.850664, "characteristics.90th_percentile_latency_ns": 2850664.0, "characteristics.90th_percentile_latency_s": 0.002850664, "characteristics.90th_percentile_latency_us": 2850.664, "characteristics.accuracy": 42.384, "characteristics.good": 21192, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.25-128-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.25-128-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.25_128_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "459bf945ff70ff34", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 82086556, "90.00 percentile latency (ns)": 83343415, "90th percentile latency (ns)": 83343415, "95.00 percentile latency (ns)": 101159311, "97.00 percentile latency (ns)": 106704484, "99.00 percentile latency (ns)": 111438896, "99.90 percentile latency (ns)": 200731389, "Max latency (ns)": 226904541, "Mean latency (ns)": 84034952, "Min duration satisfied": "Yes", "Min latency (ns)": 80490824, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 11.9, "QPS w/o loadgen overhead": 11.9, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 83.343415, "characteristics.90th_percentile_latency_ns": 83343415.0, "characteristics.90th_percentile_latency_s": 0.083343415, "characteristics.90th_percentile_latency_us": 83343.415, "characteristics.accuracy": 75.012, "characteristics.good": 37506, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.3-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-1.3-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_1.3_224.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 11.6279, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "71a6343869e12f7a", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 10747063, "90.00 percentile latency (ns)": 11305860, "90th percentile latency (ns)": 11305860, "95.00 percentile latency (ns)": 11494677, "97.00 percentile latency (ns)": 11720615, "99.00 percentile latency (ns)": 23146178, "99.90 percentile latency (ns)": 43860714, "Max latency (ns)": 100204931, "Mean latency (ns)": 11096487, "Min duration satisfied": "Yes", "Min latency (ns)": 9900288, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 89.82, "QPS w/o loadgen overhead": 90.12, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 11.30586, "characteristics.90th_percentile_latency_ns": 11305860.0, "characteristics.90th_percentile_latency_s": 0.01130586, "characteristics.90th_percentile_latency_us": 11305.86, "characteristics.accuracy": 64.486, "characteristics.good": 32243, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-small_224_1.0_uint8", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v3-small_224_1.0_uint8", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-small_224_1.0_uint8.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 83.3333, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "674354e11b63290e", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 128071312, "90.00 percentile latency (ns)": 139293186, "90th percentile latency (ns)": 139293186, "95.00 percentile latency (ns)": 150048960, "97.00 percentile latency (ns)": 152106359, "99.00 percentile latency (ns)": 157359306, "99.90 percentile latency (ns)": 272677015, "Max latency (ns)": 284267384, "Mean latency (ns)": 130864251, "Min duration satisfied": "Yes", "Min latency (ns)": 126188867, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 7.64, "QPS w/o loadgen overhead": 7.64, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 139.293186, "characteristics.90th_percentile_latency_ns": 139293186.0, "characteristics.90th_percentile_latency_s": 0.139293186, "characteristics.90th_percentile_latency_us": 139293.186, "characteristics.accuracy": 77.542, "characteristics.good": 38771, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite2-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "efficientnet-lite2-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite2.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 7.35294, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "c442a3a80e828e01", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 4178899, "90.00 percentile latency (ns)": 4880912, "90th percentile latency (ns)": 4880912, "95.00 percentile latency (ns)": 5071806, "97.00 percentile latency (ns)": 5172673, "99.00 percentile latency (ns)": 5416338, "99.90 percentile latency (ns)": 37373800, "Max latency (ns)": 77531325, "Mean latency (ns)": 4448973, "Min duration satisfied": "Yes", "Min latency (ns)": 3767146, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 222.7, "QPS w/o loadgen overhead": 224.77, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 4.880912, "characteristics.90th_percentile_latency_ns": 4880912.0, "characteristics.90th_percentile_latency_s": 0.004880912, "characteristics.90th_percentile_latency_us": 4880.912, "characteristics.accuracy": 56.75, "characteristics.good": 28375, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.5-128-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.5-128-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.5_128_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 200, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "5948130d79346d3c", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 5400985, "90.00 percentile latency (ns)": 6066045, "90th percentile latency (ns)": 6066045, "95.00 percentile latency (ns)": 6195358, "97.00 percentile latency (ns)": 6266189, "99.00 percentile latency (ns)": 6645312, "99.90 percentile latency (ns)": 38567047, "Max latency (ns)": 130290540, "Mean latency (ns)": 5692032, "Min duration satisfied": "Yes", "Min latency (ns)": 4859292, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 174.31, "QPS w/o loadgen overhead": 175.68, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 6.066045, "characteristics.90th_percentile_latency_ns": 6066045.0, "characteristics.90th_percentile_latency_s": 0.006066045, "characteristics.90th_percentile_latency_us": 6066.045, "characteristics.accuracy": 57.002, "characteristics.good": 28501, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-96-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.75-96-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_96_75.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 166.667, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "b4cae9056a1ec29a", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 88732418, "90.00 percentile latency (ns)": 90014897, "90th percentile latency (ns)": 90014897, "95.00 percentile latency (ns)": 112182507, "97.00 percentile latency (ns)": 114949333, "99.00 percentile latency (ns)": 118762262, "99.90 percentile latency (ns)": 216066724, "Max latency (ns)": 237982198, "Mean latency (ns)": 90949848, "Min duration satisfied": "Yes", "Min latency (ns)": 86974488, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 10.99, "QPS w/o loadgen overhead": 11.0, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 90.014897, "characteristics.90th_percentile_latency_ns": 90014897.0, "characteristics.90th_percentile_latency_s": 0.090014897, "characteristics.90th_percentile_latency_us": 90014.897, "characteristics.accuracy": 75.69, "characteristics.good": 37845, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.4-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-1.4-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_1.4_224.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 10.6383, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "83e7088b6d4f35b3", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 6900583, "90.00 percentile latency (ns)": 7654810, "90th percentile latency (ns)": 7654810, "95.00 percentile latency (ns)": 7836954, "97.00 percentile latency (ns)": 7972060, "99.00 percentile latency (ns)": 10098180, "99.90 percentile latency (ns)": 41416479, "Max latency (ns)": 119594786, "Mean latency (ns)": 7220589, "Min duration satisfied": "Yes", "Min latency (ns)": 6193453, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 137.64, "QPS w/o loadgen overhead": 138.49, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 7.65481, "characteristics.90th_percentile_latency_ns": 7654810.0, "characteristics.90th_percentile_latency_s": 0.00765481, "characteristics.90th_percentile_latency_us": 7654.81, "characteristics.accuracy": 52.446, "characteristics.good": 26223, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-96-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.5-96-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.5_96.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 125, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "783a8dda571f24b6", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 40034075, "90.00 percentile latency (ns)": 40643336, "90th percentile latency (ns)": 40643336, "95.00 percentile latency (ns)": 42310806, "97.00 percentile latency (ns)": 55493518, "99.00 percentile latency (ns)": 68292713, "99.90 percentile latency (ns)": 144549753, "Max latency (ns)": 177165584, "Mean latency (ns)": 41130886, "Min duration satisfied": "Yes", "Min latency (ns)": 39399309, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 24.3, "QPS w/o loadgen overhead": 24.31, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 40.643336, "characteristics.90th_percentile_latency_ns": 40643336.0, "characteristics.90th_percentile_latency_s": 0.040643336, "characteristics.90th_percentile_latency_us": 40643.336, "characteristics.accuracy": 73.724, "characteristics.good": 36862, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-large_224_0.75_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v3-large_224_0.75_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-large_224_0.75_float.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 22.7273, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "450f9724f4f7e9be", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 30109897, "90.00 percentile latency (ns)": 30776339, "90th percentile latency (ns)": 30776339, "95.00 percentile latency (ns)": 31468039, "97.00 percentile latency (ns)": 40356827, "99.00 percentile latency (ns)": 58559720, "99.90 percentile latency (ns)": 102258722, "Max latency (ns)": 117605580, "Mean latency (ns)": 31036026, "Min duration satisfied": "Yes", "Min latency (ns)": 29034062, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 32.19, "QPS w/o loadgen overhead": 32.22, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 30.776339, "characteristics.90th_percentile_latency_ns": 30776339.0, "characteristics.90th_percentile_latency_s": 0.030776339, "characteristics.90th_percentile_latency_us": 30776.339, "characteristics.accuracy": 66.604, "characteristics.good": 33302, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-1.0-128-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-1.0-128-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_1.0_128.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 30.303, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "cf6eb74376b80cfb", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 41161187, "90.00 percentile latency (ns)": 42135232, "90th percentile latency (ns)": 42135232, "95.00 percentile latency (ns)": 46264747, "97.00 percentile latency (ns)": 55361231, "99.00 percentile latency (ns)": 66380324, "99.90 percentile latency (ns)": 117010824, "Max latency (ns)": 135704927, "Mean latency (ns)": 42208715, "Min duration satisfied": "Yes", "Min latency (ns)": 39866641, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 23.68, "QPS w/o loadgen overhead": 23.69, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 42.135232, "characteristics.90th_percentile_latency_ns": 42135232.0, "characteristics.90th_percentile_latency_s": 0.042135232, "characteristics.90th_percentile_latency_us": 42135.232, "characteristics.accuracy": 69.106, "characteristics.good": 34553, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-1.0-160-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-1.0-160-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_1.0_160.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 23.2558, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "14f92909243d6914", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 11111142, "90.00 percentile latency (ns)": 11740089, "90th percentile latency (ns)": 11740089, "95.00 percentile latency (ns)": 11950656, "97.00 percentile latency (ns)": 12156816, "99.00 percentile latency (ns)": 25403378, "99.90 percentile latency (ns)": 49829056, "Max latency (ns)": 133821685, "Mean latency (ns)": 11576414, "Min duration satisfied": "Yes", "Min latency (ns)": 10265987, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 86.12, "QPS w/o loadgen overhead": 86.38, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 11.740089, "characteristics.90th_percentile_latency_ns": 11740089.0, "characteristics.90th_percentile_latency_s": 0.011740089, "characteristics.90th_percentile_latency_us": 11740.089, "characteristics.accuracy": 59.822, "characteristics.good": 29911, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-96-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.75-96-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.75_96.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 83.3333, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "b4a299ec2a1a19f5", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 20071378, "90.00 percentile latency (ns)": 20476027, "90th percentile latency (ns)": 20476027, "95.00 percentile latency (ns)": 20750456, "97.00 percentile latency (ns)": 22005336, "99.00 percentile latency (ns)": 47274006, "99.90 percentile latency (ns)": 98665285, "Max latency (ns)": 112908053, "Mean latency (ns)": 20681404, "Min duration satisfied": "Yes", "Min latency (ns)": 19354186, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 48.29, "QPS w/o loadgen overhead": 48.35, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 20.476027, "characteristics.90th_percentile_latency_ns": 20476027.0, "characteristics.90th_percentile_latency_s": 0.020476027, "characteristics.90th_percentile_latency_us": 20476.027, "characteristics.accuracy": 68.336, "characteristics.good": 34168, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-small_224_1.0_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v3-small_224_1.0_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-small_224_1.0_float.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 45.4545, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "684b07e9cf99df0d", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 33028614, "90.00 percentile latency (ns)": 33421635, "90th percentile latency (ns)": 33421635, "95.00 percentile latency (ns)": 34216803, "97.00 percentile latency (ns)": 43834235, "99.00 percentile latency (ns)": 60609376, "99.90 percentile latency (ns)": 131377652, "Max latency (ns)": 161012980, "Mean latency (ns)": 33962779, "Min duration satisfied": "Yes", "Min latency (ns)": 32468713, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 29.42, "QPS w/o loadgen overhead": 29.44, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 33.421635, "characteristics.90th_percentile_latency_ns": 33421635.0, "characteristics.90th_percentile_latency_s": 0.033421635, "characteristics.90th_percentile_latency_us": 33421.635, "characteristics.accuracy": 68.834, "characteristics.good": 34417, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-192-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.75-192-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.75_192.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 27.7778, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "1be4d06942ffaaf4", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 31451829, "90.00 percentile latency (ns)": 32083738, "90th percentile latency (ns)": 32083738, "95.00 percentile latency (ns)": 32430373, "97.00 percentile latency (ns)": 41180554, "99.00 percentile latency (ns)": 60013656, "99.90 percentile latency (ns)": 112404293, "Max latency (ns)": 161733637, "Mean latency (ns)": 32383627, "Min duration satisfied": "Yes", "Min latency (ns)": 30615635, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 30.85, "QPS w/o loadgen overhead": 30.88, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 32.083738, "characteristics.90th_percentile_latency_ns": 32083738.0, "characteristics.90th_percentile_latency_s": 0.032083738, "characteristics.90th_percentile_latency_us": 32083.738, "characteristics.accuracy": 71.19, "characteristics.good": 35595, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite0-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "efficientnet-lite0-quantized", "input_data_types": "uint8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite0.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 29.4118, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "cb1af61046af9ecd", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 192227408, "90.00 percentile latency (ns)": 211456137, "90th percentile latency (ns)": 211456137, "95.00 percentile latency (ns)": 215048742, "97.00 percentile latency (ns)": 217075044, "99.00 percentile latency (ns)": 237112187, "99.90 percentile latency (ns)": 333504941, "Max latency (ns)": 343034144, "Mean latency (ns)": 196175451, "Min duration satisfied": "Yes", "Min latency (ns)": 190174694, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 5.1, "QPS w/o loadgen overhead": 5.1, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 211.456137, "characteristics.90th_percentile_latency_ns": 211456137.0, "characteristics.90th_percentile_latency_s": 0.211456137, "characteristics.90th_percentile_latency_us": 211456.137, "characteristics.accuracy": 79.268, "characteristics.good": 39634, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite3-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "efficientnet-lite3-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite3.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 4.92611, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "744afb98c309f0bb", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 17684190, "90.00 percentile latency (ns)": 17964205, "90th percentile latency (ns)": 17964205, "95.00 percentile latency (ns)": 18214430, "97.00 percentile latency (ns)": 18624223, "99.00 percentile latency (ns)": 42920960, "99.90 percentile latency (ns)": 94354312, "Max latency (ns)": 115229144, "Mean latency (ns)": 18200962, "Min duration satisfied": "Yes", "Min latency (ns)": 17052978, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 54.87, "QPS w/o loadgen overhead": 54.94, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 17.964205, "characteristics.90th_percentile_latency_ns": 17964205.0, "characteristics.90th_percentile_latency_s": 0.017964205, "characteristics.90th_percentile_latency_us": 17964.205, "characteristics.accuracy": 66.216, "characteristics.good": 33108, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-small_224_0.75_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v3-small_224_0.75_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-small_224_0.75_float.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 52.6316, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "0144dc9b4f4c9a87", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 95513637, "90.00 percentile latency (ns)": 97845640, "90th percentile latency (ns)": 97845640, "95.00 percentile latency (ns)": 118102153, "97.00 percentile latency (ns)": 120115314, "99.00 percentile latency (ns)": 124181094, "99.90 percentile latency (ns)": 235837196, "Max latency (ns)": 272873641, "Mean latency (ns)": 97798288, "Min duration satisfied": "Yes", "Min latency (ns)": 93930555, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 10.22, "QPS w/o loadgen overhead": 10.23, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 97.84564, "characteristics.90th_percentile_latency_ns": 97845640.0, "characteristics.90th_percentile_latency_s": 0.09784564, "characteristics.90th_percentile_latency_us": 97845.64, "characteristics.accuracy": 76.344, "characteristics.good": 38172, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite3-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "efficientnet-lite3-quantized", "input_data_types": "uint8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite3.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 9.90099, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "4f2f8fc9018e430e", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 5645941, "90.00 percentile latency (ns)": 6294034, "90th percentile latency (ns)": 6294034, "95.00 percentile latency (ns)": 6466004, "97.00 percentile latency (ns)": 6546258, "99.00 percentile latency (ns)": 6939588, "99.90 percentile latency (ns)": 39441827, "Max latency (ns)": 121397203, "Mean latency (ns)": 5931408, "Min duration satisfied": "Yes", "Min latency (ns)": 5063384, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 167.31, "QPS w/o loadgen overhead": 168.59, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 6.294034, "characteristics.90th_percentile_latency_ns": 6294034.0, "characteristics.90th_percentile_latency_s": 0.006294034, "characteristics.90th_percentile_latency_us": 6294.034, "characteristics.accuracy": 54.568, "characteristics.good": 27284, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-160-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.35-160-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_160_35.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 166.667, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "9322237ba0a4534b", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 9622225, "90.00 percentile latency (ns)": 9879571, "90th percentile latency (ns)": 9879571, "95.00 percentile latency (ns)": 10020752, "97.00 percentile latency (ns)": 10214766, "99.00 percentile latency (ns)": 26496282, "99.90 percentile latency (ns)": 68882699, "Max latency (ns)": 82792572, "Mean latency (ns)": 10054290, "Min duration satisfied": "Yes", "Min latency (ns)": 9172751, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 99.27, "QPS w/o loadgen overhead": 99.46, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 9.879571, "characteristics.90th_percentile_latency_ns": 9879571.0, "characteristics.90th_percentile_latency_s": 0.009879571, "characteristics.90th_percentile_latency_us": 9879.571, "characteristics.accuracy": 49.478, "characteristics.good": 24739, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.25-192-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.25-192-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.25_192.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 90.9091, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "9644ea0400e81997", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 18572484, "90.00 percentile latency (ns)": 19252682, "90th percentile latency (ns)": 19252682, "95.00 percentile latency (ns)": 19560003, "97.00 percentile latency (ns)": 20086015, "99.00 percentile latency (ns)": 44814149, "99.90 percentile latency (ns)": 85487903, "Max latency (ns)": 111258196, "Mean latency (ns)": 19222600, "Min duration satisfied": "Yes", "Min latency (ns)": 17786896, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 51.9, "QPS w/o loadgen overhead": 52.02, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 19.252682, "characteristics.90th_percentile_latency_ns": 19252682.0, "characteristics.90th_percentile_latency_s": 0.019252682, "characteristics.90th_percentile_latency_us": 19252.682, "characteristics.accuracy": 68.126, "characteristics.good": 34063, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.75-224-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.75-224-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.75_224_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 50, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "48629b937b48a588", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 52115418, "90.00 percentile latency (ns)": 52623891, "90th percentile latency (ns)": 52623891, "95.00 percentile latency (ns)": 59713531, "97.00 percentile latency (ns)": 74872415, "99.00 percentile latency (ns)": 80939794, "99.90 percentile latency (ns)": 161925628, "Max latency (ns)": 175032423, "Mean latency (ns)": 53488101, "Min duration satisfied": "Yes", "Min latency (ns)": 51156747, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 18.69, "QPS w/o loadgen overhead": 18.7, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 52.623891, "characteristics.90th_percentile_latency_ns": 52623891.0, "characteristics.90th_percentile_latency_s": 0.052623891, "characteristics.90th_percentile_latency_us": 52623.891, "characteristics.accuracy": 75.76, "characteristics.good": 37880, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-large_224_1.0_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v3-large_224_1.0_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-large_224_1.0_float.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 18.8679, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "626ac64932b89cb9", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 27521512, "90.00 percentile latency (ns)": 27926061, "90th percentile latency (ns)": 27926061, "95.00 percentile latency (ns)": 28374246, "97.00 percentile latency (ns)": 30554156, "99.00 percentile latency (ns)": 55295500, "99.90 percentile latency (ns)": 123514129, "Max latency (ns)": 147412670, "Mean latency (ns)": 28351997, "Min duration satisfied": "Yes", "Min latency (ns)": 26996248, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 35.25, "QPS w/o loadgen overhead": 35.27, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 27.926061, "characteristics.90th_percentile_latency_ns": 27926061.0, "characteristics.90th_percentile_latency_s": 0.027926061, "characteristics.90th_percentile_latency_us": 27926.061, "characteristics.accuracy": 65.75, "characteristics.good": 32875, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.5-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.5_224.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 33.3333, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "b64ffc9826de0189", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 10706553, "90.00 percentile latency (ns)": 11322450, "90th percentile latency (ns)": 11322450, "95.00 percentile latency (ns)": 11466316, "97.00 percentile latency (ns)": 11606829, "99.00 percentile latency (ns)": 24456432, "99.90 percentile latency (ns)": 52585934, "Max latency (ns)": 96069165, "Mean latency (ns)": 11094303, "Min duration satisfied": "Yes", "Min latency (ns)": 9988121, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 89.83, "QPS w/o loadgen overhead": 90.14, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 11.32245, "characteristics.90th_percentile_latency_ns": 11322450.0, "characteristics.90th_percentile_latency_s": 0.01132245, "characteristics.90th_percentile_latency_us": 11322.45, "characteristics.accuracy": 64.768, "characteristics.good": 32384, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-1.0-128-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-1.0-128-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_1.0_128_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 83.3333, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "9d7ba44dd52b1175", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 43749182, "90.00 percentile latency (ns)": 44326201, "90th percentile latency (ns)": 44326201, "95.00 percentile latency (ns)": 47045334, "97.00 percentile latency (ns)": 61259847, "99.00 percentile latency (ns)": 73714323, "99.90 percentile latency (ns)": 149084630, "Max latency (ns)": 180312079, "Mean latency (ns)": 44957628, "Min duration satisfied": "Yes", "Min latency (ns)": 43010994, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 22.23, "QPS w/o loadgen overhead": 22.24, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 44.326201, "characteristics.90th_percentile_latency_ns": 44326201.0, "characteristics.90th_percentile_latency_s": 0.044326201, "characteristics.90th_percentile_latency_us": 44326.201, "characteristics.accuracy": 70.122, "characteristics.good": 35061, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.75-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.75_224.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 20.8333, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "b44623a51b6e5152", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 10393800, "90.00 percentile latency (ns)": 11075466, "90th percentile latency (ns)": 11075466, "95.00 percentile latency (ns)": 11295614, "97.00 percentile latency (ns)": 11416016, "99.00 percentile latency (ns)": 22653234, "99.90 percentile latency (ns)": 52824850, "Max latency (ns)": 88912672, "Mean latency (ns)": 10804600, "Min duration satisfied": "Yes", "Min latency (ns)": 9706848, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 92.31, "QPS w/o loadgen overhead": 92.55, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 11.075466, "characteristics.90th_percentile_latency_ns": 11075466.0, "characteristics.90th_percentile_latency_s": 0.011075466, "characteristics.90th_percentile_latency_us": 11075.466, "characteristics.accuracy": 64.08, "characteristics.good": 32040, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.75-160-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.75-160-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.75_160_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 83.3333, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "fa9975b9d4e0e8f6", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 20547761, "90.00 percentile latency (ns)": 20855041, "90th percentile latency (ns)": 20855041, "95.00 percentile latency (ns)": 21052314, "97.00 percentile latency (ns)": 21662074, "99.00 percentile latency (ns)": 49719195, "99.90 percentile latency (ns)": 96935021, "Max latency (ns)": 160271968, "Mean latency (ns)": 21189448, "Min duration satisfied": "Yes", "Min latency (ns)": 19968947, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 47.14, "QPS w/o loadgen overhead": 47.19, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 20.855041, "characteristics.90th_percentile_latency_ns": 20855041.0, "characteristics.90th_percentile_latency_s": 0.020855041, "characteristics.90th_percentile_latency_us": 20855.041, "characteristics.accuracy": 64.282, "characteristics.good": 32141, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-192-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.5-192-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.5_192.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 45.4545, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "f08098f20cd5ccdc", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 41816715, "90.00 percentile latency (ns)": 42298497, "90th percentile latency (ns)": 42298497, "95.00 percentile latency (ns)": 44406956, "97.00 percentile latency (ns)": 60291571, "99.00 percentile latency (ns)": 72287741, "99.90 percentile latency (ns)": 147313691, "Max latency (ns)": 183488709, "Mean latency (ns)": 42992537, "Min duration satisfied": "Yes", "Min latency (ns)": 41057294, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 23.25, "QPS w/o loadgen overhead": 23.26, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 42.298497, "characteristics.90th_percentile_latency_ns": 42298497.0, "characteristics.90th_percentile_latency_s": 0.042298497, "characteristics.90th_percentile_latency_us": 42298.497, "characteristics.accuracy": 72.678, "characteristics.good": 36339, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-large-minimalistic_224_1.0_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v3-large-minimalistic_224_1.0_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-large-minimalistic_224_1.0_float.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 22.2222, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "4af43d18f6d045a9", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 11597588, "90.00 percentile latency (ns)": 12210520, "90th percentile latency (ns)": 12210520, "95.00 percentile latency (ns)": 12436729, "97.00 percentile latency (ns)": 12548845, "99.00 percentile latency (ns)": 28002087, "99.90 percentile latency (ns)": 49344680, "Max latency (ns)": 133243274, "Mean latency (ns)": 11995013, "Min duration satisfied": "Yes", "Min latency (ns)": 10723619, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 83.17, "QPS w/o loadgen overhead": 83.37, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 12.21052, "characteristics.90th_percentile_latency_ns": 12210520.0, "characteristics.90th_percentile_latency_s": 0.01221052, "characteristics.90th_percentile_latency_us": 12210.52, "characteristics.accuracy": 64.972, "characteristics.good": 32486, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-160-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.75-160-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_160_75.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 83.3333, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "54487faa644d7e88", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 55572980, "90.00 percentile latency (ns)": 56202380, "90th percentile latency (ns)": 56202380, "95.00 percentile latency (ns)": 66237486, "97.00 percentile latency (ns)": 80544763, "99.00 percentile latency (ns)": 85679996, "99.90 percentile latency (ns)": 167039778, "Max latency (ns)": 188782830, "Mean latency (ns)": 57094492, "Min duration satisfied": "Yes", "Min latency (ns)": 54471640, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 17.51, "QPS w/o loadgen overhead": 17.51, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 56.20238, "characteristics.90th_percentile_latency_ns": 56202380.0, "characteristics.90th_percentile_latency_s": 0.05620238, "characteristics.90th_percentile_latency_us": 56202.38, "characteristics.accuracy": 71.77, "characteristics.good": 35885, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-1.0-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_1.0_224.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 16.9492, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "3883d2701f7a78b2", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 24482948, "90.00 percentile latency (ns)": 24856321, "90th percentile latency (ns)": 24856321, "95.00 percentile latency (ns)": 25279330, "97.00 percentile latency (ns)": 28023364, "99.00 percentile latency (ns)": 52943666, "99.90 percentile latency (ns)": 110063298, "Max latency (ns)": 156256434, "Mean latency (ns)": 25214687, "Min duration satisfied": "Yes", "Min latency (ns)": 23646478, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 39.63, "QPS w/o loadgen overhead": 39.66, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 24.856321, "characteristics.90th_percentile_latency_ns": 24856321.0, "characteristics.90th_percentile_latency_s": 0.024856321, "characteristics.90th_percentile_latency_us": 24856.321, "characteristics.accuracy": 66.75, "characteristics.good": 33375, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-160-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.75-160-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.75_160.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 38.4615, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "7a886c9f99d537e7", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 5654583, "90.00 percentile latency (ns)": 6291792, "90th percentile latency (ns)": 6291792, "95.00 percentile latency (ns)": 6442048, "97.00 percentile latency (ns)": 6571007, "99.00 percentile latency (ns)": 7630004, "99.90 percentile latency (ns)": 39619779, "Max latency (ns)": 121039902, "Mean latency (ns)": 5932313, "Min duration satisfied": "Yes", "Min latency (ns)": 5152261, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 167.29, "QPS w/o loadgen overhead": 168.57, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 6.291792, "characteristics.90th_percentile_latency_ns": 6291792.0, "characteristics.90th_percentile_latency_s": 0.006291792, "characteristics.90th_percentile_latency_us": 6291.792, "characteristics.accuracy": 47.14, "characteristics.good": 23570, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-96-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.35-96-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.35_96.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 166.667, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "f9da54880abab7dc", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 11834592, "90.00 percentile latency (ns)": 12196489, "90th percentile latency (ns)": 12196489, "95.00 percentile latency (ns)": 12454343, "97.00 percentile latency (ns)": 12725329, "99.00 percentile latency (ns)": 27823745, "99.90 percentile latency (ns)": 50016437, "Max latency (ns)": 142495947, "Mean latency (ns)": 12257433, "Min duration satisfied": "Yes", "Min latency (ns)": 11154554, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 81.43, "QPS w/o loadgen overhead": 81.58, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 12.196489, "characteristics.90th_percentile_latency_ns": 12196489.0, "characteristics.90th_percentile_latency_s": 0.012196489, "characteristics.90th_percentile_latency_us": 12196.489, "characteristics.accuracy": 56.988, "characteristics.good": 28494, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-160-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.35-160-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.35_160.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 76.9231, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "7d476e95f7252551", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 18104919, "90.00 percentile latency (ns)": 18777635, "90th percentile latency (ns)": 18777635, "95.00 percentile latency (ns)": 19042974, "97.00 percentile latency (ns)": 20009230, "99.00 percentile latency (ns)": 44162000, "99.90 percentile latency (ns)": 79089605, "Max latency (ns)": 97511620, "Mean latency (ns)": 18738861, "Min duration satisfied": "Yes", "Min latency (ns)": 17204076, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 53.22, "QPS w/o loadgen overhead": 53.37, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 18.777635, "characteristics.90th_percentile_latency_ns": 18777635.0, "characteristics.90th_percentile_latency_s": 0.018777635, "characteristics.90th_percentile_latency_us": 18777.635, "characteristics.accuracy": 63.716, "characteristics.good": 31858, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.75-128-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.75-128-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.75_128.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 47.619, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "3dac429699c96159", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 5175158, "90.00 percentile latency (ns)": 5782868, "90th percentile latency (ns)": 5782868, "95.00 percentile latency (ns)": 5997715, "97.00 percentile latency (ns)": 6112567, "99.00 percentile latency (ns)": 6439097, "99.90 percentile latency (ns)": 38650917, "Max latency (ns)": 115610075, "Mean latency (ns)": 5444768, "Min duration satisfied": "Yes", "Min latency (ns)": 4635668, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 182.46, "QPS w/o loadgen overhead": 183.66, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 5.782868, "characteristics.90th_percentile_latency_ns": 5782868.0, "characteristics.90th_percentile_latency_s": 0.005782868, "characteristics.90th_percentile_latency_us": 5782.868, "characteristics.accuracy": 55.54, "characteristics.good": 27770, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-128-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.5-128-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_128_50.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 166.667, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "e1844bf85291da55", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 16638030, "90.00 percentile latency (ns)": 16981933, "90th percentile latency (ns)": 16981933, "95.00 percentile latency (ns)": 17238576, "97.00 percentile latency (ns)": 17535106, "99.00 percentile latency (ns)": 42544779, "99.90 percentile latency (ns)": 95881346, "Max latency (ns)": 148072032, "Mean latency (ns)": 17179475, "Min duration satisfied": "Yes", "Min latency (ns)": 16088412, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 58.13, "QPS w/o loadgen overhead": 58.21, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 16.981933, "characteristics.90th_percentile_latency_ns": 16981933.0, "characteristics.90th_percentile_latency_s": 0.016981933, "characteristics.90th_percentile_latency_us": 16981.933, "characteristics.accuracy": 59.322, "characteristics.good": 29661, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-192-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.35-192-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.35_192.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 58.8235, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "a84583a5f592bbd4", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 407943838, "90.00 percentile latency (ns)": 492011821, "90th percentile latency (ns)": 492011821, "95.00 percentile latency (ns)": 517999290, "97.00 percentile latency (ns)": 526708070, "99.00 percentile latency (ns)": 542772414, "99.90 percentile latency (ns)": 561651309, "Max latency (ns)": 567638809, "Mean latency (ns)": 401206749, "Min duration satisfied": "Yes", "Min latency (ns)": 309164543, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 2.49, "QPS w/o loadgen overhead": 2.49, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 492.011821, "characteristics.90th_percentile_latency_ns": 492011821.0, "characteristics.90th_percentile_latency_s": 0.492011821, "characteristics.90th_percentile_latency_us": 492011.821, "characteristics.accuracy": 76.442, "characteristics.good": 38221, "characteristics.power": 3.138292181235072, "characteristics.power.normalized_per_core": 0.392286522654384, "characteristics.power.normalized_per_processor": 3.138292181235072, "characteristics.total": 50000, "ck_system": "xavier-power.2-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "closed", "formal_model": "resnet50-v1.5", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MODE_15W", "informal_model": "resnet50", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/closed/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/closed/Krai/results/xavier-power.2-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://www.dropbox.com/s/vhuqo0wc39lky0a/resnet50_v1.no-argmax.tflite", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.2-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 12.5, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "9761ed9449aa1b6e", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TF -> TFLite" }, { "50.00 percentile latency (ns)": 81749329, "90.00 percentile latency (ns)": 86848938, "90th percentile latency (ns)": 86848938, "95.00 percentile latency (ns)": 90958179, "97.00 percentile latency (ns)": 95179347, "99.00 percentile latency (ns)": 101553741, "99.90 percentile latency (ns)": 168817721, "Max latency (ns)": 228939300, "Mean latency (ns)": 81525886, "Min duration satisfied": "Yes", "Min latency (ns)": 73707718, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 12.26, "QPS w/o loadgen overhead": 12.27, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 86.848938, "characteristics.90th_percentile_latency_ns": 86848938.0, "characteristics.90th_percentile_latency_s": 0.086848938, "characteristics.90th_percentile_latency_us": 86848.938, "characteristics.accuracy": 76.442, "characteristics.good": 38221, "characteristics.power": 2.2692211502651807, "characteristics.power.normalized_per_core": 0.2836526437831476, "characteristics.power.normalized_per_processor": 2.2692211502651807, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "closed", "formal_model": "resnet50-v1.5", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "resnet50", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/closed/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/closed/Krai/results/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://www.dropbox.com/s/vhuqo0wc39lky0a/resnet50_v1.no-argmax.tflite", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 12.5, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "42ec8a7f4e01dc49", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TF -> TFLite" }, { "50.00 percentile latency (ns)": 157467016, "90.00 percentile latency (ns)": 251867040, "90th percentile latency (ns)": 251867040, "95.00 percentile latency (ns)": 256426334, "97.00 percentile latency (ns)": 259289467, "99.00 percentile latency (ns)": 267009722, "99.90 percentile latency (ns)": 276770992, "Max latency (ns)": 304786208, "Mean latency (ns)": 179884537, "Min duration satisfied": "Yes", "Min latency (ns)": 129398052, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 5.56, "QPS w/o loadgen overhead": 5.56, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 251.86704, "characteristics.90th_percentile_latency_ns": 251867040.0, "characteristics.90th_percentile_latency_s": 0.25186704, "characteristics.90th_percentile_latency_us": 251867.04, "characteristics.accuracy": 76.442, "characteristics.good": 38221, "characteristics.power": 1.5147797802841088, "characteristics.power.normalized_per_core": 0.1893474725355136, "characteristics.power.normalized_per_processor": 1.5147797802841088, "characteristics.total": 50000, "ck_system": "xavier-power.3-fan.cool-armnn-v21.05-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "closed", "formal_model": "resnet50-v1.5", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.05 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MODE_30W_ALL", "informal_model": "resnet50", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/closed/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/closed/Krai/results/xavier-power.3-fan.cool-armnn-v21.05-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://www.dropbox.com/s/vhuqo0wc39lky0a/resnet50_v1.no-argmax.tflite", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.3-fan.cool-armnn-v21.05-neon", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 3.33333, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "e9da4f6ab2373cf7", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TF -> TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 156584585, "90.00 percentile latency (ns)": 259068378, "90th percentile latency (ns)": 259068378, "95.00 percentile latency (ns)": 264106053, "97.00 percentile latency (ns)": 266863766, "99.00 percentile latency (ns)": 273830197, "99.90 percentile latency (ns)": 297270047, "Max latency (ns)": 321363778, "Mean latency (ns)": 182928268, "Min duration satisfied": "Yes", "Min latency (ns)": 138950099, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 5.46, "QPS w/o loadgen overhead": 5.47, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 259.068378, "characteristics.90th_percentile_latency_ns": 259068378.0, "characteristics.90th_percentile_latency_s": 0.259068378, "characteristics.90th_percentile_latency_us": 259068.378, "characteristics.accuracy": 76.442, "characteristics.good": 38221, "characteristics.power": 1.6230753794345656, "characteristics.power.normalized_per_core": 0.2028844224293207, "characteristics.power.normalized_per_processor": 1.6230753794345656, "characteristics.total": 50000, "ck_system": "xavier-power.4-fan.cool-armnn-v21.05-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "closed", "formal_model": "resnet50-v1.5", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.05 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MODE_30W_6CORE", "informal_model": "resnet50", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/closed/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/closed/Krai/results/xavier-power.4-fan.cool-armnn-v21.05-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://www.dropbox.com/s/vhuqo0wc39lky0a/resnet50_v1.no-argmax.tflite", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.4-fan.cool-armnn-v21.05-neon", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 3.33333, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "8d7042c584e136db", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TF -> TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 57554560, "90.00 percentile latency (ns)": 72084529, "90th percentile latency (ns)": 72084529, "95.00 percentile latency (ns)": 77972086, "97.00 percentile latency (ns)": 82334804, "99.00 percentile latency (ns)": 96149085, "99.90 percentile latency (ns)": 108694817, "Max latency (ns)": 117254487, "Mean latency (ns)": 60072796, "Min duration satisfied": "Yes", "Min latency (ns)": 50053064, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 16.64, "QPS w/o loadgen overhead": 16.65, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 72.084529, "characteristics.90th_percentile_latency_ns": 72084529.0, "characteristics.90th_percentile_latency_s": 0.072084529, "characteristics.90th_percentile_latency_us": 72084.529, "characteristics.accuracy": 76.442, "characteristics.good": 38221, "characteristics.power": 1.3344915474902863, "characteristics.power.normalized_per_core": 0.1668114434362858, "characteristics.power.normalized_per_processor": 1.3344915474902863, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.05-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "closed", "formal_model": "resnet50-v1.5", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.05 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "resnet50", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/closed/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/closed/Krai/results/xavier-power.0-fan.cool-armnn-v21.05-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://www.dropbox.com/s/vhuqo0wc39lky0a/resnet50_v1.no-argmax.tflite", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.05-neon", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 12.5, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "29cb3424da2ed5c4", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TF -> TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 152211465, "90.00 percentile latency (ns)": 212559896, "90th percentile latency (ns)": 212559896, "95.00 percentile latency (ns)": 219302600, "97.00 percentile latency (ns)": 222617713, "99.00 percentile latency (ns)": 230715347, "99.90 percentile latency (ns)": 245439769, "Max latency (ns)": 249286150, "Mean latency (ns)": 166880905, "Min duration satisfied": "Yes", "Min latency (ns)": 127849877, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 5.99, "QPS w/o loadgen overhead": 5.99, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 212.559896, "characteristics.90th_percentile_latency_ns": 212559896.0, "characteristics.90th_percentile_latency_s": 0.212559896, "characteristics.90th_percentile_latency_us": 212559.896, "characteristics.accuracy": 76.442, "characteristics.good": 38221, "characteristics.power": 1.6442958126585818, "characteristics.power.normalized_per_core": 0.20553697658232273, "characteristics.power.normalized_per_processor": 1.6442958126585818, "characteristics.total": 50000, "ck_system": "xavier-power.5-fan.cool-armnn-v21.05-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "closed", "formal_model": "resnet50-v1.5", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.05 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MODE_30W_4CORE", "informal_model": "resnet50", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/closed/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/closed/Krai/results/xavier-power.5-fan.cool-armnn-v21.05-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://www.dropbox.com/s/vhuqo0wc39lky0a/resnet50_v1.no-argmax.tflite", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.5-fan.cool-armnn-v21.05-neon", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 3.33333, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "4438401e8744f202", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TF -> TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 460391961, "90.00 percentile latency (ns)": 513365769, "90th percentile latency (ns)": 513365769, "95.00 percentile latency (ns)": 540086550, "97.00 percentile latency (ns)": 566083793, "99.00 percentile latency (ns)": 599433317, "99.90 percentile latency (ns)": 629419677, "Max latency (ns)": 636100157, "Mean latency (ns)": 468588937, "Min duration satisfied": "Yes", "Min latency (ns)": 410442585, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 2.13, "QPS w/o loadgen overhead": 2.13, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 513.365769, "characteristics.90th_percentile_latency_ns": 513365769.0, "characteristics.90th_percentile_latency_s": 0.513365769, "characteristics.90th_percentile_latency_us": 513365.769, "characteristics.accuracy": 76.442, "characteristics.good": 38221, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "closed", "formal_model": "resnet50-v1.5", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "resnet50", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/closed/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/closed/Krai/results/firefly-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://www.dropbox.com/s/vhuqo0wc39lky0a/resnet50_v1.no-argmax.tflite", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.5.0-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 2, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "e33fc45c5ab99214", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TF -> TFLite" }, { "50.00 percentile latency (ns)": 297026104, "90.00 percentile latency (ns)": 312576717, "90th percentile latency (ns)": 312576717, "95.00 percentile latency (ns)": 314930190, "97.00 percentile latency (ns)": 316858971, "99.00 percentile latency (ns)": 353617842, "99.90 percentile latency (ns)": 400217240, "Max latency (ns)": 409538342, "Mean latency (ns)": 301115888, "Min duration satisfied": "Yes", "Min latency (ns)": 292298589, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 3.32, "QPS w/o loadgen overhead": 3.32, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 312.576717, "characteristics.90th_percentile_latency_ns": 312576717.0, "characteristics.90th_percentile_latency_s": 0.312576717, "characteristics.90th_percentile_latency_us": 312576.717, "characteristics.accuracy": 76.442, "characteristics.good": 38221, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.off-armnn-v21.05-neon", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan off", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "closed", "formal_model": "resnet50-v1.5", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.05 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "resnet50", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/closed/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/closed/Krai/results/rpi4coral-fan.off-armnn-v21.05-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://www.dropbox.com/s/vhuqo0wc39lky0a/resnet50_v1.no-argmax.tflite", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.off-armnn-v21.05-neon", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 3.33333, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "16517d80da4c57a1", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TF -> TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 261222673, "90.00 percentile latency (ns)": 295216100, "90th percentile latency (ns)": 295216100, "95.00 percentile latency (ns)": 302924911, "97.00 percentile latency (ns)": 309871259, "99.00 percentile latency (ns)": 318383207, "99.90 percentile latency (ns)": 341641653, "Max latency (ns)": 371321129, "Mean latency (ns)": 253421870, "Min duration satisfied": "Yes", "Min latency (ns)": 205252846, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 3.95, "QPS w/o loadgen overhead": 3.95, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 295.2161, "characteristics.90th_percentile_latency_ns": 295216100.0, "characteristics.90th_percentile_latency_s": 0.2952161, "characteristics.90th_percentile_latency_us": 295216.1, "characteristics.accuracy": 76.442, "characteristics.good": 38221, "characteristics.power": 2.31252436746849, "characteristics.power.normalized_per_core": 0.28906554593356126, "characteristics.power.normalized_per_processor": 2.31252436746849, "characteristics.total": 50000, "ck_system": "xavier-power.4-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "closed", "formal_model": "resnet50-v1.5", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MODE_30W_6CORE", "informal_model": "resnet50", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/closed/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/closed/Krai/results/xavier-power.4-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://www.dropbox.com/s/vhuqo0wc39lky0a/resnet50_v1.no-argmax.tflite", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.4-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 3.33333, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "082a8530d5d0f52c", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TF -> TFLite" }, { "50.00 percentile latency (ns)": 536148159, "90.00 percentile latency (ns)": 552886733, "90th percentile latency (ns)": 552886733, "95.00 percentile latency (ns)": 557881108, "97.00 percentile latency (ns)": 573400901, "99.00 percentile latency (ns)": 652675954, "99.90 percentile latency (ns)": 797214609, "Max latency (ns)": 827329240, "Mean latency (ns)": 539672784, "Min duration satisfied": "Yes", "Min latency (ns)": 518672689, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 1.85, "QPS w/o loadgen overhead": 1.85, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 552.886733, "characteristics.90th_percentile_latency_ns": 552886733.0, "characteristics.90th_percentile_latency_s": 0.552886733, "characteristics.90th_percentile_latency_us": 552886.733, "characteristics.accuracy": 76.442, "characteristics.good": 38221, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.off-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan off", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "closed", "formal_model": "resnet50-v1.5", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "resnet50", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/closed/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/closed/Krai/results/rpi4coral-fan.off-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://www.dropbox.com/s/vhuqo0wc39lky0a/resnet50_v1.no-argmax.tflite", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.off-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 2, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "6b34c5a496185c90", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TF -> TFLite" }, { "50.00 percentile latency (ns)": 246667258, "90.00 percentile latency (ns)": 377539337, "90th percentile latency (ns)": 377539337, "95.00 percentile latency (ns)": 384879527, "97.00 percentile latency (ns)": 390054264, "99.00 percentile latency (ns)": 396472655, "99.90 percentile latency (ns)": 401502604, "Max latency (ns)": 403894558, "Mean latency (ns)": 278242763, "Min duration satisfied": "Yes", "Min latency (ns)": 205223095, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 3.59, "QPS w/o loadgen overhead": 3.59, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 377.539337, "characteristics.90th_percentile_latency_ns": 377539337.0, "characteristics.90th_percentile_latency_s": 0.377539337, "characteristics.90th_percentile_latency_us": 377539.337, "characteristics.accuracy": 76.442, "characteristics.good": 38221, "characteristics.power": 2.111835345838655, "characteristics.power.normalized_per_core": 0.2639794182298319, "characteristics.power.normalized_per_processor": 2.111835345838655, "characteristics.total": 50000, "ck_system": "xavier-power.2-fan.cool-armnn-v21.05-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "closed", "formal_model": "resnet50-v1.5", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.05 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MODE_15W", "informal_model": "resnet50", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/closed/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/closed/Krai/results/xavier-power.2-fan.cool-armnn-v21.05-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://www.dropbox.com/s/vhuqo0wc39lky0a/resnet50_v1.no-argmax.tflite", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.2-fan.cool-armnn-v21.05-neon", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 3.33333, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "54c308a2ef6a9c20", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TF -> TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 295843908, "90.00 percentile latency (ns)": 311639597, "90th percentile latency (ns)": 311639597, "95.00 percentile latency (ns)": 314241209, "97.00 percentile latency (ns)": 316654917, "99.00 percentile latency (ns)": 378801909, "99.90 percentile latency (ns)": 440793201, "Max latency (ns)": 440983308, "Mean latency (ns)": 300423447, "Min duration satisfied": "Yes", "Min latency (ns)": 291046324, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 3.33, "QPS w/o loadgen overhead": 3.33, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 311.639597, "characteristics.90th_percentile_latency_ns": 311639597.0, "characteristics.90th_percentile_latency_s": 0.311639597, "characteristics.90th_percentile_latency_us": 311639.597, "characteristics.accuracy": 76.442, "characteristics.good": 38221, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.05-neon", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "closed", "formal_model": "resnet50-v1.5", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.05 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "resnet50", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/closed/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/closed/Krai/results/rpi4coral-fan.on-armnn-v21.05-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://www.dropbox.com/s/vhuqo0wc39lky0a/resnet50_v1.no-argmax.tflite", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.05-neon", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 3.33333, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "f7efe0e377e4402b", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TF -> TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 232293726, "90.00 percentile latency (ns)": 300953697, "90th percentile latency (ns)": 300953697, "95.00 percentile latency (ns)": 315414475, "97.00 percentile latency (ns)": 321732839, "99.00 percentile latency (ns)": 336250947, "99.90 percentile latency (ns)": 359908564, "Max latency (ns)": 362011346, "Mean latency (ns)": 240223220, "Min duration satisfied": "Yes", "Min latency (ns)": 184048192, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 4.16, "QPS w/o loadgen overhead": 4.16, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 300.953697, "characteristics.90th_percentile_latency_ns": 300953697.0, "characteristics.90th_percentile_latency_s": 0.300953697, "characteristics.90th_percentile_latency_us": 300953.697, "characteristics.accuracy": 76.442, "characteristics.good": 38221, "characteristics.power": 2.3176000871528792, "characteristics.power.normalized_per_core": 0.2897000108941099, "characteristics.power.normalized_per_processor": 2.3176000871528792, "characteristics.total": 50000, "ck_system": "xavier-power.3-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "closed", "formal_model": "resnet50-v1.5", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MODE_30W_ALL", "informal_model": "resnet50", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/closed/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/closed/Krai/results/xavier-power.3-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://www.dropbox.com/s/vhuqo0wc39lky0a/resnet50_v1.no-argmax.tflite", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.3-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 3.33333, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "970334e3bac4d3ba", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TF -> TFLite" }, { "50.00 percentile latency (ns)": 522491675, "90.00 percentile latency (ns)": 537899368, "90th percentile latency (ns)": 537899368, "95.00 percentile latency (ns)": 541278241, "97.00 percentile latency (ns)": 544734426, "99.00 percentile latency (ns)": 565368105, "99.90 percentile latency (ns)": 647591910, "Max latency (ns)": 651126173, "Mean latency (ns)": 527419333, "Min duration satisfied": "Yes", "Min latency (ns)": 516095950, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 1.9, "QPS w/o loadgen overhead": 1.9, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 537.899368, "characteristics.90th_percentile_latency_ns": 537899368.0, "characteristics.90th_percentile_latency_s": 0.537899368, "characteristics.90th_percentile_latency_us": 537899.368, "characteristics.accuracy": 76.442, "characteristics.good": 38221, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "http://raspberrypiwiki.com/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "closed", "formal_model": "resnet50-v1.5", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "resnet50", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/closed/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/closed/Krai/results/rpi4coral-fan.on-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://www.dropbox.com/s/vhuqo0wc39lky0a/resnet50_v1.no-argmax.tflite", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.5.0-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 2, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "5b5381b2d8408486", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TF -> TFLite" }, { "50.00 percentile latency (ns)": 236424870, "90.00 percentile latency (ns)": 264464129, "90th percentile latency (ns)": 264464129, "95.00 percentile latency (ns)": 271275991, "97.00 percentile latency (ns)": 276331724, "99.00 percentile latency (ns)": 287053312, "99.90 percentile latency (ns)": 302183430, "Max latency (ns)": 303749442, "Mean latency (ns)": 231711676, "Min duration satisfied": "Yes", "Min latency (ns)": 196787152, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 4.31, "QPS w/o loadgen overhead": 4.32, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 264.464129, "characteristics.90th_percentile_latency_ns": 264464129.0, "characteristics.90th_percentile_latency_s": 0.264464129, "characteristics.90th_percentile_latency_us": 264464.129, "characteristics.accuracy": 76.442, "characteristics.good": 38221, "characteristics.power": 2.497844283543104, "characteristics.power.normalized_per_core": 0.312230535442888, "characteristics.power.normalized_per_processor": 2.497844283543104, "characteristics.total": 50000, "ck_system": "xavier-power.5-fan.cool-tflite-v2.5.0-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "closed", "formal_model": "resnet50-v1.5", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.5.0 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MODE_30W_4CORE", "informal_model": "resnet50", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.1, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.1/tree/master/closed/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.1/tree/master/closed/Krai/results/xavier-power.5-fan.cool-tflite-v2.5.0-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 1624344308455410291, "retraining": "no", "sample_index_rng_seed": 517984244576520566, "samples_per_query": 1, "schedule_rng_seed": 10051496985653635065, "starting_weights_filename": "https://www.dropbox.com/s/vhuqo0wc39lky0a/resnet50_v1.no-argmax.tflite", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.5", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.5-fan.cool-tflite-v2.5.0-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 3.33333, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "6a6b370c1da90ee7", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TF -> TFLite" }, { "50.00 percentile latency (ns)": 26927247, "90.00 percentile latency (ns)": 31318871, "90th percentile latency (ns)": 31318871, "95.00 percentile latency (ns)": 36899930, "97.00 percentile latency (ns)": 37587758, "99.00 percentile latency (ns)": 39058015, "99.90 percentile latency (ns)": 44301556, "Max latency (ns)": 51836597, "Mean latency (ns)": 27981780, "Min duration satisfied": "Yes", "Min latency (ns)": 26396996, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 35.72, "QPS w/o loadgen overhead": 35.74, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 31.318871, "characteristics.90th_percentile_latency_ns": 31318871.0, "characteristics.90th_percentile_latency_s": 0.031318871, "characteristics.90th_percentile_latency_us": 31318.871, "characteristics.accuracy": 68.242, "characteristics.good": 34121, "characteristics.power": 0.18592469617265733, "characteristics.power.normalized_per_core": 0.0015493724681054778, "characteristics.power.normalized_per_processor": 0.18592469617265733, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.75-192-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.75-192-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.75_192.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 32.2581, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "46d45aeb69da0bf1", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 37627723, "90.00 percentile latency (ns)": 46434374, "90th percentile latency (ns)": 46434374, "95.00 percentile latency (ns)": 52318768, "97.00 percentile latency (ns)": 53135478, "99.00 percentile latency (ns)": 55435496, "99.90 percentile latency (ns)": 61709697, "Max latency (ns)": 70013998, "Mean latency (ns)": 39312984, "Min duration satisfied": "Yes", "Min latency (ns)": 36530434, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 25.43, "QPS w/o loadgen overhead": 25.44, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 46.434374, "characteristics.90th_percentile_latency_ns": 46434374.0, "characteristics.90th_percentile_latency_s": 0.046434374, "characteristics.90th_percentile_latency_us": 46434.374, "characteristics.accuracy": 70.738, "characteristics.good": 35369, "characteristics.power": 0.24613309317151322, "characteristics.power.normalized_per_core": 0.00205110910976261, "characteristics.power.normalized_per_processor": 0.24613309317151322, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-192-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-1.0-192-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_1.0_192.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 22.7273, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "178d135c764b5188", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 498359029, "90.00 percentile latency (ns)": 516635786, "90th percentile latency (ns)": 516635786, "95.00 percentile latency (ns)": 564303750, "97.00 percentile latency (ns)": 625818939, "99.00 percentile latency (ns)": 643976624, "99.90 percentile latency (ns)": 654377556, "Max latency (ns)": 665401222, "Mean latency (ns)": 503697151, "Min duration satisfied": "Yes", "Min latency (ns)": 482237105, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 1.99, "QPS w/o loadgen overhead": 1.99, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 516.635786, "characteristics.90th_percentile_latency_ns": 516635786.0, "characteristics.90th_percentile_latency_s": 0.516635786, "characteristics.90th_percentile_latency_us": 516635.786, "characteristics.accuracy": 78.564, "characteristics.good": 39282, "characteristics.power": 3.6418598188806097, "characteristics.power.normalized_per_core": 0.030348831824005083, "characteristics.power.normalized_per_processor": 3.6418598188806097, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite4-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "efficientnet-lite4-quantized", "input_data_types": "uint8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite4.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 1.99601, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "61e9404257bdcf9b", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 14891023, "90.00 percentile latency (ns)": 18782367, "90th percentile latency (ns)": 18782367, "95.00 percentile latency (ns)": 22197527, "97.00 percentile latency (ns)": 23125107, "99.00 percentile latency (ns)": 24320693, "99.90 percentile latency (ns)": 28601603, "Max latency (ns)": 35321197, "Mean latency (ns)": 15878773, "Min duration satisfied": "Yes", "Min latency (ns)": 14269250, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 62.91, "QPS w/o loadgen overhead": 62.98, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 18.782367, "characteristics.90th_percentile_latency_ns": 18782367.0, "characteristics.90th_percentile_latency_s": 0.018782367, "characteristics.90th_percentile_latency_us": 18782.367, "characteristics.accuracy": 63.65, "characteristics.good": 31825, "characteristics.power": 0.10165405908897997, "characteristics.power.normalized_per_core": 0.000847117159074833, "characteristics.power.normalized_per_processor": 0.10165405908897997, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-224-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.5-224-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_224_50.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 62.5, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "16c14c0ab8aa1775", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 8749586, "90.00 percentile latency (ns)": 10462162, "90th percentile latency (ns)": 10462162, "95.00 percentile latency (ns)": 11151223, "97.00 percentile latency (ns)": 11377209, "99.00 percentile latency (ns)": 12189591, "99.90 percentile latency (ns)": 15189910, "Max latency (ns)": 31910061, "Mean latency (ns)": 9131376, "Min duration satisfied": "Yes", "Min latency (ns)": 8402161, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 109.35, "QPS w/o loadgen overhead": 109.51, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 10.462162, "characteristics.90th_percentile_latency_ns": 10462162.0, "characteristics.90th_percentile_latency_s": 0.010462162, "characteristics.90th_percentile_latency_us": 10462.162, "characteristics.accuracy": 52.172, "characteristics.good": 26086, "characteristics.power": 0.05198523382320212, "characteristics.power.normalized_per_core": 0.0004332102818600177, "characteristics.power.normalized_per_processor": 0.05198523382320212, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-128-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.35-128-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.35_128.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 100, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "dd6efb4934416a02", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 10102440, "90.00 percentile latency (ns)": 12444369, "90th percentile latency (ns)": 12444369, "95.00 percentile latency (ns)": 13431346, "97.00 percentile latency (ns)": 13768284, "99.00 percentile latency (ns)": 14728799, "99.90 percentile latency (ns)": 17806397, "Max latency (ns)": 25568945, "Mean latency (ns)": 10511273, "Min duration satisfied": "Yes", "Min latency (ns)": 9782114, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 95.01, "QPS w/o loadgen overhead": 95.14, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 12.444369, "characteristics.90th_percentile_latency_ns": 12444369.0, "characteristics.90th_percentile_latency_s": 0.012444369, "characteristics.90th_percentile_latency_us": 12444.369, "characteristics.accuracy": 58.402, "characteristics.good": 29201, "characteristics.power": 0.06156319884024529, "characteristics.power.normalized_per_core": 0.0005130266570020441, "characteristics.power.normalized_per_processor": 0.06156319884024529, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-128-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.5-128-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.5_128.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 90.9091, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "82e6c3d588146d4a", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 20505581, "90.00 percentile latency (ns)": 23797225, "90th percentile latency (ns)": 23797225, "95.00 percentile latency (ns)": 25556720, "97.00 percentile latency (ns)": 26072857, "99.00 percentile latency (ns)": 27351823, "99.90 percentile latency (ns)": 31341045, "Max latency (ns)": 43238571, "Mean latency (ns)": 21171119, "Min duration satisfied": "Yes", "Min latency (ns)": 19918969, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 47.2, "QPS w/o loadgen overhead": 47.23, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 23.797225, "characteristics.90th_percentile_latency_ns": 23797225.0, "characteristics.90th_percentile_latency_s": 0.023797225, "characteristics.90th_percentile_latency_us": 23797.225, "characteristics.accuracy": 60.976, "characteristics.good": 30488, "characteristics.power": 0.12239772029068445, "characteristics.power.normalized_per_core": 0.0010199810024223703, "characteristics.power.normalized_per_processor": 0.12239772029068445, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.35-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.35_224.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 41.6667, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "4468baa8959a8bdd", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 5289071, "90.00 percentile latency (ns)": 7157948, "90th percentile latency (ns)": 7157948, "95.00 percentile latency (ns)": 7497352, "97.00 percentile latency (ns)": 7691836, "99.00 percentile latency (ns)": 8236642, "99.90 percentile latency (ns)": 10976871, "Max latency (ns)": 25998535, "Mean latency (ns)": 5588792, "Min duration satisfied": "Yes", "Min latency (ns)": 4845589, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 178.42, "QPS w/o loadgen overhead": 178.93, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 7.157948, "characteristics.90th_percentile_latency_ns": 7157948.0, "characteristics.90th_percentile_latency_s": 0.007157948, "characteristics.90th_percentile_latency_us": 7157.948, "characteristics.accuracy": 48.114, "characteristics.good": 24057, "characteristics.power": 0.034173280126739265, "characteristics.power.normalized_per_core": 0.00028477733438949385, "characteristics.power.normalized_per_processor": 0.034173280126739265, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.25-192-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.25-192-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.25_192_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 166.667, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "e7bb7ed4927633b4", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 59144569, "90.00 percentile latency (ns)": 71464601, "90th percentile latency (ns)": 71464601, "95.00 percentile latency (ns)": 76529591, "97.00 percentile latency (ns)": 85739377, "99.00 percentile latency (ns)": 88612379, "99.90 percentile latency (ns)": 94565119, "Max latency (ns)": 97195341, "Mean latency (ns)": 61649435, "Min duration satisfied": "Yes", "Min latency (ns)": 57689219, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 16.22, "QPS w/o loadgen overhead": 16.22, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 71.464601, "characteristics.90th_percentile_latency_ns": 71464601.0, "characteristics.90th_percentile_latency_s": 0.071464601, "characteristics.90th_percentile_latency_us": 71464.601, "characteristics.accuracy": 75.068, "characteristics.good": 37534, "characteristics.power": 0.3946421817703448, "characteristics.power.normalized_per_core": 0.0032886848480862068, "characteristics.power.normalized_per_processor": 0.3946421817703448, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite0-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "efficientnet-lite0-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite0.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 15.873, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "4ca6be7a0b7df1e2", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 6636900, "90.00 percentile latency (ns)": 9143266, "90th percentile latency (ns)": 9143266, "95.00 percentile latency (ns)": 9517443, "97.00 percentile latency (ns)": 9755771, "99.00 percentile latency (ns)": 10361053, "99.90 percentile latency (ns)": 13243985, "Max latency (ns)": 29047484, "Mean latency (ns)": 7112955, "Min duration satisfied": "Yes", "Min latency (ns)": 6118948, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 140.28, "QPS w/o loadgen overhead": 140.59, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 9.143266, "characteristics.90th_percentile_latency_ns": 9143266.0, "characteristics.90th_percentile_latency_s": 0.009143266, "characteristics.90th_percentile_latency_us": 9143.266, "characteristics.accuracy": 50.164, "characteristics.good": 25082, "characteristics.power": 0.04381100719492835, "characteristics.power.normalized_per_core": 0.0003650917266244029, "characteristics.power.normalized_per_processor": 0.04381100719492835, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.25-224-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.25-224-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.25_224_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 125, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "026ad6e0c8a79506", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 12020698, "90.00 percentile latency (ns)": 16047213, "90th percentile latency (ns)": 16047213, "95.00 percentile latency (ns)": 17045701, "97.00 percentile latency (ns)": 17494015, "99.00 percentile latency (ns)": 18502404, "99.90 percentile latency (ns)": 22119244, "Max latency (ns)": 38053573, "Mean latency (ns)": 12657154, "Min duration satisfied": "Yes", "Min latency (ns)": 11420028, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 78.91, "QPS w/o loadgen overhead": 79.01, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 16.047213, "characteristics.90th_percentile_latency_ns": 16047213.0, "characteristics.90th_percentile_latency_s": 0.016047213, "characteristics.90th_percentile_latency_us": 16047.213, "characteristics.accuracy": 60.842, "characteristics.good": 30421, "characteristics.power": 0.0779310554574866, "characteristics.power.normalized_per_core": 0.0006494254621457217, "characteristics.power.normalized_per_processor": 0.0779310554574866, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.5-160-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.5-160-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.5_160.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 71.4286, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "7c49aab6eefe28d8", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 27327896, "90.00 percentile latency (ns)": 33920720, "90th percentile latency (ns)": 33920720, "95.00 percentile latency (ns)": 38656213, "97.00 percentile latency (ns)": 39449292, "99.00 percentile latency (ns)": 41234345, "99.90 percentile latency (ns)": 47924800, "Max latency (ns)": 58759200, "Mean latency (ns)": 28718924, "Min duration satisfied": "Yes", "Min latency (ns)": 26710854, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 34.8, "QPS w/o loadgen overhead": 34.82, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 33.92072, "characteristics.90th_percentile_latency_ns": 33920720.0, "characteristics.90th_percentile_latency_s": 0.03392072, "characteristics.90th_percentile_latency_us": 33920.72, "characteristics.accuracy": 69.016, "characteristics.good": 34508, "characteristics.power": 0.17947760121835607, "characteristics.power.normalized_per_core": 0.001495646676819634, "characteristics.power.normalized_per_processor": 0.17947760121835607, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-160-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-1.0-160-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_1.0_160.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 30.303, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "c69de88920854d71", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 152988394, "90.00 percentile latency (ns)": 170100605, "90th percentile latency (ns)": 170100605, "95.00 percentile latency (ns)": 175787610, "97.00 percentile latency (ns)": 186616807, "99.00 percentile latency (ns)": 250991789, "99.90 percentile latency (ns)": 287867102, "Max latency (ns)": 293596238, "Mean latency (ns)": 159485998, "Min duration satisfied": "Yes", "Min latency (ns)": 151451151, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 6.27, "QPS w/o loadgen overhead": 6.27, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 170.100605, "characteristics.90th_percentile_latency_ns": 170100605.0, "characteristics.90th_percentile_latency_s": 0.170100605, "characteristics.90th_percentile_latency_us": 170100.605, "characteristics.accuracy": 74.116, "characteristics.good": 37058, "characteristics.power": 1.1525501135906304, "characteristics.power.normalized_per_core": 0.00960458427992192, "characteristics.power.normalized_per_processor": 1.1525501135906304, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite1-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "efficientnet-lite1-quantized", "input_data_types": "uint8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite1.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 6.32911, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "f3b0e21a4c8a8cda", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 11709220, "90.00 percentile latency (ns)": 16882439, "90th percentile latency (ns)": 16882439, "95.00 percentile latency (ns)": 17419722, "97.00 percentile latency (ns)": 17932100, "99.00 percentile latency (ns)": 18979187, "99.90 percentile latency (ns)": 22676605, "Max latency (ns)": 37461848, "Mean latency (ns)": 12701595, "Min duration satisfied": "Yes", "Min latency (ns)": 10973866, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 78.63, "QPS w/o loadgen overhead": 78.73, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 16.882439, "characteristics.90th_percentile_latency_ns": 16882439.0, "characteristics.90th_percentile_latency_s": 0.016882439, "characteristics.90th_percentile_latency_us": 16882.439, "characteristics.accuracy": 61.948, "characteristics.good": 30974, "characteristics.power": 0.07964215916943285, "characteristics.power.normalized_per_core": 0.0006636846597452737, "characteristics.power.normalized_per_processor": 0.07964215916943285, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-192-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.5-192-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_192_50.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 76.9231, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "4dea15b3e35cd369", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 12597697, "90.00 percentile latency (ns)": 16986375, "90th percentile latency (ns)": 16986375, "95.00 percentile latency (ns)": 19608564, "97.00 percentile latency (ns)": 20369396, "99.00 percentile latency (ns)": 21377480, "99.90 percentile latency (ns)": 24588830, "Max latency (ns)": 39851963, "Mean latency (ns)": 13446964, "Min duration satisfied": "Yes", "Min latency (ns)": 12000483, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 74.27, "QPS w/o loadgen overhead": 74.37, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 16.986375, "characteristics.90th_percentile_latency_ns": 16986375.0, "characteristics.90th_percentile_latency_s": 0.016986375, "characteristics.90th_percentile_latency_us": 16986.375, "characteristics.accuracy": 62.264, "characteristics.good": 31132, "characteristics.power": 0.08924257499280823, "characteristics.power.normalized_per_core": 0.0007436881249400685, "characteristics.power.normalized_per_processor": 0.08924257499280823, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.5-224-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.5-224-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.5_224_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 71.4286, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "fbc225527c877359", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 6618888, "90.00 percentile latency (ns)": 9243242, "90th percentile latency (ns)": 9243242, "95.00 percentile latency (ns)": 9492255, "97.00 percentile latency (ns)": 9706383, "99.00 percentile latency (ns)": 10525902, "99.90 percentile latency (ns)": 13955963, "Max latency (ns)": 34805199, "Mean latency (ns)": 7100938, "Min duration satisfied": "Yes", "Min latency (ns)": 5849422, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 140.48, "QPS w/o loadgen overhead": 140.83, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 9.243242, "characteristics.90th_percentile_latency_ns": 9243242.0, "characteristics.90th_percentile_latency_s": 0.009243242, "characteristics.90th_percentile_latency_us": 9243.242, "characteristics.accuracy": 49.19, "characteristics.good": 24595, "characteristics.power": 0.04276269115326649, "characteristics.power.normalized_per_core": 0.0003563557596105541, "characteristics.power.normalized_per_processor": 0.04276269115326649, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-128-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.35-128-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_128_35.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 125, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "465d9015802cbdb3", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 43137508, "90.00 percentile latency (ns)": 53278250, "90th percentile latency (ns)": 53278250, "95.00 percentile latency (ns)": 60198243, "97.00 percentile latency (ns)": 71878060, "99.00 percentile latency (ns)": 76373094, "99.90 percentile latency (ns)": 82700434, "Max latency (ns)": 110627829, "Mean latency (ns)": 45906890, "Min duration satisfied": "Yes", "Min latency (ns)": 42209416, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 21.78, "QPS w/o loadgen overhead": 21.78, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 53.27825, "characteristics.90th_percentile_latency_ns": 53278250.0, "characteristics.90th_percentile_latency_s": 0.05327825, "characteristics.90th_percentile_latency_us": 53278.25, "characteristics.accuracy": 73.556, "characteristics.good": 36778, "characteristics.power": 0.3224938347577304, "characteristics.power.normalized_per_core": 0.0026874486229810867, "characteristics.power.normalized_per_processor": 0.3224938347577304, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.4-224-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-1.4-224-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_224_140.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 21.2766, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "eb4dcead3dfff2ad", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 30656406, "90.00 percentile latency (ns)": 34205190, "90th percentile latency (ns)": 34205190, "95.00 percentile latency (ns)": 44303161, "97.00 percentile latency (ns)": 46621949, "99.00 percentile latency (ns)": 54597868, "99.90 percentile latency (ns)": 58658717, "Max latency (ns)": 65067297, "Mean latency (ns)": 32167271, "Min duration satisfied": "Yes", "Min latency (ns)": 30283265, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 31.07, "QPS w/o loadgen overhead": 31.09, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 34.20519, "characteristics.90th_percentile_latency_ns": 34205190.0, "characteristics.90th_percentile_latency_s": 0.03420519, "characteristics.90th_percentile_latency_us": 34205.19, "characteristics.accuracy": 70.764, "characteristics.good": 35382, "characteristics.power": 0.23218113353287656, "characteristics.power.normalized_per_core": 0.001934842779440638, "characteristics.power.normalized_per_processor": 0.23218113353287656, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-1.0-224-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-1.0-224-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_1.0_224_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 30.303, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "1191ca0b846d1847", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 7296050, "90.00 percentile latency (ns)": 8689239, "90th percentile latency (ns)": 8689239, "95.00 percentile latency (ns)": 8970309, "97.00 percentile latency (ns)": 9202259, "99.00 percentile latency (ns)": 9791879, "99.90 percentile latency (ns)": 13276972, "Max latency (ns)": 29382676, "Mean latency (ns)": 7618541, "Min duration satisfied": "Yes", "Min latency (ns)": 6820477, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 131.01, "QPS w/o loadgen overhead": 131.26, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 8.689239, "characteristics.90th_percentile_latency_ns": 8689239.0, "characteristics.90th_percentile_latency_s": 0.008689239, "characteristics.90th_percentile_latency_us": 8689.239, "characteristics.accuracy": 47.81, "characteristics.good": 23905, "characteristics.power": 0.042823466251424816, "characteristics.power.normalized_per_core": 0.00035686221876187347, "characteristics.power.normalized_per_processor": 0.042823466251424816, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.25-160-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.25-160-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.25_160.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 125, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "14350616cc43e19f", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 16977052, "90.00 percentile latency (ns)": 20478638, "90th percentile latency (ns)": 20478638, "95.00 percentile latency (ns)": 22495397, "97.00 percentile latency (ns)": 23098616, "99.00 percentile latency (ns)": 24420640, "99.90 percentile latency (ns)": 28977627, "Max latency (ns)": 36954772, "Mean latency (ns)": 17707605, "Min duration satisfied": "Yes", "Min latency (ns)": 16360272, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 56.42, "QPS w/o loadgen overhead": 56.47, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 20.478638, "characteristics.90th_percentile_latency_ns": 20478638.0, "characteristics.90th_percentile_latency_s": 0.020478638, "characteristics.90th_percentile_latency_us": 20478.638, "characteristics.accuracy": 64.038, "characteristics.good": 32019, "characteristics.power": 0.10730713380146079, "characteristics.power.normalized_per_core": 0.0008942261150121732, "characteristics.power.normalized_per_processor": 0.10730713380146079, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-128-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.75-128-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.75_128.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 55.5556, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "663ef858d3418b98", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 12682246, "90.00 percentile latency (ns)": 14392910, "90th percentile latency (ns)": 14392910, "95.00 percentile latency (ns)": 15802799, "97.00 percentile latency (ns)": 16139445, "99.00 percentile latency (ns)": 16926959, "99.90 percentile latency (ns)": 19844673, "Max latency (ns)": 37163098, "Mean latency (ns)": 13052287, "Min duration satisfied": "Yes", "Min latency (ns)": 12110961, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 76.53, "QPS w/o loadgen overhead": 76.61, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 14.39291, "characteristics.90th_percentile_latency_ns": 14392910.0, "characteristics.90th_percentile_latency_s": 0.01439291, "characteristics.90th_percentile_latency_us": 14392.91, "characteristics.accuracy": 51.848, "characteristics.good": 25924, "characteristics.power": 0.07393776009882569, "characteristics.power.normalized_per_core": 0.0006161480008235475, "characteristics.power.normalized_per_processor": 0.07393776009882569, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.25-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.25-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.25_224.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 71.4286, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "194f7596d37ffd78", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 9290274, "90.00 percentile latency (ns)": 13364758, "90th percentile latency (ns)": 13364758, "95.00 percentile latency (ns)": 13711323, "97.00 percentile latency (ns)": 14180017, "99.00 percentile latency (ns)": 15048553, "99.90 percentile latency (ns)": 18320091, "Max latency (ns)": 33146019, "Mean latency (ns)": 10225364, "Min duration satisfied": "Yes", "Min latency (ns)": 8588437, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 97.63, "QPS w/o loadgen overhead": 97.8, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 13.364758, "characteristics.90th_percentile_latency_ns": 13364758.0, "characteristics.90th_percentile_latency_s": 0.013364758, "characteristics.90th_percentile_latency_us": 13364.758, "characteristics.accuracy": 59.232, "characteristics.good": 29616, "characteristics.power": 0.06281086374027967, "characteristics.power.normalized_per_core": 0.0005234238645023306, "characteristics.power.normalized_per_processor": 0.06281086374027967, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-160-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.5-160-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_160_50.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 90.9091, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "4c893aaba41d49e3", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 17534110, "90.00 percentile latency (ns)": 21032703, "90th percentile latency (ns)": 21032703, "95.00 percentile latency (ns)": 25948411, "97.00 percentile latency (ns)": 29392215, "99.00 percentile latency (ns)": 30886073, "99.90 percentile latency (ns)": 33981567, "Max latency (ns)": 39664323, "Mean latency (ns)": 18652872, "Min duration satisfied": "Yes", "Min latency (ns)": 16579221, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 53.56, "QPS w/o loadgen overhead": 53.61, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 21.032703, "characteristics.90th_percentile_latency_ns": 21032703.0, "characteristics.90th_percentile_latency_s": 0.021032703, "characteristics.90th_percentile_latency_us": 21032.703, "characteristics.accuracy": 68.212, "characteristics.good": 34106, "characteristics.power": 0.12860250948118873, "characteristics.power.normalized_per_core": 0.0010716875790099062, "characteristics.power.normalized_per_processor": 0.12860250948118873, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-1.0-160-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-1.0-160-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_1.0_160_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 52.6316, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "174f37af11d1eef8", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 8610990, "90.00 percentile latency (ns)": 11372093, "90th percentile latency (ns)": 11372093, "95.00 percentile latency (ns)": 11821080, "97.00 percentile latency (ns)": 12251332, "99.00 percentile latency (ns)": 13339693, "99.90 percentile latency (ns)": 16973966, "Max latency (ns)": 25976123, "Mean latency (ns)": 9255328, "Min duration satisfied": "Yes", "Min latency (ns)": 7965207, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 107.84, "QPS w/o loadgen overhead": 108.05, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 11.372093, "characteristics.90th_percentile_latency_ns": 11372093.0, "characteristics.90th_percentile_latency_s": 0.011372093, "characteristics.90th_percentile_latency_us": 11372.093, "characteristics.accuracy": 59.072, "characteristics.good": 29536, "characteristics.power": 0.0571775851144389, "characteristics.power.normalized_per_core": 0.0004764798759536575, "characteristics.power.normalized_per_processor": 0.0571775851144389, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-96-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-1.0-96-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_96_100.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 100, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "9517e3c432fb10c3", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 8254027, "90.00 percentile latency (ns)": 12691292, "90th percentile latency (ns)": 12691292, "95.00 percentile latency (ns)": 12983100, "97.00 percentile latency (ns)": 13371719, "99.00 percentile latency (ns)": 14138079, "99.90 percentile latency (ns)": 17003326, "Max latency (ns)": 32488732, "Mean latency (ns)": 9153424, "Min duration satisfied": "Yes", "Min latency (ns)": 7520685, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 109.06, "QPS w/o loadgen overhead": 109.25, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 12.691292, "characteristics.90th_percentile_latency_ns": 12691292.0, "characteristics.90th_percentile_latency_s": 0.012691292, "characteristics.90th_percentile_latency_us": 12691.292, "characteristics.accuracy": 58.386, "characteristics.good": 29193, "characteristics.power": 0.05951367939089962, "characteristics.power.normalized_per_core": 0.0004959473282574969, "characteristics.power.normalized_per_processor": 0.05951367939089962, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.75-128-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.75-128-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.75_128_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 100, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "b7921f70f9401321", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 29006683, "90.00 percentile latency (ns)": 35020575, "90th percentile latency (ns)": 35020575, "95.00 percentile latency (ns)": 41486092, "97.00 percentile latency (ns)": 45110531, "99.00 percentile latency (ns)": 49006515, "99.90 percentile latency (ns)": 53904049, "Max latency (ns)": 62887955, "Mean latency (ns)": 30676935, "Min duration satisfied": "Yes", "Min latency (ns)": 28307786, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 32.58, "QPS w/o loadgen overhead": 32.6, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 35.020575, "characteristics.90th_percentile_latency_ns": 35020575.0, "characteristics.90th_percentile_latency_s": 0.035020575, "characteristics.90th_percentile_latency_us": 35020.575, "characteristics.accuracy": 72.894, "characteristics.good": 36447, "characteristics.power": 0.20262032725698947, "characteristics.power.normalized_per_core": 0.0016885027271415789, "characteristics.power.normalized_per_processor": 0.20262032725698947, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-large_224_1.0_uint8", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v3-large_224_1.0_uint8", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-large_224_1.0_uint8.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 31.25, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "326a08caa6c24ae3", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 27934526, "90.00 percentile latency (ns)": 33059172, "90th percentile latency (ns)": 33059172, "95.00 percentile latency (ns)": 40601081, "97.00 percentile latency (ns)": 44430177, "99.00 percentile latency (ns)": 48324479, "99.90 percentile latency (ns)": 53204390, "Max latency (ns)": 59000413, "Mean latency (ns)": 29441204, "Min duration satisfied": "Yes", "Min latency (ns)": 27347022, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 33.95, "QPS w/o loadgen overhead": 33.97, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 33.059172, "characteristics.90th_percentile_latency_ns": 33059172.0, "characteristics.90th_percentile_latency_s": 0.033059172, "characteristics.90th_percentile_latency_us": 33059.172, "characteristics.accuracy": 70.598, "characteristics.good": 35299, "characteristics.power": 0.20359950863569765, "characteristics.power.normalized_per_core": 0.001696662571964147, "characteristics.power.normalized_per_processor": 0.20359950863569765, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-224-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-1.0-224-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_224_100.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 33.3333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "adce3e4a799f05ae", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 10814881, "90.00 percentile latency (ns)": 15482329, "90th percentile latency (ns)": 15482329, "95.00 percentile latency (ns)": 15992819, "97.00 percentile latency (ns)": 16537525, "99.00 percentile latency (ns)": 17471709, "99.90 percentile latency (ns)": 20885840, "Max latency (ns)": 29647880, "Mean latency (ns)": 11678856, "Min duration satisfied": "Yes", "Min latency (ns)": 10211220, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 85.5, "QPS w/o loadgen overhead": 85.62, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 15.482329, "characteristics.90th_percentile_latency_ns": 15482329.0, "characteristics.90th_percentile_latency_s": 0.015482329, "characteristics.90th_percentile_latency_us": 15482.329, "characteristics.accuracy": 56.522, "characteristics.good": 28261, "characteristics.power": 0.07334574690810763, "characteristics.power.normalized_per_core": 0.0006112145575675636, "characteristics.power.normalized_per_processor": 0.07334574690810763, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-192-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.35-192-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_192_35.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 83.3333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "149171cc31494fb8", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 16487462, "90.00 percentile latency (ns)": 23432752, "90th percentile latency (ns)": 23432752, "95.00 percentile latency (ns)": 25982395, "97.00 percentile latency (ns)": 26996327, "99.00 percentile latency (ns)": 28219733, "99.90 percentile latency (ns)": 32237261, "Max latency (ns)": 40756756, "Mean latency (ns)": 18095170, "Min duration satisfied": "Yes", "Min latency (ns)": 15526585, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 55.21, "QPS w/o loadgen overhead": 55.26, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 23.432752, "characteristics.90th_percentile_latency_ns": 23432752.0, "characteristics.90th_percentile_latency_s": 0.023432752, "characteristics.90th_percentile_latency_us": 23432.752, "characteristics.accuracy": 67.726, "characteristics.good": 33863, "characteristics.power": 0.11795334369388785, "characteristics.power.normalized_per_core": 0.0009829445307823989, "characteristics.power.normalized_per_processor": 0.11795334369388785, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-160-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-1.0-160-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_160_100.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 52.6316, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "857aef6e560939c1", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 5060595, "90.00 percentile latency (ns)": 6105979, "90th percentile latency (ns)": 6105979, "95.00 percentile latency (ns)": 6251628, "97.00 percentile latency (ns)": 6407953, "99.00 percentile latency (ns)": 6831296, "99.90 percentile latency (ns)": 10104444, "Max latency (ns)": 27148890, "Mean latency (ns)": 5291032, "Min duration satisfied": "Yes", "Min latency (ns)": 4840011, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 188.51, "QPS w/o loadgen overhead": 189.0, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 6.105979, "characteristics.90th_percentile_latency_ns": 6105979.0, "characteristics.90th_percentile_latency_s": 0.006105979, "characteristics.90th_percentile_latency_us": 6105.979, "characteristics.accuracy": 44.116, "characteristics.good": 22058, "characteristics.power": 0.02947726356441105, "characteristics.power.normalized_per_core": 0.00024564386303675874, "characteristics.power.normalized_per_processor": 0.02947726356441105, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.25-128-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.25-128-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.25_128.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 166.667, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "4d9dbd38281340f6", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 4202050, "90.00 percentile latency (ns)": 5737830, "90th percentile latency (ns)": 5737830, "95.00 percentile latency (ns)": 5914721, "97.00 percentile latency (ns)": 6053439, "99.00 percentile latency (ns)": 6482960, "99.90 percentile latency (ns)": 9505746, "Max latency (ns)": 25911158, "Mean latency (ns)": 4529575, "Min duration satisfied": "Yes", "Min latency (ns)": 3851577, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 220.04, "QPS w/o loadgen overhead": 220.77, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 5.73783, "characteristics.90th_percentile_latency_ns": 5737830.0, "characteristics.90th_percentile_latency_s": 0.00573783, "characteristics.90th_percentile_latency_us": 5737.83, "characteristics.accuracy": 45.444, "characteristics.good": 22722, "characteristics.power": 0.027150546186089516, "characteristics.power.normalized_per_core": 0.00022625455155074597, "characteristics.power.normalized_per_processor": 0.027150546186089516, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.25-160-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.25-160-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.25_160_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 200, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "0c4a0a7ee4be6a03", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 44123632, "90.00 percentile latency (ns)": 51240277, "90th percentile latency (ns)": 51240277, "95.00 percentile latency (ns)": 57468675, "97.00 percentile latency (ns)": 61738810, "99.00 percentile latency (ns)": 64078364, "99.90 percentile latency (ns)": 69817633, "Max latency (ns)": 76676668, "Mean latency (ns)": 45786754, "Min duration satisfied": "Yes", "Min latency (ns)": 43306040, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 21.83, "QPS w/o loadgen overhead": 21.84, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 51.240277, "characteristics.90th_percentile_latency_ns": 51240277.0, "characteristics.90th_percentile_latency_s": 0.051240277, "characteristics.90th_percentile_latency_us": 51240.277, "characteristics.accuracy": 70.624, "characteristics.good": 35312, "characteristics.power": 0.3104523823700499, "characteristics.power.normalized_per_core": 0.0025871031864170826, "characteristics.power.normalized_per_processor": 0.3104523823700499, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-1.0-192-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-1.0-192-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_1.0_192.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 20.8333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "2b6291b541078995", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 11266146, "90.00 percentile latency (ns)": 17240799, "90th percentile latency (ns)": 17240799, "95.00 percentile latency (ns)": 17661570, "97.00 percentile latency (ns)": 18308438, "99.00 percentile latency (ns)": 19288067, "99.90 percentile latency (ns)": 22901715, "Max latency (ns)": 37607568, "Mean latency (ns)": 12445264, "Min duration satisfied": "Yes", "Min latency (ns)": 10452200, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 80.25, "QPS w/o loadgen overhead": 80.35, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 17.240799, "characteristics.90th_percentile_latency_ns": 17240799.0, "characteristics.90th_percentile_latency_s": 0.017240799, "characteristics.90th_percentile_latency_us": 17240.799, "characteristics.accuracy": 63.442, "characteristics.good": 31721, "characteristics.power": 0.08029089138761597, "characteristics.power.normalized_per_core": 0.0006690907615634664, "characteristics.power.normalized_per_processor": 0.08029089138761597, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-128-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-1.0-128-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_128_100.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 76.9231, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "abfa07e2cfc630a4", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 22773070, "90.00 percentile latency (ns)": 25002214, "90th percentile latency (ns)": 25002214, "95.00 percentile latency (ns)": 32955866, "97.00 percentile latency (ns)": 37438954, "99.00 percentile latency (ns)": 40955997, "99.90 percentile latency (ns)": 44513624, "Max latency (ns)": 49584983, "Mean latency (ns)": 23861912, "Min duration satisfied": "Yes", "Min latency (ns)": 22425243, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 41.88, "QPS w/o loadgen overhead": 41.91, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 25.002214, "characteristics.90th_percentile_latency_ns": 25002214.0, "characteristics.90th_percentile_latency_s": 0.025002214, "characteristics.90th_percentile_latency_us": 25002.214, "characteristics.accuracy": 70.094, "characteristics.good": 35047, "characteristics.power": 0.17134201863136478, "characteristics.power.normalized_per_core": 0.0014278501552613732, "characteristics.power.normalized_per_processor": 0.17134201863136478, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-1.0-192-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-1.0-192-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_1.0_192_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 40, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "5b47b6327b0c19f2", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 214360323, "90.00 percentile latency (ns)": 230770955, "90th percentile latency (ns)": 230770955, "95.00 percentile latency (ns)": 239611503, "97.00 percentile latency (ns)": 251716889, "99.00 percentile latency (ns)": 329377347, "99.90 percentile latency (ns)": 360095929, "Max latency (ns)": 363027148, "Mean latency (ns)": 221498146, "Min duration satisfied": "Yes", "Min latency (ns)": 212327872, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 4.51, "QPS w/o loadgen overhead": 4.51, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 230.770955, "characteristics.90th_percentile_latency_ns": 230770955.0, "characteristics.90th_percentile_latency_s": 0.230770955, "characteristics.90th_percentile_latency_us": 230770.955, "characteristics.accuracy": 74.116, "characteristics.good": 37058, "characteristics.power": 1.5656063555090762, "characteristics.power.normalized_per_core": 0.013046719629242302, "characteristics.power.normalized_per_processor": 1.5656063555090762, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite2-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "efficientnet-lite2-quantized", "input_data_types": "uint8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite2.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 4.52489, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "392d0d345149d042", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 7552250, "90.00 percentile latency (ns)": 11090109, "90th percentile latency (ns)": 11090109, "95.00 percentile latency (ns)": 11339733, "97.00 percentile latency (ns)": 11668088, "99.00 percentile latency (ns)": 12377748, "99.90 percentile latency (ns)": 15209115, "Max latency (ns)": 30900240, "Mean latency (ns)": 8271151, "Min duration satisfied": "Yes", "Min latency (ns)": 6875791, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 120.66, "QPS w/o loadgen overhead": 120.9, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 11.090109, "characteristics.90th_percentile_latency_ns": 11090109.0, "characteristics.90th_percentile_latency_s": 0.011090109, "characteristics.90th_percentile_latency_us": 11090.109, "characteristics.accuracy": 59.432, "characteristics.good": 29716, "characteristics.power": 0.052438589803089644, "characteristics.power.normalized_per_core": 0.00043698824835908034, "characteristics.power.normalized_per_processor": 0.052438589803089644, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.5-160-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.5-160-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.5_160_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 111.111, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "3589d35e93341609", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 9149567, "90.00 percentile latency (ns)": 9623719, "90th percentile latency (ns)": 9623719, "95.00 percentile latency (ns)": 14543047, "97.00 percentile latency (ns)": 15162695, "99.00 percentile latency (ns)": 15873712, "99.90 percentile latency (ns)": 18742734, "Max latency (ns)": 28152749, "Mean latency (ns)": 9602843, "Min duration satisfied": "Yes", "Min latency (ns)": 8900830, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 103.98, "QPS w/o loadgen overhead": 104.14, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 9.623719, "characteristics.90th_percentile_latency_ns": 9623719.0, "characteristics.90th_percentile_latency_s": 0.009623719, "characteristics.90th_percentile_latency_us": 9623.719, "characteristics.accuracy": 61.458, "characteristics.good": 30729, "characteristics.power": 0.06421738349875594, "characteristics.power.normalized_per_core": 0.0005351448624896329, "characteristics.power.normalized_per_processor": 0.06421738349875594, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.5-192-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.5-192-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.5_192_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 90.9091, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "da1095b80c0109e9", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 13427883, "90.00 percentile latency (ns)": 17408890, "90th percentile latency (ns)": 17408890, "95.00 percentile latency (ns)": 20134221, "97.00 percentile latency (ns)": 20863339, "99.00 percentile latency (ns)": 22056055, "99.90 percentile latency (ns)": 26409014, "Max latency (ns)": 43141567, "Mean latency (ns)": 14293197, "Min duration satisfied": "Yes", "Min latency (ns)": 12830214, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 69.88, "QPS w/o loadgen overhead": 69.96, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 17.40889, "characteristics.90th_percentile_latency_ns": 17408890.0, "characteristics.90th_percentile_latency_s": 0.01740889, "characteristics.90th_percentile_latency_us": 17408.89, "characteristics.accuracy": 58.544, "characteristics.good": 29272, "characteristics.power": 0.09184177738090459, "characteristics.power.normalized_per_core": 0.0007653481448408715, "characteristics.power.normalized_per_processor": 0.09184177738090459, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-224-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.35-224-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_224_35.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 66.6667, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "69bbafc1854b1cae", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 19633524, "90.00 percentile latency (ns)": 23900229, "90th percentile latency (ns)": 23900229, "95.00 percentile latency (ns)": 27573207, "97.00 percentile latency (ns)": 28172247, "99.00 percentile latency (ns)": 29613333, "99.90 percentile latency (ns)": 35124527, "Max latency (ns)": 44563271, "Mean latency (ns)": 20604100, "Min duration satisfied": "Yes", "Min latency (ns)": 18902977, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 48.5, "QPS w/o loadgen overhead": 48.53, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 23.900229, "characteristics.90th_percentile_latency_ns": 23900229.0, "characteristics.90th_percentile_latency_s": 0.023900229, "characteristics.90th_percentile_latency_us": 23900.229, "characteristics.accuracy": 66.036, "characteristics.good": 33018, "characteristics.power": 0.1268316236232108, "characteristics.power.normalized_per_core": 0.0010569301968600898, "characteristics.power.normalized_per_processor": 0.1268316236232108, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-128-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-1.0-128-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_1.0_128.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 43.4783, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "7b75b31876449d29", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 83829787, "90.00 percentile latency (ns)": 98478035, "90th percentile latency (ns)": 98478035, "95.00 percentile latency (ns)": 104373234, "97.00 percentile latency (ns)": 120068451, "99.00 percentile latency (ns)": 124515281, "99.90 percentile latency (ns)": 131719459, "Max latency (ns)": 138211047, "Mean latency (ns)": 87100527, "Min duration satisfied": "Yes", "Min latency (ns)": 82229753, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 11.48, "QPS w/o loadgen overhead": 11.48, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 98.478035, "characteristics.90th_percentile_latency_ns": 98478035.0, "characteristics.90th_percentile_latency_s": 0.098478035, "characteristics.90th_percentile_latency_us": 98478.035, "characteristics.accuracy": 76.642, "characteristics.good": 38321, "characteristics.power": 0.5734965298951706, "characteristics.power.normalized_per_core": 0.004779137749126422, "characteristics.power.normalized_per_processor": 0.5734965298951706, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite1-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "efficientnet-lite1-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite1.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 11.4943, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "2e3f1deee4f6fb35", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 21882481, "90.00 percentile latency (ns)": 26589232, "90th percentile latency (ns)": 26589232, "95.00 percentile latency (ns)": 32136917, "97.00 percentile latency (ns)": 35152772, "99.00 percentile latency (ns)": 36976272, "99.90 percentile latency (ns)": 41522547, "Max latency (ns)": 49967406, "Mean latency (ns)": 23064513, "Min duration satisfied": "Yes", "Min latency (ns)": 20761008, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 43.32, "QPS w/o loadgen overhead": 43.36, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 26.589232, "characteristics.90th_percentile_latency_ns": 26589232.0, "characteristics.90th_percentile_latency_s": 0.026589232, "characteristics.90th_percentile_latency_us": 26589.232, "characteristics.accuracy": 69.678, "characteristics.good": 34839, "characteristics.power": 0.15554011643965798, "characteristics.power.normalized_per_core": 0.0012961676369971499, "characteristics.power.normalized_per_processor": 0.15554011643965798, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-192-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-1.0-192-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_192_100.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 41.6667, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "3a73167d4d918a0b", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 36232731, "90.00 percentile latency (ns)": 41751166, "90th percentile latency (ns)": 41751166, "95.00 percentile latency (ns)": 50768599, "97.00 percentile latency (ns)": 55629420, "99.00 percentile latency (ns)": 57769004, "99.90 percentile latency (ns)": 61067485, "Max latency (ns)": 65592721, "Mean latency (ns)": 37883957, "Min duration satisfied": "Yes", "Min latency (ns)": 35638967, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 26.39, "QPS w/o loadgen overhead": 26.4, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 41.751166, "characteristics.90th_percentile_latency_ns": 41751166.0, "characteristics.90th_percentile_latency_s": 0.041751166, "characteristics.90th_percentile_latency_us": 41751.166, "characteristics.accuracy": 69.262, "characteristics.good": 34631, "characteristics.power": 0.24927833931506319, "characteristics.power.normalized_per_core": 0.0020773194942921933, "characteristics.power.normalized_per_processor": 0.24927833931506319, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.75-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.75-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.75_224.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 24.3902, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "924f3ea2a4a042cd", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 24558893, "90.00 percentile latency (ns)": 28580378, "90th percentile latency (ns)": 28580378, "95.00 percentile latency (ns)": 35755860, "97.00 percentile latency (ns)": 40090048, "99.00 percentile latency (ns)": 42043720, "99.90 percentile latency (ns)": 47035735, "Max latency (ns)": 53679202, "Mean latency (ns)": 25897128, "Min duration satisfied": "Yes", "Min latency (ns)": 23968903, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 38.59, "QPS w/o loadgen overhead": 38.61, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 28.580378, "characteristics.90th_percentile_latency_ns": 28580378.0, "characteristics.90th_percentile_latency_s": 0.028580378, "characteristics.90th_percentile_latency_us": 28580.378, "characteristics.accuracy": 68.76, "characteristics.good": 34380, "characteristics.power": 0.1764220626484126, "characteristics.power.normalized_per_core": 0.0014701838554034383, "characteristics.power.normalized_per_processor": 0.1764220626484126, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-224-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.75-224-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_224_75.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 37.037, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "44418795517f3df9", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 16511179, "90.00 percentile latency (ns)": 18868639, "90th percentile latency (ns)": 18868639, "95.00 percentile latency (ns)": 20886106, "97.00 percentile latency (ns)": 21293540, "99.00 percentile latency (ns)": 22445883, "99.90 percentile latency (ns)": 25850113, "Max latency (ns)": 42356217, "Mean latency (ns)": 17014335, "Min duration satisfied": "Yes", "Min latency (ns)": 15991933, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 58.72, "QPS w/o loadgen overhead": 58.77, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 18.868639, "characteristics.90th_percentile_latency_ns": 18868639.0, "characteristics.90th_percentile_latency_s": 0.018868639, "characteristics.90th_percentile_latency_us": 18868.639, "characteristics.accuracy": 63.33, "characteristics.good": 31665, "characteristics.power": 0.09852205563464903, "characteristics.power.normalized_per_core": 0.0008210171302887419, "characteristics.power.normalized_per_processor": 0.09852205563464903, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-small-minimalistic_224_1.0_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v3-small-minimalistic_224_1.0_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-small-minimalistic_224_1.0_float.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 55.5556, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "54a56bf8a4f32e57", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 8727865, "90.00 percentile latency (ns)": 11578539, "90th percentile latency (ns)": 11578539, "95.00 percentile latency (ns)": 12159342, "97.00 percentile latency (ns)": 12565310, "99.00 percentile latency (ns)": 13380840, "99.90 percentile latency (ns)": 16198086, "Max latency (ns)": 31681158, "Mean latency (ns)": 9355861, "Min duration satisfied": "Yes", "Min latency (ns)": 8252994, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 106.72, "QPS w/o loadgen overhead": 106.88, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 11.578539, "characteristics.90th_percentile_latency_ns": 11578539.0, "characteristics.90th_percentile_latency_s": 0.011578539, "characteristics.90th_percentile_latency_us": 11578.539, "characteristics.accuracy": 57.918, "characteristics.good": 28959, "characteristics.power": 0.05634936251819378, "characteristics.power.normalized_per_core": 0.00046957802098494816, "characteristics.power.normalized_per_processor": 0.05634936251819378, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.5-128-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.5-128-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.5_128.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 100, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "6bdf2861e4399a11", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 55925288, "90.00 percentile latency (ns)": 65465759, "90th percentile latency (ns)": 65465759, "95.00 percentile latency (ns)": 69840860, "97.00 percentile latency (ns)": 76871660, "99.00 percentile latency (ns)": 79853626, "99.90 percentile latency (ns)": 87847318, "Max latency (ns)": 99614390, "Mean latency (ns)": 57881938, "Min duration satisfied": "Yes", "Min latency (ns)": 54763283, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 17.27, "QPS w/o loadgen overhead": 17.28, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 65.465759, "characteristics.90th_percentile_latency_ns": 65465759.0, "characteristics.90th_percentile_latency_s": 0.065465759, "characteristics.90th_percentile_latency_us": 65465.759, "characteristics.accuracy": 71.674, "characteristics.good": 35837, "characteristics.power": 0.40070563943183574, "characteristics.power.normalized_per_core": 0.0033392136619319643, "characteristics.power.normalized_per_processor": 0.40070563943183574, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-1.0-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-1.0-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_1.0_224.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 16.129, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "95c0c986a4e14b61", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 5369040, "90.00 percentile latency (ns)": 6825258, "90th percentile latency (ns)": 6825258, "95.00 percentile latency (ns)": 7019965, "97.00 percentile latency (ns)": 7257698, "99.00 percentile latency (ns)": 7957715, "99.90 percentile latency (ns)": 11526636, "Max latency (ns)": 26899795, "Mean latency (ns)": 5705417, "Min duration satisfied": "Yes", "Min latency (ns)": 4841349, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 174.75, "QPS w/o loadgen overhead": 175.27, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 6.825258, "characteristics.90th_percentile_latency_ns": 6825258.0, "characteristics.90th_percentile_latency_s": 0.006825258, "characteristics.90th_percentile_latency_us": 6825.258, "characteristics.accuracy": 43.454, "characteristics.good": 21727, "characteristics.power": 0.03331149298342998, "characteristics.power.normalized_per_core": 0.0002775957748619165, "characteristics.power.normalized_per_processor": 0.03331149298342998, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-96-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.35-96-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_96_35.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 166.667, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "5014cd2b3ae9fcc8", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 264639122, "90.00 percentile latency (ns)": 285170420, "90th percentile latency (ns)": 285170420, "95.00 percentile latency (ns)": 299276097, "97.00 percentile latency (ns)": 353649016, "99.00 percentile latency (ns)": 418448499, "99.90 percentile latency (ns)": 423447616, "Max latency (ns)": 430766958, "Mean latency (ns)": 274857246, "Min duration satisfied": "Yes", "Min latency (ns)": 261124786, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 3.64, "QPS w/o loadgen overhead": 3.64, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 285.17042, "characteristics.90th_percentile_latency_ns": 285170420.0, "characteristics.90th_percentile_latency_s": 0.28517042, "characteristics.90th_percentile_latency_us": 285170.42, "characteristics.accuracy": 80.676, "characteristics.good": 40338, "characteristics.power": 1.8938073692910153, "characteristics.power.normalized_per_core": 0.015781728077425127, "characteristics.power.normalized_per_processor": 1.8938073692910153, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite4-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "efficientnet-lite4-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite4.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 3.62319, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "f830a9b1ca8aac37", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 22599671, "90.00 percentile latency (ns)": 26264949, "90th percentile latency (ns)": 26264949, "95.00 percentile latency (ns)": 32771581, "97.00 percentile latency (ns)": 36818438, "99.00 percentile latency (ns)": 38952423, "99.90 percentile latency (ns)": 42777091, "Max latency (ns)": 50834677, "Mean latency (ns)": 23774223, "Min duration satisfied": "Yes", "Min latency (ns)": 21899763, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 42.03, "QPS w/o loadgen overhead": 42.06, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 26.264949, "characteristics.90th_percentile_latency_ns": 26264949.0, "characteristics.90th_percentile_latency_s": 0.026264949, "characteristics.90th_percentile_latency_us": 26264.949, "characteristics.accuracy": 70.33, "characteristics.good": 35165, "characteristics.power": 0.16063789797248784, "characteristics.power.normalized_per_core": 0.001338649149770732, "characteristics.power.normalized_per_processor": 0.16063789797248784, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-large-minimalistic_224_1.0_uint8", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v3-large-minimalistic_224_1.0_uint8", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-large-minimalistic_224_1.0_uint8.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 41.6667, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "7aa040178ee6d94a", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 18361657, "90.00 percentile latency (ns)": 21187816, "90th percentile latency (ns)": 21187816, "95.00 percentile latency (ns)": 26901300, "97.00 percentile latency (ns)": 30351131, "99.00 percentile latency (ns)": 31701952, "99.90 percentile latency (ns)": 35561697, "Max latency (ns)": 40154540, "Mean latency (ns)": 19304104, "Min duration satisfied": "Yes", "Min latency (ns)": 17988299, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 51.76, "QPS w/o loadgen overhead": 51.8, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 21.187816, "characteristics.90th_percentile_latency_ns": 21187816.0, "characteristics.90th_percentile_latency_s": 0.021187816, "characteristics.90th_percentile_latency_us": 21187.816, "characteristics.accuracy": 67.4, "characteristics.good": 33700, "characteristics.power": 0.13058633358771526, "characteristics.power.normalized_per_core": 0.0010882194465642939, "characteristics.power.normalized_per_processor": 0.13058633358771526, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-192-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.75-192-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_192_75.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 47.619, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "a15836ffdd07337e", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 15283781, "90.00 percentile latency (ns)": 16466029, "90th percentile latency (ns)": 16466029, "95.00 percentile latency (ns)": 22304717, "97.00 percentile latency (ns)": 25919025, "99.00 percentile latency (ns)": 27117736, "99.90 percentile latency (ns)": 30374499, "Max latency (ns)": 40244704, "Mean latency (ns)": 16014256, "Min duration satisfied": "Yes", "Min latency (ns)": 14961597, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 62.39, "QPS w/o loadgen overhead": 62.44, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 16.466029, "characteristics.90th_percentile_latency_ns": 16466029.0, "characteristics.90th_percentile_latency_s": 0.016466029, "characteristics.90th_percentile_latency_us": 16466.029, "characteristics.accuracy": 67.208, "characteristics.good": 33604, "characteristics.power": 0.11179004489298276, "characteristics.power.normalized_per_core": 0.000931583707441523, "characteristics.power.normalized_per_processor": 0.11179004489298276, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.75-192-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.75-192-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.75_192_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 55.5556, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "03844133b17d7400", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 22983640, "90.00 percentile latency (ns)": 26622024, "90th percentile latency (ns)": 26622024, "95.00 percentile latency (ns)": 31949181, "97.00 percentile latency (ns)": 32754751, "99.00 percentile latency (ns)": 33888317, "99.90 percentile latency (ns)": 37455064, "Max latency (ns)": 49860803, "Mean latency (ns)": 23875620, "Min duration satisfied": "Yes", "Min latency (ns)": 22378665, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 41.86, "QPS w/o loadgen overhead": 41.88, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 26.622024, "characteristics.90th_percentile_latency_ns": 26622024.0, "characteristics.90th_percentile_latency_s": 0.026622024, "characteristics.90th_percentile_latency_us": 26622.024, "characteristics.accuracy": 64.348, "characteristics.good": 32174, "characteristics.power": 0.14719256457854007, "characteristics.power.normalized_per_core": 0.0012266047048211672, "characteristics.power.normalized_per_processor": 0.14719256457854007, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.5-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.5-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.5_224.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 40, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "817a4312ad7b3bba", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 17367710, "90.00 percentile latency (ns)": 18961117, "90th percentile latency (ns)": 18961117, "95.00 percentile latency (ns)": 24372676, "97.00 percentile latency (ns)": 25027754, "99.00 percentile latency (ns)": 26146986, "99.90 percentile latency (ns)": 29925400, "Max latency (ns)": 44977182, "Mean latency (ns)": 18005547, "Min duration satisfied": "Yes", "Min latency (ns)": 16853184, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 55.5, "QPS w/o loadgen overhead": 55.54, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 18.961117, "characteristics.90th_percentile_latency_ns": 18961117.0, "characteristics.90th_percentile_latency_s": 0.018961117, "characteristics.90th_percentile_latency_us": 18961.117, "characteristics.accuracy": 63.246, "characteristics.good": 31623, "characteristics.power": 0.11028281124613794, "characteristics.power.normalized_per_core": 0.0009190234270511495, "characteristics.power.normalized_per_processor": 0.11028281124613794, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.5-192-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.5-192-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.5_192.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 50, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "79e932f7cd24232a", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 14543176, "90.00 percentile latency (ns)": 17730493, "90th percentile latency (ns)": 17730493, "95.00 percentile latency (ns)": 19054482, "97.00 percentile latency (ns)": 19480936, "99.00 percentile latency (ns)": 20745370, "99.90 percentile latency (ns)": 24723244, "Max latency (ns)": 36385503, "Mean latency (ns)": 15200031, "Min duration satisfied": "Yes", "Min latency (ns)": 13941727, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 65.72, "QPS w/o loadgen overhead": 65.79, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 17.730493, "characteristics.90th_percentile_latency_ns": 17730493.0, "characteristics.90th_percentile_latency_s": 0.017730493, "characteristics.90th_percentile_latency_us": 17730.493, "characteristics.accuracy": 61.668, "characteristics.good": 30834, "characteristics.power": 0.089268723423248, "characteristics.power.normalized_per_core": 0.0007439060285270667, "characteristics.power.normalized_per_processor": 0.089268723423248, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-160-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.5-160-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.5_160.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 62.5, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "2e4d21b806e748f7", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 20107007, "90.00 percentile latency (ns)": 24314556, "90th percentile latency (ns)": 24314556, "95.00 percentile latency (ns)": 29686093, "97.00 percentile latency (ns)": 31114526, "99.00 percentile latency (ns)": 32354678, "99.90 percentile latency (ns)": 36128530, "Max latency (ns)": 41895458, "Mean latency (ns)": 21105938, "Min duration satisfied": "Yes", "Min latency (ns)": 19667978, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 47.35, "QPS w/o loadgen overhead": 47.38, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 24.314556, "characteristics.90th_percentile_latency_ns": 24314556.0, "characteristics.90th_percentile_latency_s": 0.024314556, "characteristics.90th_percentile_latency_us": 24314.556, "characteristics.accuracy": 66.384, "characteristics.good": 33192, "characteristics.power": 0.13605797052475033, "characteristics.power.normalized_per_core": 0.001133816421039586, "characteristics.power.normalized_per_processor": 0.13605797052475033, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.75-160-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.75-160-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.75_160.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 43.4783, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "1d09cebe55284147", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 5657595, "90.00 percentile latency (ns)": 7188394, "90th percentile latency (ns)": 7188394, "95.00 percentile latency (ns)": 7424797, "97.00 percentile latency (ns)": 7687699, "99.00 percentile latency (ns)": 8426904, "99.90 percentile latency (ns)": 12078693, "Max latency (ns)": 23540939, "Mean latency (ns)": 6018373, "Min duration satisfied": "Yes", "Min latency (ns)": 5042016, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 165.7, "QPS w/o loadgen overhead": 166.16, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 7.188394, "characteristics.90th_percentile_latency_ns": 7188394.0, "characteristics.90th_percentile_latency_s": 0.007188394, "characteristics.90th_percentile_latency_us": 7188.394, "characteristics.accuracy": 49.296, "characteristics.good": 24648, "characteristics.power": 0.03523352021387659, "characteristics.power.normalized_per_core": 0.0002936126684489716, "characteristics.power.normalized_per_processor": 0.03523352021387659, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-96-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.5-96-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_96_50.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 166.667, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "5983b36a5a27d70b", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 10238449, "90.00 percentile latency (ns)": 15465253, "90th percentile latency (ns)": 15465253, "95.00 percentile latency (ns)": 15753875, "97.00 percentile latency (ns)": 16277843, "99.00 percentile latency (ns)": 17251840, "99.90 percentile latency (ns)": 20705131, "Max latency (ns)": 36434064, "Mean latency (ns)": 11324144, "Min duration satisfied": "Yes", "Min latency (ns)": 9511261, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 88.18, "QPS w/o loadgen overhead": 88.31, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 15.465253, "characteristics.90th_percentile_latency_ns": 15465253.0, "characteristics.90th_percentile_latency_s": 0.015465253, "characteristics.90th_percentile_latency_us": 15465.253, "characteristics.accuracy": 62.082, "characteristics.good": 31041, "characteristics.power": 0.07167196660058761, "characteristics.power.normalized_per_core": 0.0005972663883382301, "characteristics.power.normalized_per_processor": 0.07167196660058761, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-128-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.75-128-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_128_75.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 83.3333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "a569484714b1dc2a", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 12530180, "90.00 percentile latency (ns)": 16045167, "90th percentile latency (ns)": 16045167, "95.00 percentile latency (ns)": 17424760, "97.00 percentile latency (ns)": 17888378, "99.00 percentile latency (ns)": 19223439, "99.90 percentile latency (ns)": 23104760, "Max latency (ns)": 29552601, "Mean latency (ns)": 13278291, "Min duration satisfied": "Yes", "Min latency (ns)": 11914775, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 75.23, "QPS w/o loadgen overhead": 75.31, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 16.045167, "characteristics.90th_percentile_latency_ns": 16045167.0, "characteristics.90th_percentile_latency_s": 0.016045167, "characteristics.90th_percentile_latency_us": 16045.167, "characteristics.accuracy": 61.224, "characteristics.good": 30612, "characteristics.power": 0.08070691776745927, "characteristics.power.normalized_per_core": 0.0006725576480621605, "characteristics.power.normalized_per_processor": 0.08070691776745927, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-96-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-1.0-96-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_1.0_96.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 66.6667, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "f143f3f4b194c7db", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 2984191, "90.00 percentile latency (ns)": 3804321, "90th percentile latency (ns)": 3804321, "95.00 percentile latency (ns)": 4132850, "97.00 percentile latency (ns)": 4212330, "99.00 percentile latency (ns)": 4454343, "99.90 percentile latency (ns)": 7253890, "Max latency (ns)": 23190657, "Mean latency (ns)": 3120435, "Min duration satisfied": "Yes", "Min latency (ns)": 2665531, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 319.12, "QPS w/o loadgen overhead": 320.47, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 3.804321, "characteristics.90th_percentile_latency_ns": 3804321.0, "characteristics.90th_percentile_latency_s": 0.003804321, "characteristics.90th_percentile_latency_us": 3804.321, "characteristics.accuracy": 42.348, "characteristics.good": 21174, "characteristics.power": 0.018529451395874228, "characteristics.power.normalized_per_core": 0.00015441209496561858, "characteristics.power.normalized_per_processor": 0.018529451395874228, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.25-128-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.25-128-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.25_128_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 250, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "5444aa1ab194103a", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 71398143, "90.00 percentile latency (ns)": 85553942, "90th percentile latency (ns)": 85553942, "95.00 percentile latency (ns)": 91482459, "97.00 percentile latency (ns)": 102440989, "99.00 percentile latency (ns)": 106189614, "99.90 percentile latency (ns)": 110471665, "Max latency (ns)": 114170974, "Mean latency (ns)": 74592103, "Min duration satisfied": "Yes", "Min latency (ns)": 70595898, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 13.4, "QPS w/o loadgen overhead": 13.41, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 85.553942, "characteristics.90th_percentile_latency_ns": 85553942.0, "characteristics.90th_percentile_latency_s": 0.085553942, "characteristics.90th_percentile_latency_us": 85553.942, "characteristics.accuracy": 75.012, "characteristics.good": 37506, "characteristics.power": 0.4788090175451681, "characteristics.power.normalized_per_core": 0.003990075146209734, "characteristics.power.normalized_per_processor": 0.4788090175451681, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.3-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-1.3-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_1.3_224.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 13.3333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "1e894d45ace7e356", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 12677029, "90.00 percentile latency (ns)": 17343769, "90th percentile latency (ns)": 17343769, "95.00 percentile latency (ns)": 18915439, "97.00 percentile latency (ns)": 19694636, "99.00 percentile latency (ns)": 20830296, "99.90 percentile latency (ns)": 25139350, "Max latency (ns)": 40680253, "Mean latency (ns)": 13609334, "Min duration satisfied": "Yes", "Min latency (ns)": 12028638, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 73.39, "QPS w/o loadgen overhead": 73.48, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 17.343769, "characteristics.90th_percentile_latency_ns": 17343769.0, "characteristics.90th_percentile_latency_s": 0.017343769, "characteristics.90th_percentile_latency_us": 17343.769, "characteristics.accuracy": 64.062, "characteristics.good": 32031, "characteristics.power": 0.08481726759872464, "characteristics.power.normalized_per_core": 0.0007068105633227053, "characteristics.power.normalized_per_processor": 0.08481726759872464, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-small_224_1.0_uint8", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v3-small_224_1.0_uint8", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-small_224_1.0_uint8.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 71.4286, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "6144beb0da8dc8d4", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 107023392, "90.00 percentile latency (ns)": 122852206, "90th percentile latency (ns)": 122852206, "95.00 percentile latency (ns)": 127200496, "97.00 percentile latency (ns)": 151239267, "99.00 percentile latency (ns)": 164854322, "99.90 percentile latency (ns)": 172605437, "Max latency (ns)": 176170620, "Mean latency (ns)": 111604824, "Min duration satisfied": "Yes", "Min latency (ns)": 106025248, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 8.96, "QPS w/o loadgen overhead": 8.96, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 122.852206, "characteristics.90th_percentile_latency_ns": 122852206.0, "characteristics.90th_percentile_latency_s": 0.122852206, "characteristics.90th_percentile_latency_us": 122852.206, "characteristics.accuracy": 77.542, "characteristics.good": 38771, "characteristics.power": 0.7476106284248133, "characteristics.power.normalized_per_core": 0.006230088570206778, "characteristics.power.normalized_per_processor": 0.7476106284248133, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite2-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "efficientnet-lite2-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite2.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 8.69565, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "d76d4c9a996eb05e", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 5369935, "90.00 percentile latency (ns)": 7707324, "90th percentile latency (ns)": 7707324, "95.00 percentile latency (ns)": 7966370, "97.00 percentile latency (ns)": 8177990, "99.00 percentile latency (ns)": 8777109, "99.90 percentile latency (ns)": 11794662, "Max latency (ns)": 29537837, "Mean latency (ns)": 5829649, "Min duration satisfied": "Yes", "Min latency (ns)": 4867150, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 171.08, "QPS w/o loadgen overhead": 171.54, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 7.707324, "characteristics.90th_percentile_latency_ns": 7707324.0, "characteristics.90th_percentile_latency_s": 0.007707324, "characteristics.90th_percentile_latency_us": 7707.324, "characteristics.accuracy": 56.738, "characteristics.good": 28369, "characteristics.power": 0.0364980925326257, "characteristics.power.normalized_per_core": 0.0003041507711052142, "characteristics.power.normalized_per_processor": 0.0364980925326257, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.5-128-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.5-128-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.5_128_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 166.667, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "a5b88260a7958999", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 7762233, "90.00 percentile latency (ns)": 10320504, "90th percentile latency (ns)": 10320504, "95.00 percentile latency (ns)": 10637323, "97.00 percentile latency (ns)": 10930502, "99.00 percentile latency (ns)": 11972350, "99.90 percentile latency (ns)": 15465926, "Max latency (ns)": 29719019, "Mean latency (ns)": 8331354, "Min duration satisfied": "Yes", "Min latency (ns)": 7079679, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 119.8, "QPS w/o loadgen overhead": 120.03, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 10.320504, "characteristics.90th_percentile_latency_ns": 10320504.0, "characteristics.90th_percentile_latency_s": 0.010320504, "characteristics.90th_percentile_latency_us": 10320.504, "characteristics.accuracy": 57.054, "characteristics.good": 28527, "characteristics.power": 0.05091197462331487, "characteristics.power.normalized_per_core": 0.0004242664551942906, "characteristics.power.normalized_per_processor": 0.05091197462331487, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-96-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.75-96-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_96_75.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 111.111, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "19e441c99d237748", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 75343974, "90.00 percentile latency (ns)": 88851667, "90th percentile latency (ns)": 88851667, "95.00 percentile latency (ns)": 96654508, "97.00 percentile latency (ns)": 109259055, "99.00 percentile latency (ns)": 113082266, "99.90 percentile latency (ns)": 117816546, "Max latency (ns)": 120882422, "Mean latency (ns)": 78640556, "Min duration satisfied": "Yes", "Min latency (ns)": 74476808, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 12.71, "QPS w/o loadgen overhead": 12.72, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 88.851667, "characteristics.90th_percentile_latency_ns": 88851667.0, "characteristics.90th_percentile_latency_s": 0.088851667, "characteristics.90th_percentile_latency_us": 88851.667, "characteristics.accuracy": 75.69, "characteristics.good": 37845, "characteristics.power": 0.5118991437126074, "characteristics.power.normalized_per_core": 0.004265826197605061, "characteristics.power.normalized_per_processor": 0.5118991437126074, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.4-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-1.4-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_1.4_224.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 12.3457, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "45f680a6054b111f", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 7607885, "90.00 percentile latency (ns)": 9232329, "90th percentile latency (ns)": 9232329, "95.00 percentile latency (ns)": 9804150, "97.00 percentile latency (ns)": 10089236, "99.00 percentile latency (ns)": 10940385, "99.90 percentile latency (ns)": 13966742, "Max latency (ns)": 27412347, "Mean latency (ns)": 7925615, "Min duration satisfied": "Yes", "Min latency (ns)": 7003935, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 125.94, "QPS w/o loadgen overhead": 126.17, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 9.232329, "characteristics.90th_percentile_latency_ns": 9232329.0, "characteristics.90th_percentile_latency_s": 0.009232329, "characteristics.90th_percentile_latency_us": 9232.329, "characteristics.accuracy": 52.446, "characteristics.good": 26223, "characteristics.power": 0.04604071380171944, "characteristics.power.normalized_per_core": 0.00038367261501432863, "characteristics.power.normalized_per_processor": 0.04604071380171944, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-96-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.5-96-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.5_96.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 111.111, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "1829770be477fb3d", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 43786582, "90.00 percentile latency (ns)": 53141720, "90th percentile latency (ns)": 53141720, "95.00 percentile latency (ns)": 58787936, "97.00 percentile latency (ns)": 61940607, "99.00 percentile latency (ns)": 64508140, "99.90 percentile latency (ns)": 71159294, "Max latency (ns)": 79710807, "Mean latency (ns)": 45775020, "Min duration satisfied": "Yes", "Min latency (ns)": 43156571, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 21.84, "QPS w/o loadgen overhead": 21.85, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 53.14172, "characteristics.90th_percentile_latency_ns": 53141720.0, "characteristics.90th_percentile_latency_s": 0.05314172, "characteristics.90th_percentile_latency_us": 53141.72, "characteristics.accuracy": 73.724, "characteristics.good": 36862, "characteristics.power": 0.2865667518369619, "characteristics.power.normalized_per_core": 0.002388056265308016, "characteristics.power.normalized_per_processor": 0.2865667518369619, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-large_224_0.75_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v3-large_224_0.75_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-large_224_0.75_float.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 21.2766, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "fffbb39b4f33b612", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 20784521, "90.00 percentile latency (ns)": 25086816, "90th percentile latency (ns)": 25086816, "95.00 percentile latency (ns)": 30033670, "97.00 percentile latency (ns)": 31005827, "99.00 percentile latency (ns)": 32445656, "99.90 percentile latency (ns)": 37521657, "Max latency (ns)": 45150692, "Mean latency (ns)": 21850465, "Min duration satisfied": "Yes", "Min latency (ns)": 20196216, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 45.73, "QPS w/o loadgen overhead": 45.77, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 25.086816, "characteristics.90th_percentile_latency_ns": 25086816.0, "characteristics.90th_percentile_latency_s": 0.025086816, "characteristics.90th_percentile_latency_us": 25086.816, "characteristics.accuracy": 66.604, "characteristics.good": 33302, "characteristics.power": 0.14681592170342278, "characteristics.power.normalized_per_core": 0.0012234660141951898, "characteristics.power.normalized_per_processor": 0.14681592170342278, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-1.0-128-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-1.0-128-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_1.0_128.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 43.4783, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "9224ca64e20bb6c9", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 31359651, "90.00 percentile latency (ns)": 35714673, "90th percentile latency (ns)": 35714673, "95.00 percentile latency (ns)": 44711561, "97.00 percentile latency (ns)": 47817044, "99.00 percentile latency (ns)": 51563083, "99.90 percentile latency (ns)": 54883682, "Max latency (ns)": 58494117, "Mean latency (ns)": 32809212, "Min duration satisfied": "Yes", "Min latency (ns)": 30721207, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 30.47, "QPS w/o loadgen overhead": 30.48, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 35.714673, "characteristics.90th_percentile_latency_ns": 35714673.0, "characteristics.90th_percentile_latency_s": 0.035714673, "characteristics.90th_percentile_latency_us": 35714.673, "characteristics.accuracy": 69.106, "characteristics.good": 34553, "characteristics.power": 0.21669254259133436, "characteristics.power.normalized_per_core": 0.0018057711882611197, "characteristics.power.normalized_per_processor": 0.21669254259133436, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-1.0-160-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-1.0-160-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_1.0_160.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 28.5714, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "5f0f84d028720ee6", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 10908725, "90.00 percentile latency (ns)": 13427874, "90th percentile latency (ns)": 13427874, "95.00 percentile latency (ns)": 14653162, "97.00 percentile latency (ns)": 15053894, "99.00 percentile latency (ns)": 16255942, "99.90 percentile latency (ns)": 19742995, "Max latency (ns)": 28704726, "Mean latency (ns)": 11446815, "Min duration satisfied": "Yes", "Min latency (ns)": 10288665, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 87.24, "QPS w/o loadgen overhead": 87.36, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 13.427874, "characteristics.90th_percentile_latency_ns": 13427874.0, "characteristics.90th_percentile_latency_s": 0.013427874, "characteristics.90th_percentile_latency_us": 13427.874, "characteristics.accuracy": 59.822, "characteristics.good": 29911, "characteristics.power": 0.0688269125039498, "characteristics.power.normalized_per_core": 0.0005735576041995817, "characteristics.power.normalized_per_processor": 0.0688269125039498, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-96-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.75-96-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.75_96.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 76.9231, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "e0404c8e91b49419", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 27490965, "90.00 percentile latency (ns)": 32967103, "90th percentile latency (ns)": 32967103, "95.00 percentile latency (ns)": 37333518, "97.00 percentile latency (ns)": 38670856, "99.00 percentile latency (ns)": 40191216, "99.90 percentile latency (ns)": 45658881, "Max latency (ns)": 53060696, "Mean latency (ns)": 28683791, "Min duration satisfied": "Yes", "Min latency (ns)": 26903682, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 34.84, "QPS w/o loadgen overhead": 34.86, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 32.967103, "characteristics.90th_percentile_latency_ns": 32967103.0, "characteristics.90th_percentile_latency_s": 0.032967103, "characteristics.90th_percentile_latency_us": 32967.103, "characteristics.accuracy": 68.336, "characteristics.good": 34168, "characteristics.power": 0.1758776947063028, "characteristics.power.normalized_per_core": 0.0014656474558858567, "characteristics.power.normalized_per_processor": 0.1758776947063028, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-small_224_1.0_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v3-small_224_1.0_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-small_224_1.0_float.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 34.4828, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "953a04fb4dc28daf", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 32811822, "90.00 percentile latency (ns)": 39354455, "90th percentile latency (ns)": 39354455, "95.00 percentile latency (ns)": 43283370, "97.00 percentile latency (ns)": 44136602, "99.00 percentile latency (ns)": 46464025, "99.90 percentile latency (ns)": 52271006, "Max latency (ns)": 62635165, "Mean latency (ns)": 34077042, "Min duration satisfied": "Yes", "Min latency (ns)": 32008302, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 29.33, "QPS w/o loadgen overhead": 29.35, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 39.354455, "characteristics.90th_percentile_latency_ns": 39354455.0, "characteristics.90th_percentile_latency_s": 0.039354455, "characteristics.90th_percentile_latency_us": 39354.455, "characteristics.accuracy": 68.834, "characteristics.good": 34417, "characteristics.power": 0.2093015195523619, "characteristics.power.normalized_per_core": 0.0017441793296030159, "characteristics.power.normalized_per_processor": 0.2093015195523619, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-192-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.75-192-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.75_192.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 25, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "c6704ed9927d55b9", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 98325927, "90.00 percentile latency (ns)": 113342719, "90th percentile latency (ns)": 113342719, "95.00 percentile latency (ns)": 116231432, "97.00 percentile latency (ns)": 121350150, "99.00 percentile latency (ns)": 173616720, "99.90 percentile latency (ns)": 182869552, "Max latency (ns)": 183990820, "Mean latency (ns)": 102507920, "Min duration satisfied": "Yes", "Min latency (ns)": 97286704, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 9.75, "QPS w/o loadgen overhead": 9.76, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 113.342719, "characteristics.90th_percentile_latency_ns": 113342719.0, "characteristics.90th_percentile_latency_s": 0.113342719, "characteristics.90th_percentile_latency_us": 113342.719, "characteristics.accuracy": 71.254, "characteristics.good": 35627, "characteristics.power": 0.7279847470318191, "characteristics.power.normalized_per_core": 0.006066539558598493, "characteristics.power.normalized_per_processor": 0.7279847470318191, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite0-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "efficientnet-lite0-quantized", "input_data_types": "uint8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite0.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 9.80392, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "40a8fdbb427064f9", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 157517677, "90.00 percentile latency (ns)": 175505269, "90th percentile latency (ns)": 175505269, "95.00 percentile latency (ns)": 186579154, "97.00 percentile latency (ns)": 218420710, "99.00 percentile latency (ns)": 250141194, "99.90 percentile latency (ns)": 258385579, "Max latency (ns)": 260213769, "Mean latency (ns)": 164399218, "Min duration satisfied": "Yes", "Min latency (ns)": 155996112, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 6.08, "QPS w/o loadgen overhead": 6.08, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 175.505269, "characteristics.90th_percentile_latency_ns": 175505269.0, "characteristics.90th_percentile_latency_s": 0.175505269, "characteristics.90th_percentile_latency_us": 175505.269, "characteristics.accuracy": 79.268, "characteristics.good": 39634, "characteristics.power": 1.1109174661372503, "characteristics.power.normalized_per_core": 0.009257645551143752, "characteristics.power.normalized_per_processor": 1.1109174661372503, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite3-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "efficientnet-lite3-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite3.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 6.21118, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "c01f29453195b3ea", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 24168786, "90.00 percentile latency (ns)": 28946381, "90th percentile latency (ns)": 28946381, "95.00 percentile latency (ns)": 32793092, "97.00 percentile latency (ns)": 33731852, "99.00 percentile latency (ns)": 35297535, "99.90 percentile latency (ns)": 39910475, "Max latency (ns)": 50230787, "Mean latency (ns)": 25197008, "Min duration satisfied": "Yes", "Min latency (ns)": 23608701, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 39.66, "QPS w/o loadgen overhead": 39.69, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 28.946381, "characteristics.90th_percentile_latency_ns": 28946381.0, "characteristics.90th_percentile_latency_s": 0.028946381, "characteristics.90th_percentile_latency_us": 28946.381, "characteristics.accuracy": 66.216, "characteristics.good": 33108, "characteristics.power": 0.15292359178130097, "characteristics.power.normalized_per_core": 0.0012743632648441747, "characteristics.power.normalized_per_processor": 0.15292359178130097, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-small_224_0.75_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v3-small_224_0.75_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-small_224_0.75_float.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 38.4615, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "39df4bc4bf24f11b", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 302369450, "90.00 percentile latency (ns)": 321198499, "90th percentile latency (ns)": 321198499, "95.00 percentile latency (ns)": 330538153, "97.00 percentile latency (ns)": 377867625, "99.00 percentile latency (ns)": 444627621, "99.90 percentile latency (ns)": 461026500, "Max latency (ns)": 463345517, "Mean latency (ns)": 310545679, "Min duration satisfied": "Yes", "Min latency (ns)": 297509204, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 3.22, "QPS w/o loadgen overhead": 3.22, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 321.198499, "characteristics.90th_percentile_latency_ns": 321198499.0, "characteristics.90th_percentile_latency_s": 0.321198499, "characteristics.90th_percentile_latency_us": 321198.499, "characteristics.accuracy": 76.348, "characteristics.good": 38174, "characteristics.power": 2.218428143883042, "characteristics.power.normalized_per_core": 0.018486901199025352, "characteristics.power.normalized_per_processor": 2.218428143883042, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite3-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "efficientnet-lite3-quantized", "input_data_types": "uint8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite3.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 3.24675, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "4ef80c8dc340379e", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 8785596, "90.00 percentile latency (ns)": 12261707, "90th percentile latency (ns)": 12261707, "95.00 percentile latency (ns)": 12598011, "97.00 percentile latency (ns)": 12996511, "99.00 percentile latency (ns)": 13820306, "99.90 percentile latency (ns)": 16834724, "Max latency (ns)": 30222830, "Mean latency (ns)": 9649556, "Min duration satisfied": "Yes", "Min latency (ns)": 8052927, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 103.44, "QPS w/o loadgen overhead": 103.63, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 12.261707, "characteristics.90th_percentile_latency_ns": 12261707.0, "characteristics.90th_percentile_latency_s": 0.012261707, "characteristics.90th_percentile_latency_us": 12261.707, "characteristics.accuracy": 54.504, "characteristics.good": 27252, "characteristics.power": 0.058742427171951536, "characteristics.power.normalized_per_core": 0.0004895202264329295, "characteristics.power.normalized_per_processor": 0.058742427171951536, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-160-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.35-160-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_160_35.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 100, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "76c968415fa1c926", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 9527917, "90.00 percentile latency (ns)": 11316230, "90th percentile latency (ns)": 11316230, "95.00 percentile latency (ns)": 11839083, "97.00 percentile latency (ns)": 12139822, "99.00 percentile latency (ns)": 12878643, "99.90 percentile latency (ns)": 16551283, "Max latency (ns)": 33013202, "Mean latency (ns)": 9819079, "Min duration satisfied": "Yes", "Min latency (ns)": 9051517, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 101.69, "QPS w/o loadgen overhead": 101.84, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 11.31623, "characteristics.90th_percentile_latency_ns": 11316230.0, "characteristics.90th_percentile_latency_s": 0.01131623, "characteristics.90th_percentile_latency_us": 11316.23, "characteristics.accuracy": 49.478, "characteristics.good": 24739, "characteristics.power": 0.05551141094480403, "characteristics.power.normalized_per_core": 0.00046259509120670023, "characteristics.power.normalized_per_processor": 0.05551141094480403, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.25-192-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.25-192-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.25_192.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 100, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "a4c52b17a3276cf1", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 20993560, "90.00 percentile latency (ns)": 23941310, "90th percentile latency (ns)": 23941310, "95.00 percentile latency (ns)": 30718384, "97.00 percentile latency (ns)": 34887811, "99.00 percentile latency (ns)": 36295818, "99.90 percentile latency (ns)": 39354177, "Max latency (ns)": 47658884, "Mean latency (ns)": 22133365, "Min duration satisfied": "Yes", "Min latency (ns)": 20428072, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 45.15, "QPS w/o loadgen overhead": 45.18, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 23.94131, "characteristics.90th_percentile_latency_ns": 23941310.0, "characteristics.90th_percentile_latency_s": 0.02394131, "characteristics.90th_percentile_latency_us": 23941.31, "characteristics.accuracy": 68.124, "characteristics.good": 34062, "characteristics.power": 0.15429554254122121, "characteristics.power.normalized_per_core": 0.0012857961878435101, "characteristics.power.normalized_per_processor": 0.15429554254122121, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.75-224-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.75-224-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.75_224_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 45.4545, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "13466943dce4793b", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 55074158, "90.00 percentile latency (ns)": 67372790, "90th percentile latency (ns)": 67372790, "95.00 percentile latency (ns)": 72258975, "97.00 percentile latency (ns)": 79808903, "99.00 percentile latency (ns)": 83472901, "99.90 percentile latency (ns)": 90295456, "Max latency (ns)": 99474654, "Mean latency (ns)": 57733684, "Min duration satisfied": "Yes", "Min latency (ns)": 54385655, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 17.32, "QPS w/o loadgen overhead": 17.32, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 67.37279, "characteristics.90th_percentile_latency_ns": 67372790.0, "characteristics.90th_percentile_latency_s": 0.06737279, "characteristics.90th_percentile_latency_us": 67372.79, "characteristics.accuracy": 75.76, "characteristics.good": 37880, "characteristics.power": 0.363480904273776, "characteristics.power.normalized_per_core": 0.0030290075356148, "characteristics.power.normalized_per_processor": 0.363480904273776, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-large_224_1.0_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v3-large_224_1.0_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-large_224_1.0_float.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 18.1818, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "0fbf7447809892c4", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 26182363, "90.00 percentile latency (ns)": 30914564, "90th percentile latency (ns)": 30914564, "95.00 percentile latency (ns)": 34109001, "97.00 percentile latency (ns)": 34806042, "99.00 percentile latency (ns)": 36416306, "99.90 percentile latency (ns)": 41665182, "Max latency (ns)": 54014878, "Mean latency (ns)": 27111926, "Min duration satisfied": "Yes", "Min latency (ns)": 25466804, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 36.86, "QPS w/o loadgen overhead": 36.88, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 30.914564, "characteristics.90th_percentile_latency_ns": 30914564.0, "characteristics.90th_percentile_latency_s": 0.030914564, "characteristics.90th_percentile_latency_us": 30914.564, "characteristics.accuracy": 65.75, "characteristics.good": 32875, "characteristics.power": 0.16057157583484763, "characteristics.power.normalized_per_core": 0.001338096465290397, "characteristics.power.normalized_per_processor": 0.16057157583484763, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.5-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.5_224.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 33.3333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "b4b71ad8ed338b9b", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 11648504, "90.00 percentile latency (ns)": 17798392, "90th percentile latency (ns)": 17798392, "95.00 percentile latency (ns)": 19181961, "97.00 percentile latency (ns)": 19717610, "99.00 percentile latency (ns)": 20562949, "99.90 percentile latency (ns)": 23652176, "Max latency (ns)": 29965598, "Mean latency (ns)": 12818778, "Min duration satisfied": "Yes", "Min latency (ns)": 10673814, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 77.9, "QPS w/o loadgen overhead": 78.01, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 17.798392, "characteristics.90th_percentile_latency_ns": 17798392.0, "characteristics.90th_percentile_latency_s": 0.017798392, "characteristics.90th_percentile_latency_us": 17798.392, "characteristics.accuracy": 64.766, "characteristics.good": 32383, "characteristics.power": 0.08697177644679839, "characteristics.power.normalized_per_core": 0.0007247648037233199, "characteristics.power.normalized_per_processor": 0.08697177644679839, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-1.0-128-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-1.0-128-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_1.0_128_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 76.9231, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "8db90a5645f68092", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 43765641, "90.00 percentile latency (ns)": 52537930, "90th percentile latency (ns)": 52537930, "95.00 percentile latency (ns)": 56850120, "97.00 percentile latency (ns)": 57728261, "99.00 percentile latency (ns)": 60022011, "99.90 percentile latency (ns)": 66844117, "Max latency (ns)": 69698708, "Mean latency (ns)": 45389772, "Min duration satisfied": "Yes", "Min latency (ns)": 42307654, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 22.02, "QPS w/o loadgen overhead": 22.03, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 52.53793, "characteristics.90th_percentile_latency_ns": 52537930.0, "characteristics.90th_percentile_latency_s": 0.05253793, "characteristics.90th_percentile_latency_us": 52537.93, "characteristics.accuracy": 70.122, "characteristics.good": 35061, "characteristics.power": 0.2804980301881419, "characteristics.power.normalized_per_core": 0.0023374835849011826, "characteristics.power.normalized_per_processor": 0.2804980301881419, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.75-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.75_224.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 19.2308, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "d7b4cb2bce57ef54", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 11479255, "90.00 percentile latency (ns)": 13761360, "90th percentile latency (ns)": 13761360, "95.00 percentile latency (ns)": 18559000, "97.00 percentile latency (ns)": 19294262, "99.00 percentile latency (ns)": 20159800, "99.90 percentile latency (ns)": 23160534, "Max latency (ns)": 30268167, "Mean latency (ns)": 12133521, "Min duration satisfied": "Yes", "Min latency (ns)": 11110824, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 82.31, "QPS w/o loadgen overhead": 82.42, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 13.76136, "characteristics.90th_percentile_latency_ns": 13761360.0, "characteristics.90th_percentile_latency_s": 0.01376136, "characteristics.90th_percentile_latency_us": 13761.36, "characteristics.accuracy": 64.128, "characteristics.good": 32064, "characteristics.power": 0.08267364662984739, "characteristics.power.normalized_per_core": 0.0006889470552487282, "characteristics.power.normalized_per_processor": 0.08267364662984739, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.75-160-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.75-160-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.75_160_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 71.4286, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "90f4d749be768c47", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 19439990, "90.00 percentile latency (ns)": 23407475, "90th percentile latency (ns)": 23407475, "95.00 percentile latency (ns)": 25280227, "97.00 percentile latency (ns)": 25820661, "99.00 percentile latency (ns)": 27286961, "99.90 percentile latency (ns)": 31730751, "Max latency (ns)": 42127269, "Mean latency (ns)": 20235021, "Min duration satisfied": "Yes", "Min latency (ns)": 18729001, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 49.38, "QPS w/o loadgen overhead": 49.42, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 23.407475, "characteristics.90th_percentile_latency_ns": 23407475.0, "characteristics.90th_percentile_latency_s": 0.023407475, "characteristics.90th_percentile_latency_us": 23407.475, "characteristics.accuracy": 64.282, "characteristics.good": 32141, "characteristics.power": 0.11934607222123234, "characteristics.power.normalized_per_core": 0.0009945506018436028, "characteristics.power.normalized_per_processor": 0.11934607222123234, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-192-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.5-192-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.5_192.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 47.619, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "e8481f85e8b892d9", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 38025970, "90.00 percentile latency (ns)": 45710216, "90th percentile latency (ns)": 45710216, "95.00 percentile latency (ns)": 52111799, "97.00 percentile latency (ns)": 52827270, "99.00 percentile latency (ns)": 55350512, "99.90 percentile latency (ns)": 61991122, "Max latency (ns)": 69816651, "Mean latency (ns)": 39671898, "Min duration satisfied": "Yes", "Min latency (ns)": 37362822, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 25.2, "QPS w/o loadgen overhead": 25.21, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 45.710216, "characteristics.90th_percentile_latency_ns": 45710216.0, "characteristics.90th_percentile_latency_s": 0.045710216, "characteristics.90th_percentile_latency_us": 45710.216, "characteristics.accuracy": 72.678, "characteristics.good": 36339, "characteristics.power": 0.244726265881394, "characteristics.power.normalized_per_core": 0.002039385549011617, "characteristics.power.normalized_per_processor": 0.244726265881394, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-large-minimalistic_224_1.0_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v3-large-minimalistic_224_1.0_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-large-minimalistic_224_1.0_float.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 26.3158, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "e0404da9a8be8a00", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 14525846, "90.00 percentile latency (ns)": 21036400, "90th percentile latency (ns)": 21036400, "95.00 percentile latency (ns)": 22611682, "97.00 percentile latency (ns)": 23389384, "99.00 percentile latency (ns)": 24452127, "99.90 percentile latency (ns)": 28268665, "Max latency (ns)": 37618865, "Mean latency (ns)": 15891947, "Min duration satisfied": "Yes", "Min latency (ns)": 13661268, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 62.86, "QPS w/o loadgen overhead": 62.92, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 21.0364, "characteristics.90th_percentile_latency_ns": 21036400.0, "characteristics.90th_percentile_latency_s": 0.0210364, "characteristics.90th_percentile_latency_us": 21036.4, "characteristics.accuracy": 65.004, "characteristics.good": 32502, "characteristics.power": 0.1027445640069489, "characteristics.power.normalized_per_core": 0.0008562047000579074, "characteristics.power.normalized_per_processor": 0.1027445640069489, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-160-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.75-160-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_160_75.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 62.5, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "5b2830469f8b7944", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 51629603, "90.00 percentile latency (ns)": 62724501, "90th percentile latency (ns)": 62724501, "95.00 percentile latency (ns)": 69310010, "97.00 percentile latency (ns)": 71304535, "99.00 percentile latency (ns)": 74047822, "99.90 percentile latency (ns)": 80887195, "Max latency (ns)": 84392553, "Mean latency (ns)": 53821853, "Min duration satisfied": "Yes", "Min latency (ns)": 49553914, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 18.57, "QPS w/o loadgen overhead": 18.58, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 62.724501, "characteristics.90th_percentile_latency_ns": 62724501.0, "characteristics.90th_percentile_latency_s": 0.062724501, "characteristics.90th_percentile_latency_us": 62724.501, "characteristics.accuracy": 71.77, "characteristics.good": 35885, "characteristics.power": 0.3365464506762718, "characteristics.power.normalized_per_core": 0.0028045537556355984, "characteristics.power.normalized_per_processor": 0.3365464506762718, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-1.0-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_1.0_224.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 16.9492, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "44bc8eeefdec2733", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 23948307, "90.00 percentile latency (ns)": 28996971, "90th percentile latency (ns)": 28996971, "95.00 percentile latency (ns)": 31888387, "97.00 percentile latency (ns)": 32659812, "99.00 percentile latency (ns)": 34251037, "99.90 percentile latency (ns)": 39551119, "Max latency (ns)": 51930986, "Mean latency (ns)": 24992624, "Min duration satisfied": "Yes", "Min latency (ns)": 23274212, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 39.99, "QPS w/o loadgen overhead": 40.01, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 28.996971, "characteristics.90th_percentile_latency_ns": 28996971.0, "characteristics.90th_percentile_latency_s": 0.028996971, "characteristics.90th_percentile_latency_us": 28996.971, "characteristics.accuracy": 66.75, "characteristics.good": 33375, "characteristics.power": 0.1534239769664809, "characteristics.power.normalized_per_core": 0.001278533141387341, "characteristics.power.normalized_per_processor": 0.1534239769664809, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-160-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.75-160-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.75_160.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 35.7143, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "0a6383545854baea", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 6724553, "90.00 percentile latency (ns)": 7927586, "90th percentile latency (ns)": 7927586, "95.00 percentile latency (ns)": 8344321, "97.00 percentile latency (ns)": 8603526, "99.00 percentile latency (ns)": 9307261, "99.90 percentile latency (ns)": 12232265, "Max latency (ns)": 26436590, "Mean latency (ns)": 6954529, "Min duration satisfied": "Yes", "Min latency (ns)": 6159232, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 143.47, "QPS w/o loadgen overhead": 143.79, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 7.927586, "characteristics.90th_percentile_latency_ns": 7927586.0, "characteristics.90th_percentile_latency_s": 0.007927586, "characteristics.90th_percentile_latency_us": 7927.586, "characteristics.accuracy": 47.14, "characteristics.good": 23570, "characteristics.power": 0.03972950617800259, "characteristics.power.normalized_per_core": 0.00033107921815002156, "characteristics.power.normalized_per_processor": 0.03972950617800259, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-96-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.35-96-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.35_96.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 125, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "374649b72c82c033", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 11890369, "90.00 percentile latency (ns)": 14044344, "90th percentile latency (ns)": 14044344, "95.00 percentile latency (ns)": 15037725, "97.00 percentile latency (ns)": 15447644, "99.00 percentile latency (ns)": 16551900, "99.90 percentile latency (ns)": 19974142, "Max latency (ns)": 28708742, "Mean latency (ns)": 12345146, "Min duration satisfied": "Yes", "Min latency (ns)": 11382365, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 80.9, "QPS w/o loadgen overhead": 81.0, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 14.044344, "characteristics.90th_percentile_latency_ns": 14044344.0, "characteristics.90th_percentile_latency_s": 0.014044344, "characteristics.90th_percentile_latency_us": 14044.344, "characteristics.accuracy": 56.988, "characteristics.good": 28494, "characteristics.power": 0.07120814720877038, "characteristics.power.normalized_per_core": 0.0005934012267397531, "characteristics.power.normalized_per_processor": 0.07120814720877038, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-160-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.35-160-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.35_160.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 71.4286, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "4eb5ad7e7eadcc1d", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 13114836, "90.00 percentile latency (ns)": 16171374, "90th percentile latency (ns)": 16171374, "95.00 percentile latency (ns)": 18603539, "97.00 percentile latency (ns)": 19136934, "99.00 percentile latency (ns)": 20221407, "99.90 percentile latency (ns)": 23842729, "Max latency (ns)": 34048431, "Mean latency (ns)": 13740978, "Min duration satisfied": "Yes", "Min latency (ns)": 12397186, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 72.69, "QPS w/o loadgen overhead": 72.78, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 16.171374, "characteristics.90th_percentile_latency_ns": 16171374.0, "characteristics.90th_percentile_latency_s": 0.016171374, "characteristics.90th_percentile_latency_us": 16171.374, "characteristics.accuracy": 63.716, "characteristics.good": 31858, "characteristics.power": 0.09008270374670543, "characteristics.power.normalized_per_core": 0.000750689197889212, "characteristics.power.normalized_per_processor": 0.09008270374670543, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.75-128-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.75-128-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.75_128.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 66.6667, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "44b399964bda88fb", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 6590922, "90.00 percentile latency (ns)": 9579815, "90th percentile latency (ns)": 9579815, "95.00 percentile latency (ns)": 9841597, "97.00 percentile latency (ns)": 10022861, "99.00 percentile latency (ns)": 10582632, "99.90 percentile latency (ns)": 13540465, "Max latency (ns)": 30131882, "Mean latency (ns)": 7053799, "Min duration satisfied": "Yes", "Min latency (ns)": 6125369, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 141.44, "QPS w/o loadgen overhead": 141.77, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 9.579815, "characteristics.90th_percentile_latency_ns": 9579815.0, "characteristics.90th_percentile_latency_s": 0.009579815, "characteristics.90th_percentile_latency_us": 9579.815, "characteristics.accuracy": 55.51, "characteristics.good": 27755, "characteristics.power": 0.043164245230772884, "characteristics.power.normalized_per_core": 0.00035970204358977404, "characteristics.power.normalized_per_processor": 0.043164245230772884, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-128-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.5-128-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_128_50.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 125, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "74817a8d4a8c1ef6", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 15966925, "90.00 percentile latency (ns)": 18556755, "90th percentile latency (ns)": 18556755, "95.00 percentile latency (ns)": 19811995, "97.00 percentile latency (ns)": 20260376, "99.00 percentile latency (ns)": 21669166, "99.90 percentile latency (ns)": 25443207, "Max latency (ns)": 30910570, "Mean latency (ns)": 16502016, "Min duration satisfied": "Yes", "Min latency (ns)": 15377842, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 60.54, "QPS w/o loadgen overhead": 60.6, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 18.556755, "characteristics.90th_percentile_latency_ns": 18556755.0, "characteristics.90th_percentile_latency_s": 0.018556755, "characteristics.90th_percentile_latency_us": 18556.755, "characteristics.accuracy": 59.322, "characteristics.good": 29661, "characteristics.power": 0.09487451390414452, "characteristics.power.normalized_per_core": 0.0007906209492012043, "characteristics.power.normalized_per_processor": 0.09487451390414452, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-armnn-v21.02-neon", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-192-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.35-192-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.35_192.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 55.5556, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "c75f69c1412c902d", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 688589520, "90.00 percentile latency (ns)": 689064385, "90th percentile latency (ns)": 689064385, "95.00 percentile latency (ns)": 689366538, "97.00 percentile latency (ns)": 689661492, "99.00 percentile latency (ns)": 693607309, "99.90 percentile latency (ns)": 783312487, "Max latency (ns)": 800537515, "Mean latency (ns)": 689123663, "Min duration satisfied": "Yes", "Min latency (ns)": 687981346, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 1.45, "QPS w/o loadgen overhead": 1.45, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 689.064385, "characteristics.90th_percentile_latency_ns": 689064385.0, "characteristics.90th_percentile_latency_s": 0.689064385, "characteristics.90th_percentile_latency_us": 689064.385, "characteristics.accuracy": 78.564, "characteristics.good": 39282, "characteristics.total": 50000, "ck_system": "firefly-armnn-v21.02-neon", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite4-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "efficientnet-lite4-quantized", "input_data_types": "uint8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite4.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 1.44928, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "41960c41324e9180", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 72459133, "90.00 percentile latency (ns)": 72976454, "90th percentile latency (ns)": 72976454, "95.00 percentile latency (ns)": 73316699, "97.00 percentile latency (ns)": 73582700, "99.00 percentile latency (ns)": 74334804, "99.90 percentile latency (ns)": 129499303, "Max latency (ns)": 140231906, "Mean latency (ns)": 72676613, "Min duration satisfied": "Yes", "Min latency (ns)": 71011671, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 13.76, "QPS w/o loadgen overhead": 13.76, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 72.976454, "characteristics.90th_percentile_latency_ns": 72976454.0, "characteristics.90th_percentile_latency_s": 0.072976454, "characteristics.90th_percentile_latency_us": 72976.454, "characteristics.accuracy": 75.068, "characteristics.good": 37534, "characteristics.total": 50000, "ck_system": "firefly-armnn-v21.02-neon", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite0-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "efficientnet-lite0-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite0.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 13.8889, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "a6b869ee3617eacb", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 223723938, "90.00 percentile latency (ns)": 223937514, "90th percentile latency (ns)": 223937514, "95.00 percentile latency (ns)": 224060724, "97.00 percentile latency (ns)": 224192025, "99.00 percentile latency (ns)": 224625382, "99.90 percentile latency (ns)": 301158938, "Max latency (ns)": 344373952, "Mean latency (ns)": 223905253, "Min duration satisfied": "Yes", "Min latency (ns)": 223397206, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 4.47, "QPS w/o loadgen overhead": 4.47, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 223.937514, "characteristics.90th_percentile_latency_ns": 223937514.0, "characteristics.90th_percentile_latency_s": 0.223937514, "characteristics.90th_percentile_latency_us": 223937.514, "characteristics.accuracy": 74.116, "characteristics.good": 37058, "characteristics.total": 50000, "ck_system": "firefly-armnn-v21.02-neon", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite1-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "efficientnet-lite1-quantized", "input_data_types": "uint8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite1.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 4.44444, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "746fe961492b8820", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 40741143, "90.00 percentile latency (ns)": 40933925, "90th percentile latency (ns)": 40933925, "95.00 percentile latency (ns)": 41080064, "97.00 percentile latency (ns)": 41374525, "99.00 percentile latency (ns)": 45124533, "99.90 percentile latency (ns)": 77756619, "Max latency (ns)": 89106764, "Mean latency (ns)": 41028545, "Min duration satisfied": "Yes", "Min latency (ns)": 40525154, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 24.36, "QPS w/o loadgen overhead": 24.37, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 40.933925, "characteristics.90th_percentile_latency_ns": 40933925.0, "characteristics.90th_percentile_latency_s": 0.040933925, "characteristics.90th_percentile_latency_us": 40933.925, "characteristics.accuracy": 72.894, "characteristics.good": 36447, "characteristics.total": 50000, "ck_system": "firefly-armnn-v21.02-neon", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-large_224_1.0_uint8", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v3-large_224_1.0_uint8", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-large_224_1.0_uint8.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 23.8095, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "39afd549e096ef92", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 301629367, "90.00 percentile latency (ns)": 301883393, "90th percentile latency (ns)": 301883393, "95.00 percentile latency (ns)": 302056356, "97.00 percentile latency (ns)": 302245902, "99.00 percentile latency (ns)": 304060099, "99.90 percentile latency (ns)": 396441420, "Max latency (ns)": 414375285, "Mean latency (ns)": 301916042, "Min duration satisfied": "Yes", "Min latency (ns)": 301247026, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 3.31, "QPS w/o loadgen overhead": 3.31, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 301.883393, "characteristics.90th_percentile_latency_ns": 301883393.0, "characteristics.90th_percentile_latency_s": 0.301883393, "characteristics.90th_percentile_latency_us": 301883.393, "characteristics.accuracy": 74.116, "characteristics.good": 37058, "characteristics.total": 50000, "ck_system": "firefly-armnn-v21.02-neon", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite2-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "efficientnet-lite2-quantized", "input_data_types": "uint8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite2.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 3.31126, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "02aa7d9b2591d4b9", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 98048657, "90.00 percentile latency (ns)": 98761221, "90th percentile latency (ns)": 98761221, "95.00 percentile latency (ns)": 99158176, "97.00 percentile latency (ns)": 99482974, "99.00 percentile latency (ns)": 101143520, "99.90 percentile latency (ns)": 180534342, "Max latency (ns)": 187476269, "Mean latency (ns)": 98436375, "Min duration satisfied": "Yes", "Min latency (ns)": 97337847, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 10.16, "QPS w/o loadgen overhead": 10.16, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 98.761221, "characteristics.90th_percentile_latency_ns": 98761221.0, "characteristics.90th_percentile_latency_s": 0.098761221, "characteristics.90th_percentile_latency_us": 98761.221, "characteristics.accuracy": 76.642, "characteristics.good": 38321, "characteristics.total": 50000, "ck_system": "firefly-armnn-v21.02-neon", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite1-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "efficientnet-lite1-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite1.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 10.2041, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "9459d816d18af120", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 15348052, "90.00 percentile latency (ns)": 15793137, "90th percentile latency (ns)": 15793137, "95.00 percentile latency (ns)": 18605378, "97.00 percentile latency (ns)": 22355329, "99.00 percentile latency (ns)": 24494121, "99.90 percentile latency (ns)": 25873699, "Max latency (ns)": 37848632, "Mean latency (ns)": 15792427, "Min duration satisfied": "Yes", "Min latency (ns)": 14906471, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 63.24, "QPS w/o loadgen overhead": 63.32, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 15.793137, "characteristics.90th_percentile_latency_ns": 15793137.0, "characteristics.90th_percentile_latency_s": 0.015793137, "characteristics.90th_percentile_latency_us": 15793.137, "characteristics.accuracy": 63.33, "characteristics.good": 31665, "characteristics.total": 50000, "ck_system": "firefly-armnn-v21.02-neon", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-small-minimalistic_224_1.0_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v3-small-minimalistic_224_1.0_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-small-minimalistic_224_1.0_float.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 62.5, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "227fae9a86e403c9", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 361745630, "90.00 percentile latency (ns)": 362824084, "90th percentile latency (ns)": 362824084, "95.00 percentile latency (ns)": 363577611, "97.00 percentile latency (ns)": 364416736, "99.00 percentile latency (ns)": 365534448, "99.90 percentile latency (ns)": 453861036, "Max latency (ns)": 516532787, "Mean latency (ns)": 362145779, "Min duration satisfied": "Yes", "Min latency (ns)": 360074226, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 2.76, "QPS w/o loadgen overhead": 2.76, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 362.824084, "characteristics.90th_percentile_latency_ns": 362824084.0, "characteristics.90th_percentile_latency_s": 0.362824084, "characteristics.90th_percentile_latency_us": 362824.084, "characteristics.accuracy": 80.676, "characteristics.good": 40338, "characteristics.total": 50000, "ck_system": "firefly-armnn-v21.02-neon", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite4-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "efficientnet-lite4-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite4.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 2.76243, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "a8634abeee3401e7", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 33372731, "90.00 percentile latency (ns)": 33506898, "90th percentile latency (ns)": 33506898, "95.00 percentile latency (ns)": 33584481, "97.00 percentile latency (ns)": 33686564, "99.00 percentile latency (ns)": 34287105, "99.90 percentile latency (ns)": 62396722, "Max latency (ns)": 77390696, "Mean latency (ns)": 33527760, "Min duration satisfied": "Yes", "Min latency (ns)": 33222814, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 29.81, "QPS w/o loadgen overhead": 29.83, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 33.506898, "characteristics.90th_percentile_latency_ns": 33506898.0, "characteristics.90th_percentile_latency_s": 0.033506898, "characteristics.90th_percentile_latency_us": 33506.898, "characteristics.accuracy": 70.33, "characteristics.good": 35165, "characteristics.total": 50000, "ck_system": "firefly-armnn-v21.02-neon", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-large-minimalistic_224_1.0_uint8", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v3-large-minimalistic_224_1.0_uint8", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-large-minimalistic_224_1.0_uint8.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 29.4118, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "4905b14d7ceec7cb", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 15168394, "90.00 percentile latency (ns)": 15340768, "90th percentile latency (ns)": 15340768, "95.00 percentile latency (ns)": 16243475, "97.00 percentile latency (ns)": 19760971, "99.00 percentile latency (ns)": 26926627, "99.90 percentile latency (ns)": 29326166, "Max latency (ns)": 39957105, "Mean latency (ns)": 15542250, "Min duration satisfied": "Yes", "Min latency (ns)": 15039478, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 64.22, "QPS w/o loadgen overhead": 64.34, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 15.340768, "characteristics.90th_percentile_latency_ns": 15340768.0, "characteristics.90th_percentile_latency_s": 0.015340768, "characteristics.90th_percentile_latency_us": 15340.768, "characteristics.accuracy": 64.062, "characteristics.good": 32031, "characteristics.total": 50000, "ck_system": "firefly-armnn-v21.02-neon", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-small_224_1.0_uint8", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v3-small_224_1.0_uint8", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-small_224_1.0_uint8.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 62.5, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "b3f94f86bc105b0c", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 139205226, "90.00 percentile latency (ns)": 139828766, "90th percentile latency (ns)": 139828766, "95.00 percentile latency (ns)": 140338927, "97.00 percentile latency (ns)": 140795678, "99.00 percentile latency (ns)": 142831158, "99.90 percentile latency (ns)": 233800751, "Max latency (ns)": 254391639, "Mean latency (ns)": 139657638, "Min duration satisfied": "Yes", "Min latency (ns)": 137502669, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 7.16, "QPS w/o loadgen overhead": 7.16, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 139.828766, "characteristics.90th_percentile_latency_ns": 139828766.0, "characteristics.90th_percentile_latency_s": 0.139828766, "characteristics.90th_percentile_latency_us": 139828.766, "characteristics.accuracy": 77.542, "characteristics.good": 38771, "characteristics.total": 50000, "ck_system": "firefly-armnn-v21.02-neon", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite2-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "efficientnet-lite2-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite2.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 7.0922, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "558b7765a00e0024", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 45113192, "90.00 percentile latency (ns)": 46361814, "90th percentile latency (ns)": 46361814, "95.00 percentile latency (ns)": 51594304, "97.00 percentile latency (ns)": 55857604, "99.00 percentile latency (ns)": 79354819, "99.90 percentile latency (ns)": 91711255, "Max latency (ns)": 98287446, "Mean latency (ns)": 46313448, "Min duration satisfied": "Yes", "Min latency (ns)": 44591115, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 21.58, "QPS w/o loadgen overhead": 21.59, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 46.361814, "characteristics.90th_percentile_latency_ns": 46361814.0, "characteristics.90th_percentile_latency_s": 0.046361814, "characteristics.90th_percentile_latency_us": 46361.814, "characteristics.accuracy": 73.724, "characteristics.good": 36862, "characteristics.total": 50000, "ck_system": "firefly-armnn-v21.02-neon", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-large_224_0.75_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v3-large_224_0.75_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-large_224_0.75_float.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 21.2766, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "bf4a08486f9bd5be", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 27840993, "90.00 percentile latency (ns)": 28723283, "90th percentile latency (ns)": 28723283, "95.00 percentile latency (ns)": 33609857, "97.00 percentile latency (ns)": 37818892, "99.00 percentile latency (ns)": 46791418, "99.90 percentile latency (ns)": 55139195, "Max latency (ns)": 60985643, "Mean latency (ns)": 28670695, "Min duration satisfied": "Yes", "Min latency (ns)": 27327661, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 34.85, "QPS w/o loadgen overhead": 34.88, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 28.723283, "characteristics.90th_percentile_latency_ns": 28723283.0, "characteristics.90th_percentile_latency_s": 0.028723283, "characteristics.90th_percentile_latency_us": 28723.283, "characteristics.accuracy": 68.336, "characteristics.good": 34168, "characteristics.total": 50000, "ck_system": "firefly-armnn-v21.02-neon", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-small_224_1.0_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v3-small_224_1.0_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-small_224_1.0_float.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 34.4828, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "95a9becffe4868aa", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 138083701, "90.00 percentile latency (ns)": 138268560, "90th percentile latency (ns)": 138268560, "95.00 percentile latency (ns)": 138376187, "97.00 percentile latency (ns)": 138494583, "99.00 percentile latency (ns)": 139334355, "99.90 percentile latency (ns)": 233064800, "Max latency (ns)": 241204705, "Mean latency (ns)": 138377900, "Min duration satisfied": "Yes", "Min latency (ns)": 137799898, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 7.23, "QPS w/o loadgen overhead": 7.23, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 138.26856, "characteristics.90th_percentile_latency_ns": 138268560.0, "characteristics.90th_percentile_latency_s": 0.13826856, "characteristics.90th_percentile_latency_us": 138268.56, "characteristics.accuracy": 71.254, "characteristics.good": 35627, "characteristics.total": 50000, "ck_system": "firefly-armnn-v21.02-neon", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite0-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "efficientnet-lite0-quantized", "input_data_types": "uint8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite0.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 7.19424, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "2ab6a9e00495480c", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 209859952, "90.00 percentile latency (ns)": 210661185, "90th percentile latency (ns)": 210661185, "95.00 percentile latency (ns)": 211107195, "97.00 percentile latency (ns)": 211736573, "99.00 percentile latency (ns)": 213167779, "99.90 percentile latency (ns)": 326696120, "Max latency (ns)": 350033695, "Mean latency (ns)": 210189286, "Min duration satisfied": "Yes", "Min latency (ns)": 208051609, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 4.76, "QPS w/o loadgen overhead": 4.76, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 210.661185, "characteristics.90th_percentile_latency_ns": 210661185.0, "characteristics.90th_percentile_latency_s": 0.210661185, "characteristics.90th_percentile_latency_us": 210661.185, "characteristics.accuracy": 79.268, "characteristics.good": 39634, "characteristics.total": 50000, "ck_system": "firefly-armnn-v21.02-neon", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite3-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "efficientnet-lite3-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite3.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 4.7619, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "f377856618c47019", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 24109753, "90.00 percentile latency (ns)": 24735684, "90th percentile latency (ns)": 24735684, "95.00 percentile latency (ns)": 28782290, "97.00 percentile latency (ns)": 33460043, "99.00 percentile latency (ns)": 39741967, "99.90 percentile latency (ns)": 44524453, "Max latency (ns)": 53896527, "Mean latency (ns)": 24792305, "Min duration satisfied": "Yes", "Min latency (ns)": 23703203, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 40.3, "QPS w/o loadgen overhead": 40.34, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 24.735684, "characteristics.90th_percentile_latency_ns": 24735684.0, "characteristics.90th_percentile_latency_s": 0.024735684, "characteristics.90th_percentile_latency_us": 24735.684, "characteristics.accuracy": 66.216, "characteristics.good": 33108, "characteristics.total": 50000, "ck_system": "firefly-armnn-v21.02-neon", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-small_224_0.75_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v3-small_224_0.75_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-small_224_0.75_float.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 40, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "77348e182af16ea3", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 414238981, "90.00 percentile latency (ns)": 414618820, "90th percentile latency (ns)": 414618820, "95.00 percentile latency (ns)": 414882080, "97.00 percentile latency (ns)": 415104228, "99.00 percentile latency (ns)": 418652669, "99.90 percentile latency (ns)": 491298325, "Max latency (ns)": 492367215, "Mean latency (ns)": 414563305, "Min duration satisfied": "Yes", "Min latency (ns)": 413679865, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 2.41, "QPS w/o loadgen overhead": 2.41, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 414.61882, "characteristics.90th_percentile_latency_ns": 414618820.0, "characteristics.90th_percentile_latency_s": 0.41461882, "characteristics.90th_percentile_latency_us": 414618.82, "characteristics.accuracy": 76.348, "characteristics.good": 38174, "characteristics.total": 50000, "ck_system": "firefly-armnn-v21.02-neon", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite3-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "efficientnet-lite3-quantized", "input_data_types": "uint8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite3.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 2.39808, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "c5bced3a1b11452f", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 57709161, "90.00 percentile latency (ns)": 58421697, "90th percentile latency (ns)": 58421697, "95.00 percentile latency (ns)": 58727357, "97.00 percentile latency (ns)": 59152038, "99.00 percentile latency (ns)": 82368088, "99.90 percentile latency (ns)": 111624627, "Max latency (ns)": 121880159, "Mean latency (ns)": 58334815, "Min duration satisfied": "Yes", "Min latency (ns)": 57261462, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 17.14, "QPS w/o loadgen overhead": 17.14, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 58.421697, "characteristics.90th_percentile_latency_ns": 58421697.0, "characteristics.90th_percentile_latency_s": 0.058421697, "characteristics.90th_percentile_latency_us": 58421.697, "characteristics.accuracy": 75.76, "characteristics.good": 37880, "characteristics.total": 50000, "ck_system": "firefly-armnn-v21.02-neon", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-large_224_1.0_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v3-large_224_1.0_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-large_224_1.0_float.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 16.9492, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "22d07809fc746499", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 38988791, "90.00 percentile latency (ns)": 40207956, "90th percentile latency (ns)": 40207956, "95.00 percentile latency (ns)": 47062410, "97.00 percentile latency (ns)": 53708931, "99.00 percentile latency (ns)": 68143509, "99.90 percentile latency (ns)": 74824377, "Max latency (ns)": 79010661, "Mean latency (ns)": 40167476, "Min duration satisfied": "Yes", "Min latency (ns)": 38315356, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 24.88, "QPS w/o loadgen overhead": 24.9, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 40.207956, "characteristics.90th_percentile_latency_ns": 40207956.0, "characteristics.90th_percentile_latency_s": 0.040207956, "characteristics.90th_percentile_latency_us": 40207.956, "characteristics.accuracy": 72.678, "characteristics.good": 36339, "characteristics.total": 50000, "ck_system": "firefly-armnn-v21.02-neon", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-large-minimalistic_224_1.0_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v3-large-minimalistic_224_1.0_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-large-minimalistic_224_1.0_float.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 24.3902, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "91cf41b8b67a6468", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 582452195, "90.00 percentile latency (ns)": 587150887, "90th percentile latency (ns)": 587150887, "95.00 percentile latency (ns)": 591833086, "97.00 percentile latency (ns)": 593263107, "99.00 percentile latency (ns)": 594836677, "99.90 percentile latency (ns)": 596362554, "Max latency (ns)": 597205340, "Mean latency (ns)": 581859903, "Min duration satisfied": "Yes", "Min latency (ns)": 574840061, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 1.72, "QPS w/o loadgen overhead": 1.72, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "800 MHz", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "4 GiB (shared with host)", "accelerator_memory_configuration": "-", "accelerator_model_name": "Arm Mali-T860 MP4", "accelerator_on-chip_memories": "-", "accelerators_per_node": 1, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 587.150887, "characteristics.90th_percentile_latency_ns": 587150887.0, "characteristics.90th_percentile_latency_s": 0.587150887, "characteristics.90th_percentile_latency_us": 587150.887, "characteristics.accuracy": 78.536, "characteristics.good": 39268, "characteristics.total": 50000, "ck_system": "firefly-armnn-v21.02-opencl", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite4-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (OpenCL)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "efficientnet-lite4-quantized", "input_data_types": "uint8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 1, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-armnn-v21.02-opencl", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite4.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-armnn-v21.02-opencl", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 1.72117, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "e4a66a9bc018051b", "use_accelerator": true, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 92077203, "90.00 percentile latency (ns)": 92771952, "90th percentile latency (ns)": 92771952, "95.00 percentile latency (ns)": 93167743, "97.00 percentile latency (ns)": 93535242, "99.00 percentile latency (ns)": 98509314, "99.90 percentile latency (ns)": 112348865, "Max latency (ns)": 124231922, "Mean latency (ns)": 92277982, "Min duration satisfied": "Yes", "Min latency (ns)": 83433724, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 10.82, "QPS w/o loadgen overhead": 10.84, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "800 MHz", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "4 GiB (shared with host)", "accelerator_memory_configuration": "-", "accelerator_model_name": "Arm Mali-T860 MP4", "accelerator_on-chip_memories": "-", "accelerators_per_node": 1, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 92.771952, "characteristics.90th_percentile_latency_ns": 92771952.0, "characteristics.90th_percentile_latency_s": 0.092771952, "characteristics.90th_percentile_latency_us": 92771.952, "characteristics.accuracy": 75.068, "characteristics.good": 37534, "characteristics.total": 50000, "ck_system": "firefly-armnn-v21.02-opencl", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite0-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (OpenCL)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "efficientnet-lite0-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 1, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-armnn-v21.02-opencl", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite0.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-armnn-v21.02-opencl", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 10.7527, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "6dbebc6835bcd2b3", "use_accelerator": true, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 171351700, "90.00 percentile latency (ns)": 179311509, "90th percentile latency (ns)": 179311509, "95.00 percentile latency (ns)": 180673320, "97.00 percentile latency (ns)": 181214994, "99.00 percentile latency (ns)": 185328367, "99.90 percentile latency (ns)": 186856061, "Max latency (ns)": 193018412, "Mean latency (ns)": 172779793, "Min duration satisfied": "Yes", "Min latency (ns)": 170227294, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 5.78, "QPS w/o loadgen overhead": 5.79, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "800 MHz", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "4 GiB (shared with host)", "accelerator_memory_configuration": "-", "accelerator_model_name": "Arm Mali-T860 MP4", "accelerator_on-chip_memories": "-", "accelerators_per_node": 1, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 179.311509, "characteristics.90th_percentile_latency_ns": 179311509.0, "characteristics.90th_percentile_latency_s": 0.179311509, "characteristics.90th_percentile_latency_us": 179311.509, "characteristics.accuracy": 74.138, "characteristics.good": 37069, "characteristics.total": 50000, "ck_system": "firefly-armnn-v21.02-opencl", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite1-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (OpenCL)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "efficientnet-lite1-quantized", "input_data_types": "uint8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 1, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-armnn-v21.02-opencl", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite1.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-armnn-v21.02-opencl", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 5.74713, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "60ae4aa345d6965f", "use_accelerator": true, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 61462501, "90.00 percentile latency (ns)": 62036500, "90th percentile latency (ns)": 62036500, "95.00 percentile latency (ns)": 62339604, "97.00 percentile latency (ns)": 62889374, "99.00 percentile latency (ns)": 69332860, "99.90 percentile latency (ns)": 76950550, "Max latency (ns)": 82938745, "Mean latency (ns)": 61533094, "Min duration satisfied": "Yes", "Min latency (ns)": 59900628, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 16.23, "QPS w/o loadgen overhead": 16.25, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "800 MHz", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "4 GiB (shared with host)", "accelerator_memory_configuration": "-", "accelerator_model_name": "Arm Mali-T860 MP4", "accelerator_on-chip_memories": "-", "accelerators_per_node": 1, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 62.0365, "characteristics.90th_percentile_latency_ns": 62036500.0, "characteristics.90th_percentile_latency_s": 0.0620365, "characteristics.90th_percentile_latency_us": 62036.5, "characteristics.accuracy": 72.892, "characteristics.good": 36446, "characteristics.total": 50000, "ck_system": "firefly-armnn-v21.02-opencl", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-large_224_1.0_uint8", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (OpenCL)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v3-large_224_1.0_uint8", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 1, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-armnn-v21.02-opencl", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-large_224_1.0_uint8.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-armnn-v21.02-opencl", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 16.129, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "5f52161d4be89929", "use_accelerator": true, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 242964773, "90.00 percentile latency (ns)": 250363761, "90th percentile latency (ns)": 250363761, "95.00 percentile latency (ns)": 251922711, "97.00 percentile latency (ns)": 252718379, "99.00 percentile latency (ns)": 255873912, "99.90 percentile latency (ns)": 259843487, "Max latency (ns)": 262103022, "Mean latency (ns)": 244151395, "Min duration satisfied": "Yes", "Min latency (ns)": 238520954, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 4.09, "QPS w/o loadgen overhead": 4.1, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "800 MHz", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "4 GiB (shared with host)", "accelerator_memory_configuration": "-", "accelerator_model_name": "Arm Mali-T860 MP4", "accelerator_on-chip_memories": "-", "accelerators_per_node": 1, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 250.363761, "characteristics.90th_percentile_latency_ns": 250363761.0, "characteristics.90th_percentile_latency_s": 0.250363761, "characteristics.90th_percentile_latency_us": 250363.761, "characteristics.accuracy": 74.13, "characteristics.good": 37065, "characteristics.total": 50000, "ck_system": "firefly-armnn-v21.02-opencl", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite2-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (OpenCL)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "efficientnet-lite2-quantized", "input_data_types": "uint8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 1, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-armnn-v21.02-opencl", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite2.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-armnn-v21.02-opencl", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 4.08163, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "72c14fad971d3b25", "use_accelerator": true, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 133440668, "90.00 percentile latency (ns)": 134415082, "90th percentile latency (ns)": 134415082, "95.00 percentile latency (ns)": 134876234, "97.00 percentile latency (ns)": 135531942, "99.00 percentile latency (ns)": 140712298, "99.90 percentile latency (ns)": 148119463, "Max latency (ns)": 157122873, "Mean latency (ns)": 133627930, "Min duration satisfied": "Yes", "Min latency (ns)": 123842552, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 7.48, "QPS w/o loadgen overhead": 7.48, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "800 MHz", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "4 GiB (shared with host)", "accelerator_memory_configuration": "-", "accelerator_model_name": "Arm Mali-T860 MP4", "accelerator_on-chip_memories": "-", "accelerators_per_node": 1, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 134.415082, "characteristics.90th_percentile_latency_ns": 134415082.0, "characteristics.90th_percentile_latency_s": 0.134415082, "characteristics.90th_percentile_latency_us": 134415.082, "characteristics.accuracy": 76.642, "characteristics.good": 38321, "characteristics.total": 50000, "ck_system": "firefly-armnn-v21.02-opencl", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite1-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (OpenCL)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "efficientnet-lite1-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 1, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-armnn-v21.02-opencl", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite1.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-armnn-v21.02-opencl", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 7.46269, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "4dbdc04bc19bee79", "use_accelerator": true, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 23673404, "90.00 percentile latency (ns)": 24100401, "90th percentile latency (ns)": 24100401, "95.00 percentile latency (ns)": 24410151, "97.00 percentile latency (ns)": 25348442, "99.00 percentile latency (ns)": 31527979, "99.90 percentile latency (ns)": 37282855, "Max latency (ns)": 43558932, "Mean latency (ns)": 23907616, "Min duration satisfied": "Yes", "Min latency (ns)": 23083069, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 41.78, "QPS w/o loadgen overhead": 41.83, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "800 MHz", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "4 GiB (shared with host)", "accelerator_memory_configuration": "-", "accelerator_model_name": "Arm Mali-T860 MP4", "accelerator_on-chip_memories": "-", "accelerators_per_node": 1, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 24.100401, "characteristics.90th_percentile_latency_ns": 24100401.0, "characteristics.90th_percentile_latency_s": 0.024100401, "characteristics.90th_percentile_latency_us": 24100.401, "characteristics.accuracy": 63.33, "characteristics.good": 31665, "characteristics.total": 50000, "ck_system": "firefly-armnn-v21.02-opencl", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-small-minimalistic_224_1.0_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (OpenCL)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v3-small-minimalistic_224_1.0_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 1, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-armnn-v21.02-opencl", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-small-minimalistic_224_1.0_float.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-armnn-v21.02-opencl", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 41.6667, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "13cafe24ed185344", "use_accelerator": true, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 479143617, "90.00 percentile latency (ns)": 481495572, "90th percentile latency (ns)": 481495572, "95.00 percentile latency (ns)": 482713587, "97.00 percentile latency (ns)": 484626298, "99.00 percentile latency (ns)": 489298256, "99.90 percentile latency (ns)": 505017013, "Max latency (ns)": 507408394, "Mean latency (ns)": 479205108, "Min duration satisfied": "Yes", "Min latency (ns)": 463269958, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 2.09, "QPS w/o loadgen overhead": 2.09, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "800 MHz", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "4 GiB (shared with host)", "accelerator_memory_configuration": "-", "accelerator_model_name": "Arm Mali-T860 MP4", "accelerator_on-chip_memories": "-", "accelerators_per_node": 1, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 481.495572, "characteristics.90th_percentile_latency_ns": 481495572.0, "characteristics.90th_percentile_latency_s": 0.481495572, "characteristics.90th_percentile_latency_us": 481495.572, "characteristics.accuracy": 80.676, "characteristics.good": 40338, "characteristics.total": 50000, "ck_system": "firefly-armnn-v21.02-opencl", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite4-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (OpenCL)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "efficientnet-lite4-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 1, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-armnn-v21.02-opencl", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite4.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-armnn-v21.02-opencl", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 2.079, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "ff45c3a080c5f913", "use_accelerator": true, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 52647317, "90.00 percentile latency (ns)": 53112259, "90th percentile latency (ns)": 53112259, "95.00 percentile latency (ns)": 53369547, "97.00 percentile latency (ns)": 53730880, "99.00 percentile latency (ns)": 61375523, "99.90 percentile latency (ns)": 67803327, "Max latency (ns)": 73487869, "Mean latency (ns)": 52855180, "Min duration satisfied": "Yes", "Min latency (ns)": 51622451, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 18.87, "QPS w/o loadgen overhead": 18.92, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "800 MHz", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "4 GiB (shared with host)", "accelerator_memory_configuration": "-", "accelerator_model_name": "Arm Mali-T860 MP4", "accelerator_on-chip_memories": "-", "accelerators_per_node": 1, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 53.112259, "characteristics.90th_percentile_latency_ns": 53112259.0, "characteristics.90th_percentile_latency_s": 0.053112259, "characteristics.90th_percentile_latency_us": 53112.259, "characteristics.accuracy": 70.328, "characteristics.good": 35164, "characteristics.total": 50000, "ck_system": "firefly-armnn-v21.02-opencl", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-large-minimalistic_224_1.0_uint8", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (OpenCL)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v3-large-minimalistic_224_1.0_uint8", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 1, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-armnn-v21.02-opencl", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-large-minimalistic_224_1.0_uint8.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-armnn-v21.02-opencl", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 18.5185, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "d134a9ba2adafeeb", "use_accelerator": true, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 25742692, "90.00 percentile latency (ns)": 26109630, "90th percentile latency (ns)": 26109630, "95.00 percentile latency (ns)": 26301544, "97.00 percentile latency (ns)": 26639591, "99.00 percentile latency (ns)": 31321132, "99.90 percentile latency (ns)": 38769400, "Max latency (ns)": 44727284, "Mean latency (ns)": 25892448, "Min duration satisfied": "Yes", "Min latency (ns)": 25105151, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 38.56, "QPS w/o loadgen overhead": 38.62, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "800 MHz", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "4 GiB (shared with host)", "accelerator_memory_configuration": "-", "accelerator_model_name": "Arm Mali-T860 MP4", "accelerator_on-chip_memories": "-", "accelerators_per_node": 1, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 26.10963, "characteristics.90th_percentile_latency_ns": 26109630.0, "characteristics.90th_percentile_latency_s": 0.02610963, "characteristics.90th_percentile_latency_us": 26109.63, "characteristics.accuracy": 64.03, "characteristics.good": 32015, "characteristics.total": 50000, "ck_system": "firefly-armnn-v21.02-opencl", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-small_224_1.0_uint8", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (OpenCL)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v3-small_224_1.0_uint8", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 1, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-armnn-v21.02-opencl", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-small_224_1.0_uint8.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-armnn-v21.02-opencl", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 38.4615, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "e4b41931bc7455e7", "use_accelerator": true, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 179136609, "90.00 percentile latency (ns)": 180590856, "90th percentile latency (ns)": 180590856, "95.00 percentile latency (ns)": 184481093, "97.00 percentile latency (ns)": 187059125, "99.00 percentile latency (ns)": 189869041, "99.90 percentile latency (ns)": 202634961, "Max latency (ns)": 209420874, "Mean latency (ns)": 179651825, "Min duration satisfied": "Yes", "Min latency (ns)": 167788053, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 5.56, "QPS w/o loadgen overhead": 5.57, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "800 MHz", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "4 GiB (shared with host)", "accelerator_memory_configuration": "-", "accelerator_model_name": "Arm Mali-T860 MP4", "accelerator_on-chip_memories": "-", "accelerators_per_node": 1, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 180.590856, "characteristics.90th_percentile_latency_ns": 180590856.0, "characteristics.90th_percentile_latency_s": 0.180590856, "characteristics.90th_percentile_latency_us": 180590.856, "characteristics.accuracy": 77.542, "characteristics.good": 38771, "characteristics.total": 50000, "ck_system": "firefly-armnn-v21.02-opencl", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite2-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (OpenCL)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "efficientnet-lite2-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 1, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-armnn-v21.02-opencl", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite2.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-armnn-v21.02-opencl", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 5.55556, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "80cfa4a30af4ab81", "use_accelerator": true, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 57573761, "90.00 percentile latency (ns)": 58055590, "90th percentile latency (ns)": 58055590, "95.00 percentile latency (ns)": 58311093, "97.00 percentile latency (ns)": 58517591, "99.00 percentile latency (ns)": 59307710, "99.90 percentile latency (ns)": 71634408, "Max latency (ns)": 81538722, "Mean latency (ns)": 55470660, "Min duration satisfied": "Yes", "Min latency (ns)": 49126229, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 18.0, "QPS w/o loadgen overhead": 18.03, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "800 MHz", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "4 GiB (shared with host)", "accelerator_memory_configuration": "-", "accelerator_model_name": "Arm Mali-T860 MP4", "accelerator_on-chip_memories": "-", "accelerators_per_node": 1, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 58.05559, "characteristics.90th_percentile_latency_ns": 58055590.0, "characteristics.90th_percentile_latency_s": 0.05805559, "characteristics.90th_percentile_latency_us": 58055.59, "characteristics.accuracy": 73.724, "characteristics.good": 36862, "characteristics.total": 50000, "ck_system": "firefly-armnn-v21.02-opencl", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-large_224_0.75_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (OpenCL)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v3-large_224_0.75_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 1, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-armnn-v21.02-opencl", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-large_224_0.75_float.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-armnn-v21.02-opencl", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 19.2308, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "2400945bc8bd8fec", "use_accelerator": true, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 26218791, "90.00 percentile latency (ns)": 26676717, "90th percentile latency (ns)": 26676717, "95.00 percentile latency (ns)": 26966907, "97.00 percentile latency (ns)": 27291254, "99.00 percentile latency (ns)": 29219156, "99.90 percentile latency (ns)": 40298115, "Max latency (ns)": 45181780, "Mean latency (ns)": 26390186, "Min duration satisfied": "Yes", "Min latency (ns)": 25638957, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 37.86, "QPS w/o loadgen overhead": 37.89, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "800 MHz", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "4 GiB (shared with host)", "accelerator_memory_configuration": "-", "accelerator_model_name": "Arm Mali-T860 MP4", "accelerator_on-chip_memories": "-", "accelerators_per_node": 1, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 26.676717, "characteristics.90th_percentile_latency_ns": 26676717.0, "characteristics.90th_percentile_latency_s": 0.026676717, "characteristics.90th_percentile_latency_us": 26676.717, "characteristics.accuracy": 68.336, "characteristics.good": 34168, "characteristics.total": 50000, "ck_system": "firefly-armnn-v21.02-opencl", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-small_224_1.0_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (OpenCL)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v3-small_224_1.0_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 1, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-armnn-v21.02-opencl", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-small_224_1.0_float.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-armnn-v21.02-opencl", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 37.037, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "147298e579e4cdde", "use_accelerator": true, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 116801347, "90.00 percentile latency (ns)": 123030208, "90th percentile latency (ns)": 123030208, "95.00 percentile latency (ns)": 125638205, "97.00 percentile latency (ns)": 126176857, "99.00 percentile latency (ns)": 128755492, "99.90 percentile latency (ns)": 129642808, "Max latency (ns)": 130568458, "Mean latency (ns)": 117993234, "Min duration satisfied": "Yes", "Min latency (ns)": 115694068, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 8.47, "QPS w/o loadgen overhead": 8.48, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "800 MHz", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "4 GiB (shared with host)", "accelerator_memory_configuration": "-", "accelerator_model_name": "Arm Mali-T860 MP4", "accelerator_on-chip_memories": "-", "accelerators_per_node": 1, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 123.030208, "characteristics.90th_percentile_latency_ns": 123030208.0, "characteristics.90th_percentile_latency_s": 0.123030208, "characteristics.90th_percentile_latency_us": 123030.208, "characteristics.accuracy": 71.288, "characteristics.good": 35644, "characteristics.total": 50000, "ck_system": "firefly-armnn-v21.02-opencl", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite0-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (OpenCL)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "efficientnet-lite0-quantized", "input_data_types": "uint8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 1, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-armnn-v21.02-opencl", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite0.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-armnn-v21.02-opencl", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 8.40336, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "37246a38c408538f", "use_accelerator": true, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 265083697, "90.00 percentile latency (ns)": 270864146, "90th percentile latency (ns)": 270864146, "95.00 percentile latency (ns)": 273176295, "97.00 percentile latency (ns)": 273820128, "99.00 percentile latency (ns)": 279520044, "99.90 percentile latency (ns)": 289131953, "Max latency (ns)": 296748355, "Mean latency (ns)": 265928345, "Min duration satisfied": "Yes", "Min latency (ns)": 251569204, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 3.76, "QPS w/o loadgen overhead": 3.76, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "800 MHz", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "4 GiB (shared with host)", "accelerator_memory_configuration": "-", "accelerator_model_name": "Arm Mali-T860 MP4", "accelerator_on-chip_memories": "-", "accelerators_per_node": 1, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 270.864146, "characteristics.90th_percentile_latency_ns": 270864146.0, "characteristics.90th_percentile_latency_s": 0.270864146, "characteristics.90th_percentile_latency_us": 270864.146, "characteristics.accuracy": 79.268, "characteristics.good": 39634, "characteristics.total": 50000, "ck_system": "firefly-armnn-v21.02-opencl", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite3-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (OpenCL)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "efficientnet-lite3-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 1, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-armnn-v21.02-opencl", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite3.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-armnn-v21.02-opencl", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 3.74532, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "bb42cfe68fb74dd3", "use_accelerator": true, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 23553181, "90.00 percentile latency (ns)": 23995915, "90th percentile latency (ns)": 23995915, "95.00 percentile latency (ns)": 24275616, "97.00 percentile latency (ns)": 24552134, "99.00 percentile latency (ns)": 26091830, "99.90 percentile latency (ns)": 37893200, "Max latency (ns)": 44037752, "Mean latency (ns)": 23719199, "Min duration satisfied": "Yes", "Min latency (ns)": 23031677, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 42.11, "QPS w/o loadgen overhead": 42.16, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "800 MHz", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "4 GiB (shared with host)", "accelerator_memory_configuration": "-", "accelerator_model_name": "Arm Mali-T860 MP4", "accelerator_on-chip_memories": "-", "accelerators_per_node": 1, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 23.995915, "characteristics.90th_percentile_latency_ns": 23995915.0, "characteristics.90th_percentile_latency_s": 0.023995915, "characteristics.90th_percentile_latency_us": 23995.915, "characteristics.accuracy": 66.216, "characteristics.good": 33108, "characteristics.total": 50000, "ck_system": "firefly-armnn-v21.02-opencl", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-small_224_0.75_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (OpenCL)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v3-small_224_0.75_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 1, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-armnn-v21.02-opencl", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-small_224_0.75_float.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-armnn-v21.02-opencl", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 40, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "1ba8149dfae255e1", "use_accelerator": true, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 349431038, "90.00 percentile latency (ns)": 357869938, "90th percentile latency (ns)": 357869938, "95.00 percentile latency (ns)": 358950832, "97.00 percentile latency (ns)": 360467229, "99.00 percentile latency (ns)": 363381166, "99.90 percentile latency (ns)": 369977208, "Max latency (ns)": 374280230, "Mean latency (ns)": 351414817, "Min duration satisfied": "Yes", "Min latency (ns)": 347785808, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 2.85, "QPS w/o loadgen overhead": 2.85, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "800 MHz", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "4 GiB (shared with host)", "accelerator_memory_configuration": "-", "accelerator_model_name": "Arm Mali-T860 MP4", "accelerator_on-chip_memories": "-", "accelerators_per_node": 1, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 357.869938, "characteristics.90th_percentile_latency_ns": 357869938.0, "characteristics.90th_percentile_latency_s": 0.357869938, "characteristics.90th_percentile_latency_us": 357869.938, "characteristics.accuracy": 76.338, "characteristics.good": 38169, "characteristics.total": 50000, "ck_system": "firefly-armnn-v21.02-opencl", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite3-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (OpenCL)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "efficientnet-lite3-quantized", "input_data_types": "uint8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 1, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-armnn-v21.02-opencl", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite3.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-armnn-v21.02-opencl", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 2.84091, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "c9621a45fb8e4782", "use_accelerator": true, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 67700388, "90.00 percentile latency (ns)": 68163859, "90th percentile latency (ns)": 68163859, "95.00 percentile latency (ns)": 68414986, "97.00 percentile latency (ns)": 68685332, "99.00 percentile latency (ns)": 69885546, "99.90 percentile latency (ns)": 78403087, "Max latency (ns)": 84725543, "Mean latency (ns)": 67100150, "Min duration satisfied": "Yes", "Min latency (ns)": 59322575, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 14.88, "QPS w/o loadgen overhead": 14.9, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "800 MHz", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "4 GiB (shared with host)", "accelerator_memory_configuration": "-", "accelerator_model_name": "Arm Mali-T860 MP4", "accelerator_on-chip_memories": "-", "accelerators_per_node": 1, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 68.163859, "characteristics.90th_percentile_latency_ns": 68163859.0, "characteristics.90th_percentile_latency_s": 0.068163859, "characteristics.90th_percentile_latency_us": 68163.859, "characteristics.accuracy": 75.76, "characteristics.good": 37880, "characteristics.total": 50000, "ck_system": "firefly-armnn-v21.02-opencl", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-large_224_1.0_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (OpenCL)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v3-large_224_1.0_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 1, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-armnn-v21.02-opencl", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-large_224_1.0_float.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-armnn-v21.02-opencl", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 14.9254, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "fd4a61c81fa4f6bb", "use_accelerator": true, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 67979752, "90.00 percentile latency (ns)": 68638354, "90th percentile latency (ns)": 68638354, "95.00 percentile latency (ns)": 69341562, "97.00 percentile latency (ns)": 76273872, "99.00 percentile latency (ns)": 77184159, "99.90 percentile latency (ns)": 86105627, "Max latency (ns)": 92580615, "Mean latency (ns)": 68378154, "Min duration satisfied": "Yes", "Min latency (ns)": 59628782, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 14.58, "QPS w/o loadgen overhead": 14.62, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "800 MHz", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "4 GiB (shared with host)", "accelerator_memory_configuration": "-", "accelerator_model_name": "Arm Mali-T860 MP4", "accelerator_on-chip_memories": "-", "accelerators_per_node": 1, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 68.638354, "characteristics.90th_percentile_latency_ns": 68638354.0, "characteristics.90th_percentile_latency_s": 0.068638354, "characteristics.90th_percentile_latency_us": 68638.354, "characteristics.accuracy": 72.678, "characteristics.good": 36339, "characteristics.total": 50000, "ck_system": "firefly-armnn-v21.02-opencl", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-large-minimalistic_224_1.0_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (OpenCL)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v3-large-minimalistic_224_1.0_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 1, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-armnn-v21.02-opencl", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-large-minimalistic_224_1.0_float.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-armnn-v21.02-opencl", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 14.4928, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "c27a4d212404dc34", "use_accelerator": true, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 8983008, "90.00 percentile latency (ns)": 11994254, "90th percentile latency (ns)": 11994254, "95.00 percentile latency (ns)": 13057511, "97.00 percentile latency (ns)": 13861495, "99.00 percentile latency (ns)": 15999774, "99.90 percentile latency (ns)": 22223610, "Max latency (ns)": 31159683, "Mean latency (ns)": 9267563, "Min duration satisfied": "Yes", "Min latency (ns)": 5514868, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 107.73, "QPS w/o loadgen overhead": 107.9, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 11.994254, "characteristics.90th_percentile_latency_ns": 11994254.0, "characteristics.90th_percentile_latency_s": 0.011994254, "characteristics.90th_percentile_latency_us": 11994.254, "characteristics.accuracy": 68.242, "characteristics.good": 34121, "characteristics.power": 0.14762839612746328, "characteristics.power.normalized_per_core": 0.0012302366343955274, "characteristics.power.normalized_per_processor": 0.14762839612746328, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.75-192-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-0.75-192-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.75_192.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 100, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "59ef4b408e88bc11", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 11663442, "90.00 percentile latency (ns)": 16997262, "90th percentile latency (ns)": 16997262, "95.00 percentile latency (ns)": 19047518, "97.00 percentile latency (ns)": 20359298, "99.00 percentile latency (ns)": 23394958, "99.90 percentile latency (ns)": 29416527, "Max latency (ns)": 40216984, "Mean latency (ns)": 12111581, "Min duration satisfied": "Yes", "Min latency (ns)": 7550552, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 82.46, "QPS w/o loadgen overhead": 82.57, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 16.997262, "characteristics.90th_percentile_latency_ns": 16997262.0, "characteristics.90th_percentile_latency_s": 0.016997262, "characteristics.90th_percentile_latency_us": 16997.262, "characteristics.accuracy": 70.738, "characteristics.good": 35369, "characteristics.power": 0.1882582345127124, "characteristics.power.normalized_per_core": 0.0015688186209392699, "characteristics.power.normalized_per_processor": 0.1882582345127124, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-192-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-1.0-192-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_1.0_192.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 76.9231, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "a8abc44783a72fac", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 151132999, "90.00 percentile latency (ns)": 170537284, "90th percentile latency (ns)": 170537284, "95.00 percentile latency (ns)": 180100665, "97.00 percentile latency (ns)": 185350585, "99.00 percentile latency (ns)": 202184917, "99.90 percentile latency (ns)": 237026307, "Max latency (ns)": 252815561, "Mean latency (ns)": 153860936, "Min duration satisfied": "Yes", "Min latency (ns)": 136330219, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 6.5, "QPS w/o loadgen overhead": 6.5, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 170.537284, "characteristics.90th_percentile_latency_ns": 170537284.0, "characteristics.90th_percentile_latency_s": 0.170537284, "characteristics.90th_percentile_latency_us": 170537.284, "characteristics.accuracy": 78.564, "characteristics.good": 39282, "characteristics.power": 3.107698652439596, "characteristics.power.normalized_per_core": 0.02589748877032997, "characteristics.power.normalized_per_processor": 3.107698652439596, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite4-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "efficientnet-lite4-quantized", "input_data_types": "uint8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite4.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 66.6667, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "ceb04e435b04a53a", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 13266433, "90.00 percentile latency (ns)": 18690818, "90th percentile latency (ns)": 18690818, "95.00 percentile latency (ns)": 20562766, "97.00 percentile latency (ns)": 21861347, "99.00 percentile latency (ns)": 25026121, "99.90 percentile latency (ns)": 30375269, "Max latency (ns)": 51035225, "Mean latency (ns)": 13598318, "Min duration satisfied": "Yes", "Min latency (ns)": 8640547, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 73.47, "QPS w/o loadgen overhead": 73.54, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 18.690818, "characteristics.90th_percentile_latency_ns": 18690818.0, "characteristics.90th_percentile_latency_s": 0.018690818, "characteristics.90th_percentile_latency_us": 18690.818, "characteristics.accuracy": 63.65, "characteristics.good": 31825, "characteristics.power": 0.17947995473606168, "characteristics.power.normalized_per_core": 0.0014956662894671806, "characteristics.power.normalized_per_processor": 0.17947995473606168, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-224-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-0.5-224-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_224_50.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 76.9231, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "824faa884791d91f", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 6490698, "90.00 percentile latency (ns)": 11561178, "90th percentile latency (ns)": 11561178, "95.00 percentile latency (ns)": 12848655, "97.00 percentile latency (ns)": 13530123, "99.00 percentile latency (ns)": 14764126, "99.90 percentile latency (ns)": 21643607, "Max latency (ns)": 44737931, "Mean latency (ns)": 7327035, "Min duration satisfied": "Yes", "Min latency (ns)": 3748058, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 136.13, "QPS w/o loadgen overhead": 136.48, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 11.561178, "characteristics.90th_percentile_latency_ns": 11561178.0, "characteristics.90th_percentile_latency_s": 0.011561178, "characteristics.90th_percentile_latency_us": 11561.178, "characteristics.accuracy": 52.172, "characteristics.good": 26086, "characteristics.power": 0.07853137640917149, "characteristics.power.normalized_per_core": 0.0006544281367430958, "characteristics.power.normalized_per_processor": 0.07853137640917149, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-128-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-0.35-128-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.35_128.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 166.667, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "4edda175b1643d29", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 7679081, "90.00 percentile latency (ns)": 14015577, "90th percentile latency (ns)": 14015577, "95.00 percentile latency (ns)": 15201901, "97.00 percentile latency (ns)": 15815685, "99.00 percentile latency (ns)": 17064379, "99.90 percentile latency (ns)": 24203534, "Max latency (ns)": 33243178, "Mean latency (ns)": 8555816, "Min duration satisfied": "Yes", "Min latency (ns)": 4101200, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 116.59, "QPS w/o loadgen overhead": 116.88, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 14.015577, "characteristics.90th_percentile_latency_ns": 14015577.0, "characteristics.90th_percentile_latency_s": 0.014015577, "characteristics.90th_percentile_latency_us": 14015.577, "characteristics.accuracy": 58.402, "characteristics.good": 29201, "characteristics.power": 0.09039523793186256, "characteristics.power.normalized_per_core": 0.000753293649432188, "characteristics.power.normalized_per_processor": 0.09039523793186256, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-128-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-0.5-128-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.5_128.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 166.667, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "35a67926986cd85a", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 10659060, "90.00 percentile latency (ns)": 17533691, "90th percentile latency (ns)": 17533691, "95.00 percentile latency (ns)": 19275623, "97.00 percentile latency (ns)": 20299732, "99.00 percentile latency (ns)": 22130854, "99.90 percentile latency (ns)": 28602887, "Max latency (ns)": 39287664, "Mean latency (ns)": 11407188, "Min duration satisfied": "Yes", "Min latency (ns)": 5671447, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 87.5, "QPS w/o loadgen overhead": 87.66, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 17.533691, "characteristics.90th_percentile_latency_ns": 17533691.0, "characteristics.90th_percentile_latency_s": 0.017533691, "characteristics.90th_percentile_latency_us": 17533.691, "characteristics.accuracy": 60.976, "characteristics.good": 30488, "characteristics.power": 0.127009060797053, "characteristics.power.normalized_per_core": 0.0010584088399754415, "characteristics.power.normalized_per_processor": 0.127009060797053, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-0.35-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.35_224.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 125, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "ae805a0df8c84c0e", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 6218182, "90.00 percentile latency (ns)": 10259121, "90th percentile latency (ns)": 10259121, "95.00 percentile latency (ns)": 11311997, "97.00 percentile latency (ns)": 11898963, "99.00 percentile latency (ns)": 12937659, "99.90 percentile latency (ns)": 18460456, "Max latency (ns)": 29604754, "Mean latency (ns)": 6655081, "Min duration satisfied": "Yes", "Min latency (ns)": 3264424, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 149.94, "QPS w/o loadgen overhead": 150.26, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 10.259121, "characteristics.90th_percentile_latency_ns": 10259121.0, "characteristics.90th_percentile_latency_s": 0.010259121, "characteristics.90th_percentile_latency_us": 10259.121, "characteristics.accuracy": 48.114, "characteristics.good": 24057, "characteristics.power": 0.06885247359446517, "characteristics.power.normalized_per_core": 0.0005737706132872098, "characteristics.power.normalized_per_processor": 0.06885247359446517, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.25-192-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-0.25-192-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.25_192_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 166.667, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "c5fca4f64b7580d3", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 16872201, "90.00 percentile latency (ns)": 19510264, "90th percentile latency (ns)": 19510264, "95.00 percentile latency (ns)": 21136758, "97.00 percentile latency (ns)": 22854075, "99.00 percentile latency (ns)": 26325928, "99.90 percentile latency (ns)": 32059952, "Max latency (ns)": 39204083, "Mean latency (ns)": 16449028, "Min duration satisfied": "Yes", "Min latency (ns)": 10445125, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 60.73, "QPS w/o loadgen overhead": 60.79, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 19.510264, "characteristics.90th_percentile_latency_ns": 19510264.0, "characteristics.90th_percentile_latency_s": 0.019510264, "characteristics.90th_percentile_latency_us": 19510.264, "characteristics.accuracy": 75.068, "characteristics.good": 37534, "characteristics.power": 0.2809386832813849, "characteristics.power.normalized_per_core": 0.0023411556940115407, "characteristics.power.normalized_per_processor": 0.2809386832813849, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite0-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "efficientnet-lite0-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite0.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 66.6667, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "c6264470aa60921a", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 6287822, "90.00 percentile latency (ns)": 10529060, "90th percentile latency (ns)": 10529060, "95.00 percentile latency (ns)": 11745112, "97.00 percentile latency (ns)": 12522363, "99.00 percentile latency (ns)": 14002234, "99.90 percentile latency (ns)": 18996719, "Max latency (ns)": 27685098, "Mean latency (ns)": 6752544, "Min duration satisfied": "Yes", "Min latency (ns)": 3771490, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 147.84, "QPS w/o loadgen overhead": 148.09, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 10.52906, "characteristics.90th_percentile_latency_ns": 10529060.0, "characteristics.90th_percentile_latency_s": 0.01052906, "characteristics.90th_percentile_latency_us": 10529.06, "characteristics.accuracy": 50.164, "characteristics.good": 25082, "characteristics.power": 0.07676661435927958, "characteristics.power.normalized_per_core": 0.0006397217863273297, "characteristics.power.normalized_per_processor": 0.07676661435927958, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.25-224-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-0.25-224-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.25_224_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 142.857, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "3f01cadcc14e03b8", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 5407848, "90.00 percentile latency (ns)": 10552771, "90th percentile latency (ns)": 10552771, "95.00 percentile latency (ns)": 11689076, "97.00 percentile latency (ns)": 12375346, "99.00 percentile latency (ns)": 13604422, "99.90 percentile latency (ns)": 19308315, "Max latency (ns)": 28866964, "Mean latency (ns)": 6132029, "Min duration satisfied": "Yes", "Min latency (ns)": 3134662, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 162.65, "QPS w/o loadgen overhead": 163.08, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 10.552771, "characteristics.90th_percentile_latency_ns": 10552771.0, "characteristics.90th_percentile_latency_s": 0.010552771, "characteristics.90th_percentile_latency_us": 10552.771, "characteristics.accuracy": 60.842, "characteristics.good": 30421, "characteristics.power": 0.07284193893486465, "characteristics.power.normalized_per_core": 0.0006070161577905388, "characteristics.power.normalized_per_processor": 0.07284193893486465, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.5-160-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-0.5-160-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.5_160.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 166.667, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "544881b40386e958", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 10641061, "90.00 percentile latency (ns)": 16721840, "90th percentile latency (ns)": 16721840, "95.00 percentile latency (ns)": 18875246, "97.00 percentile latency (ns)": 20416596, "99.00 percentile latency (ns)": 23538085, "99.90 percentile latency (ns)": 29148005, "Max latency (ns)": 37968438, "Mean latency (ns)": 11194607, "Min duration satisfied": "Yes", "Min latency (ns)": 6208791, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 89.19, "QPS w/o loadgen overhead": 89.33, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 16.72184, "characteristics.90th_percentile_latency_ns": 16721840.0, "characteristics.90th_percentile_latency_s": 0.01672184, "characteristics.90th_percentile_latency_us": 16721.84, "characteristics.accuracy": 69.016, "characteristics.good": 34508, "characteristics.power": 0.1567662464098782, "characteristics.power.normalized_per_core": 0.001306385386748985, "characteristics.power.normalized_per_processor": 0.1567662464098782, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-160-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-1.0-160-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_1.0_160.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 90.9091, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "4da17474b6692588", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 43286985, "90.00 percentile latency (ns)": 54647994, "90th percentile latency (ns)": 54647994, "95.00 percentile latency (ns)": 59504815, "97.00 percentile latency (ns)": 64602221, "99.00 percentile latency (ns)": 80422825, "99.90 percentile latency (ns)": 93267704, "Max latency (ns)": 104490340, "Mean latency (ns)": 46072718, "Min duration satisfied": "Yes", "Min latency (ns)": 41317329, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 21.7, "QPS w/o loadgen overhead": 21.7, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 54.647994, "characteristics.90th_percentile_latency_ns": 54647994.0, "characteristics.90th_percentile_latency_s": 0.054647994, "characteristics.90th_percentile_latency_us": 54647.994, "characteristics.accuracy": 74.116, "characteristics.good": 37058, "characteristics.power": 0.9625113875356974, "characteristics.power.normalized_per_core": 0.008020928229464146, "characteristics.power.normalized_per_processor": 0.9625113875356974, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite1-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "efficientnet-lite1-quantized", "input_data_types": "uint8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite1.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 66.6667, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "e4aab913731b57fd", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 13113534, "90.00 percentile latency (ns)": 20521308, "90th percentile latency (ns)": 20521308, "95.00 percentile latency (ns)": 22677864, "97.00 percentile latency (ns)": 24033782, "99.00 percentile latency (ns)": 26206104, "99.90 percentile latency (ns)": 30798954, "Max latency (ns)": 37852900, "Mean latency (ns)": 13673921, "Min duration satisfied": "Yes", "Min latency (ns)": 7596848, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 73.04, "QPS w/o loadgen overhead": 73.13, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 20.521308, "characteristics.90th_percentile_latency_ns": 20521308.0, "characteristics.90th_percentile_latency_s": 0.020521308, "characteristics.90th_percentile_latency_us": 20521.308, "characteristics.accuracy": 61.948, "characteristics.good": 30974, "characteristics.power": 0.15486069182432974, "characteristics.power.normalized_per_core": 0.001290505765202748, "characteristics.power.normalized_per_processor": 0.15486069182432974, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-192-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-0.5-192-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_192_50.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 83.3333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "0b2484d8e8f7ad65", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 11732770, "90.00 percentile latency (ns)": 13838846, "90th percentile latency (ns)": 13838846, "95.00 percentile latency (ns)": 14858253, "97.00 percentile latency (ns)": 15696081, "99.00 percentile latency (ns)": 18067836, "99.90 percentile latency (ns)": 24159106, "Max latency (ns)": 38807562, "Mean latency (ns)": 11644468, "Min duration satisfied": "Yes", "Min latency (ns)": 7145915, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 85.8, "QPS w/o loadgen overhead": 85.88, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 13.838846, "characteristics.90th_percentile_latency_ns": 13838846.0, "characteristics.90th_percentile_latency_s": 0.013838846, "characteristics.90th_percentile_latency_us": 13838.846, "characteristics.accuracy": 62.264, "characteristics.good": 31132, "characteristics.power": 0.16156005902056636, "characteristics.power.normalized_per_core": 0.0013463338251713864, "characteristics.power.normalized_per_processor": 0.16156005902056636, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.5-224-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-0.5-224-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.5_224_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 83.3333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "5f4e278c0dcbd423", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 8792155, "90.00 percentile latency (ns)": 14268680, "90th percentile latency (ns)": 14268680, "95.00 percentile latency (ns)": 15791272, "97.00 percentile latency (ns)": 16606587, "99.00 percentile latency (ns)": 17911942, "99.90 percentile latency (ns)": 24310025, "Max latency (ns)": 33402072, "Mean latency (ns)": 9513778, "Min duration satisfied": "Yes", "Min latency (ns)": 5150303, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 104.93, "QPS w/o loadgen overhead": 105.11, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 14.26868, "characteristics.90th_percentile_latency_ns": 14268680.0, "characteristics.90th_percentile_latency_s": 0.01426868, "characteristics.90th_percentile_latency_us": 14268.68, "characteristics.accuracy": 49.19, "characteristics.good": 24595, "characteristics.power": 0.09861066107563761, "characteristics.power.normalized_per_core": 0.0008217555089636467, "characteristics.power.normalized_per_processor": 0.09861066107563761, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-128-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-0.35-128-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_128_35.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 125, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "0be649d9b30a678a", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 23532464, "90.00 percentile latency (ns)": 36884210, "90th percentile latency (ns)": 36884210, "95.00 percentile latency (ns)": 39973615, "97.00 percentile latency (ns)": 41542425, "99.00 percentile latency (ns)": 46135795, "99.90 percentile latency (ns)": 52699470, "Max latency (ns)": 61503620, "Mean latency (ns)": 26099460, "Min duration satisfied": "Yes", "Min latency (ns)": 22323514, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 38.29, "QPS w/o loadgen overhead": 38.31, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 36.88421, "characteristics.90th_percentile_latency_ns": 36884210.0, "characteristics.90th_percentile_latency_s": 0.03688421, "characteristics.90th_percentile_latency_us": 36884.21, "characteristics.accuracy": 73.556, "characteristics.good": 36778, "characteristics.power": 0.44649261162641735, "characteristics.power.normalized_per_core": 0.0037207717635534777, "characteristics.power.normalized_per_processor": 0.44649261162641735, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.4-224-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-1.4-224-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_224_140.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 37.037, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "ea255b2673870cab", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 18198831, "90.00 percentile latency (ns)": 21170270, "90th percentile latency (ns)": 21170270, "95.00 percentile latency (ns)": 29048994, "97.00 percentile latency (ns)": 30847223, "99.00 percentile latency (ns)": 33920489, "99.90 percentile latency (ns)": 40312491, "Max latency (ns)": 50666597, "Mean latency (ns)": 19235021, "Min duration satisfied": "Yes", "Min latency (ns)": 17097826, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 51.96, "QPS w/o loadgen overhead": 51.99, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 21.17027, "characteristics.90th_percentile_latency_ns": 21170270.0, "characteristics.90th_percentile_latency_s": 0.02117027, "characteristics.90th_percentile_latency_us": 21170.27, "characteristics.accuracy": 70.764, "characteristics.good": 35382, "characteristics.power": 0.33813162419483167, "characteristics.power.normalized_per_core": 0.002817763534956931, "characteristics.power.normalized_per_processor": 0.33813162419483167, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-1.0-224-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-1.0-224-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_1.0_224_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 50, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "4b922e2c8b7689e1", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 2535082, "90.00 percentile latency (ns)": 4611238, "90th percentile latency (ns)": 4611238, "95.00 percentile latency (ns)": 5589773, "97.00 percentile latency (ns)": 6201947, "99.00 percentile latency (ns)": 7219047, "99.90 percentile latency (ns)": 9758662, "Max latency (ns)": 25979078, "Mean latency (ns)": 3110571, "Min duration satisfied": "Yes", "Min latency (ns)": 2215961, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 320.87, "QPS w/o loadgen overhead": 321.48, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 4.611238, "characteristics.90th_percentile_latency_ns": 4611238.0, "characteristics.90th_percentile_latency_s": 0.004611238, "characteristics.90th_percentile_latency_us": 4611.238, "characteristics.accuracy": 47.81, "characteristics.good": 23905, "characteristics.power": 0.040484085603961675, "characteristics.power.normalized_per_core": 0.00033736738003301394, "characteristics.power.normalized_per_processor": 0.040484085603961675, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.25-160-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-0.25-160-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.25_160.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 250, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "edf46a887b1ec56b", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 9405957, "90.00 percentile latency (ns)": 17171012, "90th percentile latency (ns)": 17171012, "95.00 percentile latency (ns)": 18925224, "97.00 percentile latency (ns)": 19824850, "99.00 percentile latency (ns)": 21274900, "99.90 percentile latency (ns)": 27254976, "Max latency (ns)": 45878571, "Mean latency (ns)": 10388911, "Min duration satisfied": "Yes", "Min latency (ns)": 4879248, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 96.06, "QPS w/o loadgen overhead": 96.26, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 17.171012, "characteristics.90th_percentile_latency_ns": 17171012.0, "characteristics.90th_percentile_latency_s": 0.017171012, "characteristics.90th_percentile_latency_us": 17171.012, "characteristics.accuracy": 64.038, "characteristics.good": 32019, "characteristics.power": 0.11763840439932148, "characteristics.power.normalized_per_core": 0.0009803200366610124, "characteristics.power.normalized_per_processor": 0.11763840439932148, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-128-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-0.75-128-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.75_128.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 125, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "4dc39db1da38d63c", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 5361392, "90.00 percentile latency (ns)": 9067761, "90th percentile latency (ns)": 9067761, "95.00 percentile latency (ns)": 10013196, "97.00 percentile latency (ns)": 10606584, "99.00 percentile latency (ns)": 11850194, "99.90 percentile latency (ns)": 17501932, "Max latency (ns)": 29377603, "Mean latency (ns)": 5865697, "Min duration satisfied": "Yes", "Min latency (ns)": 3334740, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 170.06, "QPS w/o loadgen overhead": 170.48, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 9.067761, "characteristics.90th_percentile_latency_ns": 9067761.0, "characteristics.90th_percentile_latency_s": 0.009067761, "characteristics.90th_percentile_latency_us": 9067.761, "characteristics.accuracy": 51.848, "characteristics.good": 25924, "characteristics.power": 0.06777076730388153, "characteristics.power.normalized_per_core": 0.0005647563941990128, "characteristics.power.normalized_per_processor": 0.06777076730388153, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.25-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-0.25-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.25_224.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 166.667, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "21e4776482a83f1f", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 6919237, "90.00 percentile latency (ns)": 15599944, "90th percentile latency (ns)": 15599944, "95.00 percentile latency (ns)": 17980800, "97.00 percentile latency (ns)": 19431934, "99.00 percentile latency (ns)": 21772809, "99.90 percentile latency (ns)": 25766161, "Max latency (ns)": 42719727, "Mean latency (ns)": 9497371, "Min duration satisfied": "Yes", "Min latency (ns)": 6069756, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 105.16, "QPS w/o loadgen overhead": 105.29, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 15.599944, "characteristics.90th_percentile_latency_ns": 15599944.0, "characteristics.90th_percentile_latency_s": 0.015599944, "characteristics.90th_percentile_latency_us": 15599.944, "characteristics.accuracy": 59.232, "characteristics.good": 29616, "characteristics.power": 0.11750716395957758, "characteristics.power.normalized_per_core": 0.0009792263663298132, "characteristics.power.normalized_per_processor": 0.11750716395957758, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-160-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-0.5-160-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_160_50.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 100, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "1b8296a14a3be2a0", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 16317443, "90.00 percentile latency (ns)": 19027152, "90th percentile latency (ns)": 19027152, "95.00 percentile latency (ns)": 20185059, "97.00 percentile latency (ns)": 21225831, "99.00 percentile latency (ns)": 23643261, "99.90 percentile latency (ns)": 29167434, "Max latency (ns)": 40206319, "Mean latency (ns)": 14827747, "Min duration satisfied": "Yes", "Min latency (ns)": 10391755, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 67.39, "QPS w/o loadgen overhead": 67.44, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 19.027152, "characteristics.90th_percentile_latency_ns": 19027152.0, "characteristics.90th_percentile_latency_s": 0.019027152, "characteristics.90th_percentile_latency_us": 19027.152, "characteristics.accuracy": 68.212, "characteristics.good": 34106, "characteristics.power": 0.2253720172951003, "characteristics.power.normalized_per_core": 0.001878100144125836, "characteristics.power.normalized_per_processor": 0.2253720172951003, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-1.0-160-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-1.0-160-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_1.0_160_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 66.6667, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "e9ee488e942c1dc8", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 11612157, "90.00 percentile latency (ns)": 17841447, "90th percentile latency (ns)": 17841447, "95.00 percentile latency (ns)": 19515255, "97.00 percentile latency (ns)": 20497322, "99.00 percentile latency (ns)": 22325970, "99.90 percentile latency (ns)": 28337369, "Max latency (ns)": 40167122, "Mean latency (ns)": 12295824, "Min duration satisfied": "Yes", "Min latency (ns)": 6432357, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 81.2, "QPS w/o loadgen overhead": 81.33, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 17.841447, "characteristics.90th_percentile_latency_ns": 17841447.0, "characteristics.90th_percentile_latency_s": 0.017841447, "characteristics.90th_percentile_latency_us": 17841.447, "characteristics.accuracy": 59.072, "characteristics.good": 29536, "characteristics.power": 0.12881235208026703, "characteristics.power.normalized_per_core": 0.0010734362673355585, "characteristics.power.normalized_per_processor": 0.12881235208026703, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-96-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-1.0-96-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_96_100.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 100, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "51675c6964cb3a71", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 8684828, "90.00 percentile latency (ns)": 11332547, "90th percentile latency (ns)": 11332547, "95.00 percentile latency (ns)": 12259262, "97.00 percentile latency (ns)": 13002684, "99.00 percentile latency (ns)": 14996311, "99.90 percentile latency (ns)": 21437877, "Max latency (ns)": 29964834, "Mean latency (ns)": 8971845, "Min duration satisfied": "Yes", "Min latency (ns)": 5076206, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 111.32, "QPS w/o loadgen overhead": 111.46, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 11.332547, "characteristics.90th_percentile_latency_ns": 11332547.0, "characteristics.90th_percentile_latency_s": 0.011332547, "characteristics.90th_percentile_latency_us": 11332.547, "characteristics.accuracy": 58.386, "characteristics.good": 29193, "characteristics.power": 0.11762951517710347, "characteristics.power.normalized_per_core": 0.0009802459598091957, "characteristics.power.normalized_per_processor": 0.11762951517710347, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.75-128-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-0.75-128-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.75_128_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 111.111, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "64fb4887903e775d", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 25401560, "90.00 percentile latency (ns)": 28243154, "90th percentile latency (ns)": 28243154, "95.00 percentile latency (ns)": 30427206, "97.00 percentile latency (ns)": 32890097, "99.00 percentile latency (ns)": 36619795, "99.90 percentile latency (ns)": 42421804, "Max latency (ns)": 52279677, "Mean latency (ns)": 24299595, "Min duration satisfied": "Yes", "Min latency (ns)": 16664997, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 41.13, "QPS w/o loadgen overhead": 41.15, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 28.243154, "characteristics.90th_percentile_latency_ns": 28243154.0, "characteristics.90th_percentile_latency_s": 0.028243154, "characteristics.90th_percentile_latency_us": 28243.154, "characteristics.accuracy": 72.894, "characteristics.good": 36447, "characteristics.power": 0.3503341648957468, "characteristics.power.normalized_per_core": 0.0029194513741312234, "characteristics.power.normalized_per_processor": 0.3503341648957468, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-large_224_1.0_uint8", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v3-large_224_1.0_uint8", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-large_224_1.0_uint8.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 100, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "a407ab1c9b8697e7", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 21638757, "90.00 percentile latency (ns)": 26620502, "90th percentile latency (ns)": 26620502, "95.00 percentile latency (ns)": 28375186, "97.00 percentile latency (ns)": 29948927, "99.00 percentile latency (ns)": 33310885, "99.90 percentile latency (ns)": 39238583, "Max latency (ns)": 46940520, "Mean latency (ns)": 20779044, "Min duration satisfied": "Yes", "Min latency (ns)": 14445751, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 48.09, "QPS w/o loadgen overhead": 48.13, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 26.620502, "characteristics.90th_percentile_latency_ns": 26620502.0, "characteristics.90th_percentile_latency_s": 0.026620502, "characteristics.90th_percentile_latency_us": 26620.502, "characteristics.accuracy": 70.598, "characteristics.good": 35299, "characteristics.power": 0.31790656749955143, "characteristics.power.normalized_per_core": 0.0026492213958295954, "characteristics.power.normalized_per_processor": 0.31790656749955143, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-224-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-1.0-224-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_224_100.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 45.4545, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "71e4f6eb504201e7", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 12156208, "90.00 percentile latency (ns)": 19209358, "90th percentile latency (ns)": 19209358, "95.00 percentile latency (ns)": 21306625, "97.00 percentile latency (ns)": 22482206, "99.00 percentile latency (ns)": 24551728, "99.90 percentile latency (ns)": 29663169, "Max latency (ns)": 39305885, "Mean latency (ns)": 12840814, "Min duration satisfied": "Yes", "Min latency (ns)": 7168161, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 77.78, "QPS w/o loadgen overhead": 77.88, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 19.209358, "characteristics.90th_percentile_latency_ns": 19209358.0, "characteristics.90th_percentile_latency_s": 0.019209358, "characteristics.90th_percentile_latency_us": 19209.358, "characteristics.accuracy": 56.522, "characteristics.good": 28261, "characteristics.power": 0.14198038005605712, "characteristics.power.normalized_per_core": 0.001183169833800476, "characteristics.power.normalized_per_processor": 0.14198038005605712, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-192-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-0.35-192-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_192_35.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 90.9091, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "4c141c59738432af", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 13183862, "90.00 percentile latency (ns)": 16820041, "90th percentile latency (ns)": 16820041, "95.00 percentile latency (ns)": 18348768, "97.00 percentile latency (ns)": 19682076, "99.00 percentile latency (ns)": 23300462, "99.90 percentile latency (ns)": 29537506, "Max latency (ns)": 39112014, "Mean latency (ns)": 13030530, "Min duration satisfied": "Yes", "Min latency (ns)": 9423102, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 76.67, "QPS w/o loadgen overhead": 76.74, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 16.820041, "characteristics.90th_percentile_latency_ns": 16820041.0, "characteristics.90th_percentile_latency_s": 0.016820041, "characteristics.90th_percentile_latency_us": 16820.041, "characteristics.accuracy": 67.726, "characteristics.good": 33863, "characteristics.power": 0.19326113948550477, "characteristics.power.normalized_per_core": 0.0016105094957125398, "characteristics.power.normalized_per_processor": 0.19326113948550477, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-160-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-1.0-160-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_160_100.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 76.9231, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "a0a5cb5f76f4263a", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 3054078, "90.00 percentile latency (ns)": 5169718, "90th percentile latency (ns)": 5169718, "95.00 percentile latency (ns)": 5828690, "97.00 percentile latency (ns)": 6263461, "99.00 percentile latency (ns)": 7129670, "99.90 percentile latency (ns)": 13221158, "Max latency (ns)": 23021398, "Mean latency (ns)": 3453033, "Min duration satisfied": "Yes", "Min latency (ns)": 1877231, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 288.64, "QPS w/o loadgen overhead": 289.6, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 5.169718, "characteristics.90th_percentile_latency_ns": 5169718.0, "characteristics.90th_percentile_latency_s": 0.005169718, "characteristics.90th_percentile_latency_us": 5169.718, "characteristics.accuracy": 44.116, "characteristics.good": 22058, "characteristics.power": 0.03823666635485636, "characteristics.power.normalized_per_core": 0.00031863888629046967, "characteristics.power.normalized_per_processor": 0.03823666635485636, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.25-128-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-0.25-128-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.25_128.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "bc47a1ad7493955e", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 5426397, "90.00 percentile latency (ns)": 8963660, "90th percentile latency (ns)": 8963660, "95.00 percentile latency (ns)": 9650953, "97.00 percentile latency (ns)": 10018776, "99.00 percentile latency (ns)": 10827514, "99.90 percentile latency (ns)": 16961716, "Max latency (ns)": 34404668, "Mean latency (ns)": 5813186, "Min duration satisfied": "Yes", "Min latency (ns)": 2712975, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 171.59, "QPS w/o loadgen overhead": 172.02, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 8.96366, "characteristics.90th_percentile_latency_ns": 8963660.0, "characteristics.90th_percentile_latency_s": 0.00896366, "characteristics.90th_percentile_latency_us": 8963.66, "characteristics.accuracy": 45.444, "characteristics.good": 22722, "characteristics.power": 0.05727001814444857, "characteristics.power.normalized_per_core": 0.0004772501512037381, "characteristics.power.normalized_per_processor": 0.05727001814444857, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.25-160-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-0.25-160-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.25_160_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 200, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "63364d47b3ba1f0b", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 13299268, "90.00 percentile latency (ns)": 16171810, "90th percentile latency (ns)": 16171810, "95.00 percentile latency (ns)": 17282483, "97.00 percentile latency (ns)": 18116479, "99.00 percentile latency (ns)": 20434741, "99.90 percentile latency (ns)": 25901646, "Max latency (ns)": 34435460, "Mean latency (ns)": 12911583, "Min duration satisfied": "Yes", "Min latency (ns)": 8315200, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 77.37, "QPS w/o loadgen overhead": 77.45, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 16.17181, "characteristics.90th_percentile_latency_ns": 16171810.0, "characteristics.90th_percentile_latency_s": 0.01617181, "characteristics.90th_percentile_latency_us": 16171.81, "characteristics.accuracy": 70.624, "characteristics.good": 35312, "characteristics.power": 0.22672045415181324, "characteristics.power.normalized_per_core": 0.001889337117931777, "characteristics.power.normalized_per_processor": 0.22672045415181324, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-1.0-192-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-1.0-192-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_1.0_192.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 71.4286, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "1f2498682d6e9221", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 15072774, "90.00 percentile latency (ns)": 21769317, "90th percentile latency (ns)": 21769317, "95.00 percentile latency (ns)": 23889386, "97.00 percentile latency (ns)": 25166720, "99.00 percentile latency (ns)": 27691411, "99.90 percentile latency (ns)": 32850660, "Max latency (ns)": 39276564, "Mean latency (ns)": 15421278, "Min duration satisfied": "Yes", "Min latency (ns)": 7661270, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 64.77, "QPS w/o loadgen overhead": 64.85, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 21.769317, "characteristics.90th_percentile_latency_ns": 21769317.0, "characteristics.90th_percentile_latency_s": 0.021769317, "characteristics.90th_percentile_latency_us": 21769.317, "characteristics.accuracy": 63.442, "characteristics.good": 31721, "characteristics.power": 0.1685541786710886, "characteristics.power.normalized_per_core": 0.001404618155592405, "characteristics.power.normalized_per_processor": 0.1685541786710886, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-128-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-1.0-128-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_128_100.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 76.9231, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "46696da945a99124", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 14471323, "90.00 percentile latency (ns)": 22891244, "90th percentile latency (ns)": 22891244, "95.00 percentile latency (ns)": 24614615, "97.00 percentile latency (ns)": 25686247, "99.00 percentile latency (ns)": 28151314, "99.90 percentile latency (ns)": 32968805, "Max latency (ns)": 50251610, "Mean latency (ns)": 16120383, "Min duration satisfied": "Yes", "Min latency (ns)": 13768220, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 61.99, "QPS w/o loadgen overhead": 62.03, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 22.891244, "characteristics.90th_percentile_latency_ns": 22891244.0, "characteristics.90th_percentile_latency_s": 0.022891244, "characteristics.90th_percentile_latency_us": 22891.244, "characteristics.accuracy": 70.094, "characteristics.good": 35047, "characteristics.power": 0.26943553109830176, "characteristics.power.normalized_per_core": 0.002245296092485848, "characteristics.power.normalized_per_processor": 0.26943553109830176, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-1.0-192-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-1.0-192-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_1.0_192_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 58.8235, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "62b2c47de9883cc7", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 65377951, "90.00 percentile latency (ns)": 80306648, "90th percentile latency (ns)": 80306648, "95.00 percentile latency (ns)": 87967292, "97.00 percentile latency (ns)": 96844419, "99.00 percentile latency (ns)": 105069029, "99.90 percentile latency (ns)": 119351638, "Max latency (ns)": 138295208, "Mean latency (ns)": 69557743, "Min duration satisfied": "Yes", "Min latency (ns)": 60440547, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 14.37, "QPS w/o loadgen overhead": 14.38, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 80.306648, "characteristics.90th_percentile_latency_ns": 80306648.0, "characteristics.90th_percentile_latency_s": 0.080306648, "characteristics.90th_percentile_latency_us": 80306.648, "characteristics.accuracy": 74.116, "characteristics.good": 37058, "characteristics.power": 1.354432933744286, "characteristics.power.normalized_per_core": 0.011286941114535716, "characteristics.power.normalized_per_processor": 1.354432933744286, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite2-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "efficientnet-lite2-quantized", "input_data_types": "uint8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite2.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 66.6667, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "c44bea9ef8c75828", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 7066088, "90.00 percentile latency (ns)": 9579322, "90th percentile latency (ns)": 9579322, "95.00 percentile latency (ns)": 10509169, "97.00 percentile latency (ns)": 11256520, "99.00 percentile latency (ns)": 13017091, "99.90 percentile latency (ns)": 18873305, "Max latency (ns)": 35360521, "Mean latency (ns)": 7230024, "Min duration satisfied": "Yes", "Min latency (ns)": 4456575, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 138.12, "QPS w/o loadgen overhead": 138.31, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 9.579322, "characteristics.90th_percentile_latency_ns": 9579322.0, "characteristics.90th_percentile_latency_s": 0.009579322, "characteristics.90th_percentile_latency_us": 9579.322, "characteristics.accuracy": 59.432, "characteristics.good": 29716, "characteristics.power": 0.0944029751691151, "characteristics.power.normalized_per_core": 0.0007866914597426258, "characteristics.power.normalized_per_processor": 0.0944029751691151, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.5-160-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-0.5-160-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.5_160_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 125, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "e0b6f201f5dfbf26", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 9014717, "90.00 percentile latency (ns)": 11143895, "90th percentile latency (ns)": 11143895, "95.00 percentile latency (ns)": 12035229, "97.00 percentile latency (ns)": 12752251, "99.00 percentile latency (ns)": 14712781, "99.90 percentile latency (ns)": 21330438, "Max latency (ns)": 33308893, "Mean latency (ns)": 9005844, "Min duration satisfied": "Yes", "Min latency (ns)": 5451814, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 110.92, "QPS w/o loadgen overhead": 111.04, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 11.143895, "characteristics.90th_percentile_latency_ns": 11143895.0, "characteristics.90th_percentile_latency_s": 0.011143895, "characteristics.90th_percentile_latency_us": 11143.895, "characteristics.accuracy": 61.458, "characteristics.good": 30729, "characteristics.power": 0.12213843111800285, "characteristics.power.normalized_per_core": 0.0010178202593166903, "characteristics.power.normalized_per_processor": 0.12213843111800285, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.5-192-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-0.5-192-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.5_192_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 100, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "084dc686311cd2bf", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 15084221, "90.00 percentile latency (ns)": 22346717, "90th percentile latency (ns)": 22346717, "95.00 percentile latency (ns)": 24503903, "97.00 percentile latency (ns)": 25837850, "99.00 percentile latency (ns)": 28158624, "99.90 percentile latency (ns)": 33398184, "Max latency (ns)": 44724351, "Mean latency (ns)": 15498800, "Min duration satisfied": "Yes", "Min latency (ns)": 8422581, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 64.44, "QPS w/o loadgen overhead": 64.52, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 22.346717, "characteristics.90th_percentile_latency_ns": 22346717.0, "characteristics.90th_percentile_latency_s": 0.022346717, "characteristics.90th_percentile_latency_us": 22346.717, "characteristics.accuracy": 58.544, "characteristics.good": 29272, "characteristics.power": 0.17350094991002607, "characteristics.power.normalized_per_core": 0.0014458412492502173, "characteristics.power.normalized_per_processor": 0.17350094991002607, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-224-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-0.35-224-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_224_35.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 76.9231, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "ea89b39bbc3292bb", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 10269855, "90.00 percentile latency (ns)": 18819545, "90th percentile latency (ns)": 18819545, "95.00 percentile latency (ns)": 20717139, "97.00 percentile latency (ns)": 21713854, "99.00 percentile latency (ns)": 23387696, "99.90 percentile latency (ns)": 28933917, "Max latency (ns)": 41476715, "Mean latency (ns)": 11256663, "Min duration satisfied": "Yes", "Min latency (ns)": 5190813, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 88.67, "QPS w/o loadgen overhead": 88.84, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 18.819545, "characteristics.90th_percentile_latency_ns": 18819545.0, "characteristics.90th_percentile_latency_s": 0.018819545, "characteristics.90th_percentile_latency_us": 18819.545, "characteristics.accuracy": 66.036, "characteristics.good": 33018, "characteristics.power": 0.13060446767213904, "characteristics.power.normalized_per_core": 0.001088370563934492, "characteristics.power.normalized_per_processor": 0.13060446767213904, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-128-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-1.0-128-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_1.0_128.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 111.111, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "ff5f2401680c7112", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 23427399, "90.00 percentile latency (ns)": 26739832, "90th percentile latency (ns)": 26739832, "95.00 percentile latency (ns)": 28830304, "97.00 percentile latency (ns)": 31265283, "99.00 percentile latency (ns)": 34962493, "99.90 percentile latency (ns)": 40453465, "Max latency (ns)": 46891204, "Mean latency (ns)": 22150857, "Min duration satisfied": "Yes", "Min latency (ns)": 14406313, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 45.11, "QPS w/o loadgen overhead": 45.14, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 26.739832, "characteristics.90th_percentile_latency_ns": 26739832.0, "characteristics.90th_percentile_latency_s": 0.026739832, "characteristics.90th_percentile_latency_us": 26739.832, "characteristics.accuracy": 76.642, "characteristics.good": 38321, "characteristics.power": 0.38791699366981014, "characteristics.power.normalized_per_core": 0.0032326416139150846, "characteristics.power.normalized_per_processor": 0.38791699366981014, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite1-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "efficientnet-lite1-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite1.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 66.6667, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "6c8910ed44661b44", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 18691505, "90.00 percentile latency (ns)": 21513713, "90th percentile latency (ns)": 21513713, "95.00 percentile latency (ns)": 23185751, "97.00 percentile latency (ns)": 24707564, "99.00 percentile latency (ns)": 28369645, "99.90 percentile latency (ns)": 35173316, "Max latency (ns)": 43619398, "Mean latency (ns)": 18017033, "Min duration satisfied": "Yes", "Min latency (ns)": 12287231, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 55.46, "QPS w/o loadgen overhead": 55.5, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 21.513713, "characteristics.90th_percentile_latency_ns": 21513713.0, "characteristics.90th_percentile_latency_s": 0.021513713, "characteristics.90th_percentile_latency_us": 21513.713, "characteristics.accuracy": 69.678, "characteristics.good": 34839, "characteristics.power": 0.2622627459535868, "characteristics.power.normalized_per_core": 0.0021855228829465567, "characteristics.power.normalized_per_processor": 0.2622627459535868, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-192-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-1.0-192-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_192_100.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 50, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "64114e2487b5e2e2", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 11188799, "90.00 percentile latency (ns)": 13809618, "90th percentile latency (ns)": 13809618, "95.00 percentile latency (ns)": 14956993, "97.00 percentile latency (ns)": 15801505, "99.00 percentile latency (ns)": 18243535, "99.90 percentile latency (ns)": 24507805, "Max latency (ns)": 40071028, "Mean latency (ns)": 11141577, "Min duration satisfied": "Yes", "Min latency (ns)": 6739135, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 89.64, "QPS w/o loadgen overhead": 89.75, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 13.809618, "characteristics.90th_percentile_latency_ns": 13809618.0, "characteristics.90th_percentile_latency_s": 0.013809618, "characteristics.90th_percentile_latency_us": 13809.618, "characteristics.accuracy": 69.262, "characteristics.good": 34631, "characteristics.power": 0.18498608376513612, "characteristics.power.normalized_per_core": 0.001541550698042801, "characteristics.power.normalized_per_processor": 0.18498608376513612, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.75-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-0.75-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.75_224.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 90.9091, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "47a38bb4d4fb49ea", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 18166482, "90.00 percentile latency (ns)": 22564149, "90th percentile latency (ns)": 22564149, "95.00 percentile latency (ns)": 24078395, "97.00 percentile latency (ns)": 25632547, "99.00 percentile latency (ns)": 29076928, "99.90 percentile latency (ns)": 35207230, "Max latency (ns)": 44361745, "Mean latency (ns)": 17517179, "Min duration satisfied": "Yes", "Min latency (ns)": 12362604, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 57.04, "QPS w/o loadgen overhead": 57.09, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 22.564149, "characteristics.90th_percentile_latency_ns": 22564149.0, "characteristics.90th_percentile_latency_s": 0.022564149, "characteristics.90th_percentile_latency_us": 22564.149, "characteristics.accuracy": 68.76, "characteristics.good": 34380, "characteristics.power": 0.2686167850539811, "characteristics.power.normalized_per_core": 0.002238473208783176, "characteristics.power.normalized_per_processor": 0.2686167850539811, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-224-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-0.75-224-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_224_75.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 50, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "4834bd1b9989ee5d", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 6707135, "90.00 percentile latency (ns)": 7869873, "90th percentile latency (ns)": 7869873, "95.00 percentile latency (ns)": 8294242, "97.00 percentile latency (ns)": 8671345, "99.00 percentile latency (ns)": 10425309, "99.90 percentile latency (ns)": 18044612, "Max latency (ns)": 25348957, "Mean latency (ns)": 6666517, "Min duration satisfied": "Yes", "Min latency (ns)": 4439390, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 149.7, "QPS w/o loadgen overhead": 150.0, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 7.869873, "characteristics.90th_percentile_latency_ns": 7869873.0, "characteristics.90th_percentile_latency_s": 0.007869873, "characteristics.90th_percentile_latency_us": 7869.873, "characteristics.accuracy": 63.33, "characteristics.good": 31665, "characteristics.power": 0.09462673373368684, "characteristics.power.normalized_per_core": 0.0007885561144473903, "characteristics.power.normalized_per_processor": 0.09462673373368684, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-small-minimalistic_224_1.0_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v3-small-minimalistic_224_1.0_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-small-minimalistic_224_1.0_float.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 100, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "402bb4115e87dc69", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 4374033, "90.00 percentile latency (ns)": 8984164, "90th percentile latency (ns)": 8984164, "95.00 percentile latency (ns)": 9932393, "97.00 percentile latency (ns)": 10452030, "99.00 percentile latency (ns)": 11288008, "99.90 percentile latency (ns)": 16996958, "Max latency (ns)": 26221169, "Mean latency (ns)": 5105663, "Min duration satisfied": "Yes", "Min latency (ns)": 2476708, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 195.21, "QPS w/o loadgen overhead": 195.86, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 8.984164, "characteristics.90th_percentile_latency_ns": 8984164.0, "characteristics.90th_percentile_latency_s": 0.008984164, "characteristics.90th_percentile_latency_us": 8984.164, "characteristics.accuracy": 57.918, "characteristics.good": 28959, "characteristics.power": 0.05785452291425468, "characteristics.power.normalized_per_core": 0.00048212102428545566, "characteristics.power.normalized_per_processor": 0.05785452291425468, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.5-128-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-0.5-128-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.5_128.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 200, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "dcf77729466e8ed5", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 10918483, "90.00 percentile latency (ns)": 17930653, "90th percentile latency (ns)": 17930653, "95.00 percentile latency (ns)": 19243012, "97.00 percentile latency (ns)": 20145318, "99.00 percentile latency (ns)": 22033948, "99.90 percentile latency (ns)": 26693424, "Max latency (ns)": 39431369, "Mean latency (ns)": 12603950, "Min duration satisfied": "Yes", "Min latency (ns)": 10383085, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 79.23, "QPS w/o loadgen overhead": 79.34, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 17.930653, "characteristics.90th_percentile_latency_ns": 17930653.0, "characteristics.90th_percentile_latency_s": 0.017930653, "characteristics.90th_percentile_latency_us": 17930.653, "characteristics.accuracy": 71.674, "characteristics.good": 35837, "characteristics.power": 0.2580203689773608, "characteristics.power.normalized_per_core": 0.0021501697414780065, "characteristics.power.normalized_per_processor": 0.2580203689773608, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-1.0-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-1.0-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_1.0_224.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 66.6667, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "73474485e8c417aa", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 7167125, "90.00 percentile latency (ns)": 11471660, "90th percentile latency (ns)": 11471660, "95.00 percentile latency (ns)": 12801190, "97.00 percentile latency (ns)": 13530981, "99.00 percentile latency (ns)": 14768806, "99.90 percentile latency (ns)": 21209858, "Max latency (ns)": 33246067, "Mean latency (ns)": 7829000, "Min duration satisfied": "Yes", "Min latency (ns)": 4356056, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 127.48, "QPS w/o loadgen overhead": 127.73, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 11.47166, "characteristics.90th_percentile_latency_ns": 11471660.0, "characteristics.90th_percentile_latency_s": 0.01147166, "characteristics.90th_percentile_latency_us": 11471.66, "characteristics.accuracy": 43.454, "characteristics.good": 21727, "characteristics.power": 0.08115642469786585, "characteristics.power.normalized_per_core": 0.0006763035391488821, "characteristics.power.normalized_per_processor": 0.08115642469786585, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-96-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-0.35-96-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_96_35.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 166.667, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "32bf11234a3f5bfd", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 42843911, "90.00 percentile latency (ns)": 77314084, "90th percentile latency (ns)": 77314084, "95.00 percentile latency (ns)": 81061939, "97.00 percentile latency (ns)": 83912242, "99.00 percentile latency (ns)": 91711307, "99.90 percentile latency (ns)": 99747516, "Max latency (ns)": 105543697, "Mean latency (ns)": 50065569, "Min duration satisfied": "Yes", "Min latency (ns)": 40976028, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 19.97, "QPS w/o loadgen overhead": 19.97, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 77.314084, "characteristics.90th_percentile_latency_ns": 77314084.0, "characteristics.90th_percentile_latency_s": 0.077314084, "characteristics.90th_percentile_latency_us": 77314.084, "characteristics.accuracy": 80.676, "characteristics.good": 40338, "characteristics.power": 1.105265486356313, "characteristics.power.normalized_per_core": 0.009210545719635942, "characteristics.power.normalized_per_processor": 1.105265486356313, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite4-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "efficientnet-lite4-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite4.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 66.6667, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "784baeb0e09e933b", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 20279562, "90.00 percentile latency (ns)": 22373190, "90th percentile latency (ns)": 22373190, "95.00 percentile latency (ns)": 23832088, "97.00 percentile latency (ns)": 25654868, "99.00 percentile latency (ns)": 29569717, "99.90 percentile latency (ns)": 34922193, "Max latency (ns)": 42362597, "Mean latency (ns)": 19235794, "Min duration satisfied": "Yes", "Min latency (ns)": 12823409, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 51.95, "QPS w/o loadgen overhead": 51.99, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 22.37319, "characteristics.90th_percentile_latency_ns": 22373190.0, "characteristics.90th_percentile_latency_s": 0.02237319, "characteristics.90th_percentile_latency_us": 22373.19, "characteristics.accuracy": 70.33, "characteristics.good": 35165, "characteristics.power": 0.2794149824601254, "characteristics.power.normalized_per_core": 0.0023284581871677117, "characteristics.power.normalized_per_processor": 0.2794149824601254, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-large-minimalistic_224_1.0_uint8", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v3-large-minimalistic_224_1.0_uint8", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-large-minimalistic_224_1.0_uint8.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 100, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "94c099c234a20788", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 15980051, "90.00 percentile latency (ns)": 18622335, "90th percentile latency (ns)": 18622335, "95.00 percentile latency (ns)": 20189382, "97.00 percentile latency (ns)": 21596163, "99.00 percentile latency (ns)": 25275196, "99.90 percentile latency (ns)": 31415434, "Max latency (ns)": 37507761, "Mean latency (ns)": 15500332, "Min duration satisfied": "Yes", "Min latency (ns)": 10414448, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 64.46, "QPS w/o loadgen overhead": 64.51, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 18.622335, "characteristics.90th_percentile_latency_ns": 18622335.0, "characteristics.90th_percentile_latency_s": 0.018622335, "characteristics.90th_percentile_latency_us": 18622.335, "characteristics.accuracy": 67.4, "characteristics.good": 33700, "characteristics.power": 0.22421060306605892, "characteristics.power.normalized_per_core": 0.0018684216922171576, "characteristics.power.normalized_per_processor": 0.22421060306605892, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-192-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-0.75-192-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_192_75.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 58.8235, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "9c840f5b4a780dc6", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 14089794, "90.00 percentile latency (ns)": 16884121, "90th percentile latency (ns)": 16884121, "95.00 percentile latency (ns)": 17998030, "97.00 percentile latency (ns)": 19002975, "99.00 percentile latency (ns)": 21325791, "99.90 percentile latency (ns)": 26789993, "Max latency (ns)": 36270027, "Mean latency (ns)": 13346982, "Min duration satisfied": "Yes", "Min latency (ns)": 9114510, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 74.86, "QPS w/o loadgen overhead": 74.92, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 16.884121, "characteristics.90th_percentile_latency_ns": 16884121.0, "characteristics.90th_percentile_latency_s": 0.016884121, "characteristics.90th_percentile_latency_us": 16884.121, "characteristics.accuracy": 67.208, "characteristics.good": 33604, "characteristics.power": 0.19972442222842635, "characteristics.power.normalized_per_core": 0.0016643701852368862, "characteristics.power.normalized_per_processor": 0.19972442222842635, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.75-192-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-0.75-192-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.75_192_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 66.6667, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "6a290a8df1095eaf", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 8567772, "90.00 percentile latency (ns)": 12464258, "90th percentile latency (ns)": 12464258, "95.00 percentile latency (ns)": 13784093, "97.00 percentile latency (ns)": 14766151, "99.00 percentile latency (ns)": 16856141, "99.90 percentile latency (ns)": 21979679, "Max latency (ns)": 33897174, "Mean latency (ns)": 8673338, "Min duration satisfied": "Yes", "Min latency (ns)": 5023483, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 115.08, "QPS w/o loadgen overhead": 115.3, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 12.464258, "characteristics.90th_percentile_latency_ns": 12464258.0, "characteristics.90th_percentile_latency_s": 0.012464258, "characteristics.90th_percentile_latency_us": 12464.258, "characteristics.accuracy": 64.348, "characteristics.good": 32174, "characteristics.power": 0.11896194142472723, "characteristics.power.normalized_per_core": 0.0009913495118727268, "characteristics.power.normalized_per_processor": 0.11896194142472723, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.5-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-0.5-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.5_224.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 111.111, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "0493782801c591a9", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 6953929, "90.00 percentile latency (ns)": 11605453, "90th percentile latency (ns)": 11605453, "95.00 percentile latency (ns)": 12916390, "97.00 percentile latency (ns)": 13734923, "99.00 percentile latency (ns)": 15336684, "99.90 percentile latency (ns)": 20151576, "Max latency (ns)": 29972833, "Mean latency (ns)": 7291743, "Min duration satisfied": "Yes", "Min latency (ns)": 3930822, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 136.82, "QPS w/o loadgen overhead": 137.14, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 11.605453, "characteristics.90th_percentile_latency_ns": 11605453.0, "characteristics.90th_percentile_latency_s": 0.011605453, "characteristics.90th_percentile_latency_us": 11605.453, "characteristics.accuracy": 63.246, "characteristics.good": 31623, "characteristics.power": 0.09152292759936267, "characteristics.power.normalized_per_core": 0.0007626910633280223, "characteristics.power.normalized_per_processor": 0.09152292759936267, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.5-192-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-0.5-192-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.5_192.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 142.857, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "a28e4189deb49668", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 6728828, "90.00 percentile latency (ns)": 15480466, "90th percentile latency (ns)": 15480466, "95.00 percentile latency (ns)": 17199096, "97.00 percentile latency (ns)": 18036420, "99.00 percentile latency (ns)": 19414229, "99.90 percentile latency (ns)": 24941675, "Max latency (ns)": 35664764, "Mean latency (ns)": 8675916, "Min duration satisfied": "Yes", "Min latency (ns)": 4697863, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 115.0, "QPS w/o loadgen overhead": 115.26, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 15.480466, "characteristics.90th_percentile_latency_ns": 15480466.0, "characteristics.90th_percentile_latency_s": 0.015480466, "characteristics.90th_percentile_latency_us": 15480.466, "characteristics.accuracy": 61.668, "characteristics.good": 30834, "characteristics.power": 0.10083200004637524, "characteristics.power.normalized_per_core": 0.000840266667053127, "characteristics.power.normalized_per_processor": 0.10083200004637524, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-160-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-0.5-160-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.5_160.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 142.857, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "356565743f7bd1d7", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 6655356, "90.00 percentile latency (ns)": 9213251, "90th percentile latency (ns)": 9213251, "95.00 percentile latency (ns)": 10258059, "97.00 percentile latency (ns)": 11034603, "99.00 percentile latency (ns)": 13039935, "99.90 percentile latency (ns)": 19488191, "Max latency (ns)": 32487264, "Mean latency (ns)": 6898559, "Min duration satisfied": "Yes", "Min latency (ns)": 4174210, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 144.67, "QPS w/o loadgen overhead": 144.96, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 9.213251, "characteristics.90th_percentile_latency_ns": 9213251.0, "characteristics.90th_percentile_latency_s": 0.009213251, "characteristics.90th_percentile_latency_us": 9213.251, "characteristics.accuracy": 66.384, "characteristics.good": 33192, "characteristics.power": 0.10836754913481268, "characteristics.power.normalized_per_core": 0.0009030629094567723, "characteristics.power.normalized_per_processor": 0.10836754913481268, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.75-160-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-0.75-160-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.75_160.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 142.857, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "8d594414cca85435", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 8312427, "90.00 percentile latency (ns)": 13158214, "90th percentile latency (ns)": 13158214, "95.00 percentile latency (ns)": 14423214, "97.00 percentile latency (ns)": 15080963, "99.00 percentile latency (ns)": 16391725, "99.90 percentile latency (ns)": 23061924, "Max latency (ns)": 32437744, "Mean latency (ns)": 8934767, "Min duration satisfied": "Yes", "Min latency (ns)": 4638805, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 111.7, "QPS w/o loadgen overhead": 111.92, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 13.158214, "characteristics.90th_percentile_latency_ns": 13158214.0, "characteristics.90th_percentile_latency_s": 0.013158214, "characteristics.90th_percentile_latency_us": 13158.214, "characteristics.accuracy": 49.296, "characteristics.good": 24648, "characteristics.power": 0.08968545294477523, "characteristics.power.normalized_per_core": 0.0007473787745397936, "characteristics.power.normalized_per_processor": 0.08968545294477523, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-96-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-0.5-96-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_96_50.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 142.857, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "d4e909ff47e7ac45", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 13132532, "90.00 percentile latency (ns)": 19934148, "90th percentile latency (ns)": 19934148, "95.00 percentile latency (ns)": 21830851, "97.00 percentile latency (ns)": 23062500, "99.00 percentile latency (ns)": 25190971, "99.90 percentile latency (ns)": 30704542, "Max latency (ns)": 37327535, "Mean latency (ns)": 13500146, "Min duration satisfied": "Yes", "Min latency (ns)": 6714481, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 73.97, "QPS w/o loadgen overhead": 74.07, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 19.934148, "characteristics.90th_percentile_latency_ns": 19934148.0, "characteristics.90th_percentile_latency_s": 0.019934148, "characteristics.90th_percentile_latency_us": 19934.148, "characteristics.accuracy": 62.082, "characteristics.good": 31041, "characteristics.power": 0.14626810859524625, "characteristics.power.normalized_per_core": 0.0012189009049603855, "characteristics.power.normalized_per_processor": 0.14626810859524625, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-128-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-0.75-128-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_128_75.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 90.9091, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "772e4ee29aad651a", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 8981577, "90.00 percentile latency (ns)": 16223351, "90th percentile latency (ns)": 16223351, "95.00 percentile latency (ns)": 17168372, "97.00 percentile latency (ns)": 17699442, "99.00 percentile latency (ns)": 18855654, "99.90 percentile latency (ns)": 26407425, "Max latency (ns)": 40597409, "Mean latency (ns)": 9762244, "Min duration satisfied": "Yes", "Min latency (ns)": 4147517, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 102.19, "QPS w/o loadgen overhead": 102.44, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 16.223351, "characteristics.90th_percentile_latency_ns": 16223351.0, "characteristics.90th_percentile_latency_s": 0.016223351, "characteristics.90th_percentile_latency_us": 16223.351, "characteristics.accuracy": 61.224, "characteristics.good": 30612, "characteristics.power": 0.10253602625072578, "characteristics.power.normalized_per_core": 0.0008544668854227148, "characteristics.power.normalized_per_processor": 0.10253602625072578, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-96-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-1.0-96-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_1.0_96.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 142.857, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "bd0f1bd0f4797bed", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 4952592, "90.00 percentile latency (ns)": 7597833, "90th percentile latency (ns)": 7597833, "95.00 percentile latency (ns)": 8061587, "97.00 percentile latency (ns)": 8354079, "99.00 percentile latency (ns)": 9160097, "99.90 percentile latency (ns)": 15543853, "Max latency (ns)": 26729794, "Mean latency (ns)": 5155334, "Min duration satisfied": "Yes", "Min latency (ns)": 2192828, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 193.37, "QPS w/o loadgen overhead": 193.97, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 7.597833, "characteristics.90th_percentile_latency_ns": 7597833.0, "characteristics.90th_percentile_latency_s": 0.007597833, "characteristics.90th_percentile_latency_us": 7597.833, "characteristics.accuracy": 42.348, "characteristics.good": 21174, "characteristics.power": 0.047483374186809, "characteristics.power.normalized_per_core": 0.000395694784890075, "characteristics.power.normalized_per_processor": 0.047483374186809, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.25-128-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-0.25-128-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.25_128_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 250, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "e0eeb6c7d7b4cdea", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 19719265, "90.00 percentile latency (ns)": 24209468, "90th percentile latency (ns)": 24209468, "95.00 percentile latency (ns)": 26163714, "97.00 percentile latency (ns)": 27624309, "99.00 percentile latency (ns)": 30940732, "99.90 percentile latency (ns)": 36865110, "Max latency (ns)": 45531215, "Mean latency (ns)": 19093914, "Min duration satisfied": "Yes", "Min latency (ns)": 11692574, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 52.33, "QPS w/o loadgen overhead": 52.37, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 24.209468, "characteristics.90th_percentile_latency_ns": 24209468.0, "characteristics.90th_percentile_latency_s": 0.024209468, "characteristics.90th_percentile_latency_us": 24209.468, "characteristics.accuracy": 75.012, "characteristics.good": 37506, "characteristics.power": 0.33246608892838114, "characteristics.power.normalized_per_core": 0.0027705507410698427, "characteristics.power.normalized_per_processor": 0.33246608892838114, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.3-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-1.3-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_1.3_224.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 47.619, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "d0f40f09bcdf248d", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 11759745, "90.00 percentile latency (ns)": 13779228, "90th percentile latency (ns)": 13779228, "95.00 percentile latency (ns)": 14434877, "97.00 percentile latency (ns)": 15812562, "99.00 percentile latency (ns)": 19428533, "99.90 percentile latency (ns)": 26021404, "Max latency (ns)": 42721549, "Mean latency (ns)": 11554274, "Min duration satisfied": "Yes", "Min latency (ns)": 7930779, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 86.45, "QPS w/o loadgen overhead": 86.55, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 13.779228, "characteristics.90th_percentile_latency_ns": 13779228.0, "characteristics.90th_percentile_latency_s": 0.013779228, "characteristics.90th_percentile_latency_us": 13779.228, "characteristics.accuracy": 64.062, "characteristics.good": 32031, "characteristics.power": 0.16064595206176369, "characteristics.power.normalized_per_core": 0.001338716267181364, "characteristics.power.normalized_per_processor": 0.16064595206176369, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-small_224_1.0_uint8", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v3-small_224_1.0_uint8", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-small_224_1.0_uint8.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 100, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "6df2c4aca4d76a09", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 30682885, "90.00 percentile latency (ns)": 34792199, "90th percentile latency (ns)": 34792199, "95.00 percentile latency (ns)": 37222849, "97.00 percentile latency (ns)": 39734486, "99.00 percentile latency (ns)": 43286468, "99.90 percentile latency (ns)": 48818565, "Max latency (ns)": 65067644, "Mean latency (ns)": 28829886, "Min duration satisfied": "Yes", "Min latency (ns)": 18089721, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 34.67, "QPS w/o loadgen overhead": 34.69, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 34.792199, "characteristics.90th_percentile_latency_ns": 34792199.0, "characteristics.90th_percentile_latency_s": 0.034792199, "characteristics.90th_percentile_latency_us": 34792.199, "characteristics.accuracy": 77.542, "characteristics.good": 38771, "characteristics.power": 0.516139686898728, "characteristics.power.normalized_per_core": 0.0043011640574894, "characteristics.power.normalized_per_processor": 0.516139686898728, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite2-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "efficientnet-lite2-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite2.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 66.6667, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "d83ed0145c7a6a48", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 6010461, "90.00 percentile latency (ns)": 10756071, "90th percentile latency (ns)": 10756071, "95.00 percentile latency (ns)": 11920467, "97.00 percentile latency (ns)": 12613521, "99.00 percentile latency (ns)": 13718906, "99.90 percentile latency (ns)": 18756269, "Max latency (ns)": 35290755, "Mean latency (ns)": 6516395, "Min duration satisfied": "Yes", "Min latency (ns)": 3244872, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 153.15, "QPS w/o loadgen overhead": 153.46, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 10.756071, "characteristics.90th_percentile_latency_ns": 10756071.0, "characteristics.90th_percentile_latency_s": 0.010756071, "characteristics.90th_percentile_latency_us": 10756.071, "characteristics.accuracy": 56.738, "characteristics.good": 28369, "characteristics.power": 0.07068598516506482, "characteristics.power.normalized_per_core": 0.0005890498763755401, "characteristics.power.normalized_per_processor": 0.07068598516506482, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.5-128-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-0.5-128-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.5_128_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 142.857, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "902413a509af4dbd", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 10692370, "90.00 percentile latency (ns)": 16512491, "90th percentile latency (ns)": 16512491, "95.00 percentile latency (ns)": 17999407, "97.00 percentile latency (ns)": 18819831, "99.00 percentile latency (ns)": 20293247, "99.90 percentile latency (ns)": 26068104, "Max latency (ns)": 37088692, "Mean latency (ns)": 11261197, "Min duration satisfied": "Yes", "Min latency (ns)": 5632484, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 88.65, "QPS w/o loadgen overhead": 88.8, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 16.512491, "characteristics.90th_percentile_latency_ns": 16512491.0, "characteristics.90th_percentile_latency_s": 0.016512491, "characteristics.90th_percentile_latency_us": 16512.491, "characteristics.accuracy": 57.054, "characteristics.good": 28527, "characteristics.power": 0.11480529354302346, "characteristics.power.normalized_per_core": 0.0009567107795251955, "characteristics.power.normalized_per_processor": 0.11480529354302346, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-96-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-0.75-96-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_96_75.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 111.111, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "6451da1c08616b07", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 19989460, "90.00 percentile latency (ns)": 24490225, "90th percentile latency (ns)": 24490225, "95.00 percentile latency (ns)": 26612464, "97.00 percentile latency (ns)": 28232924, "99.00 percentile latency (ns)": 31409294, "99.90 percentile latency (ns)": 37952708, "Max latency (ns)": 45077012, "Mean latency (ns)": 18439733, "Min duration satisfied": "Yes", "Min latency (ns)": 12318420, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 54.19, "QPS w/o loadgen overhead": 54.23, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 24.490225, "characteristics.90th_percentile_latency_ns": 24490225.0, "characteristics.90th_percentile_latency_s": 0.024490225, "characteristics.90th_percentile_latency_us": 24490.225, "characteristics.accuracy": 75.69, "characteristics.good": 37845, "characteristics.power": 0.336757976120391, "characteristics.power.normalized_per_core": 0.002806316467669925, "characteristics.power.normalized_per_processor": 0.336757976120391, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.4-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-1.4-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_1.4_224.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 47.619, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "f6419c5d804d7680", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 8218933, "90.00 percentile latency (ns)": 12627343, "90th percentile latency (ns)": 12627343, "95.00 percentile latency (ns)": 13270231, "97.00 percentile latency (ns)": 13673185, "99.00 percentile latency (ns)": 14723282, "99.90 percentile latency (ns)": 22343941, "Max latency (ns)": 31051694, "Mean latency (ns)": 8366573, "Min duration satisfied": "Yes", "Min latency (ns)": 3510165, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 119.13, "QPS w/o loadgen overhead": 119.52, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 12.627343, "characteristics.90th_percentile_latency_ns": 12627343.0, "characteristics.90th_percentile_latency_s": 0.012627343, "characteristics.90th_percentile_latency_us": 12627.343, "characteristics.accuracy": 52.446, "characteristics.good": 26223, "characteristics.power": 0.07961057202654762, "characteristics.power.normalized_per_core": 0.0006634214335545634, "characteristics.power.normalized_per_processor": 0.07961057202654762, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-96-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-0.5-96-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.5_96.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 200, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "3383e8c6dddb7698", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 15532437, "90.00 percentile latency (ns)": 20635328, "90th percentile latency (ns)": 20635328, "95.00 percentile latency (ns)": 22184393, "97.00 percentile latency (ns)": 23955689, "99.00 percentile latency (ns)": 28053523, "99.90 percentile latency (ns)": 34332520, "Max latency (ns)": 51188034, "Mean latency (ns)": 16106030, "Min duration satisfied": "Yes", "Min latency (ns)": 11347498, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 62.03, "QPS w/o loadgen overhead": 62.09, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 20.635328, "characteristics.90th_percentile_latency_ns": 20635328.0, "characteristics.90th_percentile_latency_s": 0.020635328, "characteristics.90th_percentile_latency_us": 20635.328, "characteristics.accuracy": 73.724, "characteristics.good": 36862, "characteristics.power": 0.25815375983852096, "characteristics.power.normalized_per_core": 0.0021512813319876744, "characteristics.power.normalized_per_processor": 0.25815375983852096, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-large_224_0.75_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v3-large_224_0.75_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-large_224_0.75_float.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 100, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "1fce00e4d4fa7516", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 7745481, "90.00 percentile latency (ns)": 9936454, "90th percentile latency (ns)": 9936454, "95.00 percentile latency (ns)": 10880278, "97.00 percentile latency (ns)": 11622670, "99.00 percentile latency (ns)": 13646061, "99.90 percentile latency (ns)": 20215803, "Max latency (ns)": 40741673, "Mean latency (ns)": 7777639, "Min duration satisfied": "Yes", "Min latency (ns)": 4640168, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 128.35, "QPS w/o loadgen overhead": 128.57, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 9.936454, "characteristics.90th_percentile_latency_ns": 9936454.0, "characteristics.90th_percentile_latency_s": 0.009936454, "characteristics.90th_percentile_latency_us": 9936.454, "characteristics.accuracy": 66.604, "characteristics.good": 33302, "characteristics.power": 0.12764043309673523, "characteristics.power.normalized_per_core": 0.001063670275806127, "characteristics.power.normalized_per_processor": 0.12764043309673523, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-1.0-128-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-1.0-128-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_1.0_128.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 125, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "f5614a35ac68dd8b", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 10104410, "90.00 percentile latency (ns)": 12534049, "90th percentile latency (ns)": 12534049, "95.00 percentile latency (ns)": 13650831, "97.00 percentile latency (ns)": 14475440, "99.00 percentile latency (ns)": 16692717, "99.90 percentile latency (ns)": 22921833, "Max latency (ns)": 31015823, "Mean latency (ns)": 9883727, "Min duration satisfied": "Yes", "Min latency (ns)": 5907089, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 101.04, "QPS w/o loadgen overhead": 101.18, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 12.534049, "characteristics.90th_percentile_latency_ns": 12534049.0, "characteristics.90th_percentile_latency_s": 0.012534049, "characteristics.90th_percentile_latency_us": 12534.049, "characteristics.accuracy": 69.106, "characteristics.good": 34553, "characteristics.power": 0.1683543635673874, "characteristics.power.normalized_per_core": 0.0014029530297282283, "characteristics.power.normalized_per_processor": 0.1683543635673874, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-1.0-160-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-1.0-160-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_1.0_160.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 100, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "31849bf89568e622", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 9437371, "90.00 percentile latency (ns)": 15100576, "90th percentile latency (ns)": 15100576, "95.00 percentile latency (ns)": 15907332, "97.00 percentile latency (ns)": 16363506, "99.00 percentile latency (ns)": 17497635, "99.90 percentile latency (ns)": 24778347, "Max latency (ns)": 34367467, "Mean latency (ns)": 9722363, "Min duration satisfied": "Yes", "Min latency (ns)": 3953152, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 102.59, "QPS w/o loadgen overhead": 102.86, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 15.100576, "characteristics.90th_percentile_latency_ns": 15100576.0, "characteristics.90th_percentile_latency_s": 0.015100576, "characteristics.90th_percentile_latency_us": 15100.576, "characteristics.accuracy": 59.822, "characteristics.good": 29911, "characteristics.power": 0.09665464528810697, "characteristics.power.normalized_per_core": 0.0008054553774008914, "characteristics.power.normalized_per_processor": 0.09665464528810697, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-96-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-0.75-96-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.75_96.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 142.857, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "e9e18d1d8526ef7b", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 12898995, "90.00 percentile latency (ns)": 15371293, "90th percentile latency (ns)": 15371293, "95.00 percentile latency (ns)": 16330116, "97.00 percentile latency (ns)": 17345965, "99.00 percentile latency (ns)": 21205513, "99.90 percentile latency (ns)": 27676565, "Max latency (ns)": 43520671, "Mean latency (ns)": 12414804, "Min duration satisfied": "Yes", "Min latency (ns)": 8768201, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 80.45, "QPS w/o loadgen overhead": 80.55, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 15.371293, "characteristics.90th_percentile_latency_ns": 15371293.0, "characteristics.90th_percentile_latency_s": 0.015371293, "characteristics.90th_percentile_latency_us": 15371.293, "characteristics.accuracy": 68.336, "characteristics.good": 34168, "characteristics.power": 0.18543455455734167, "characteristics.power.normalized_per_core": 0.001545287954644514, "characteristics.power.normalized_per_processor": 0.18543455455734167, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-small_224_1.0_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v3-small_224_1.0_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-small_224_1.0_float.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 100, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "4d63b13906d30ce9", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 11994436, "90.00 percentile latency (ns)": 18886897, "90th percentile latency (ns)": 18886897, "95.00 percentile latency (ns)": 21042154, "97.00 percentile latency (ns)": 22508853, "99.00 percentile latency (ns)": 25641520, "99.90 percentile latency (ns)": 30864784, "Max latency (ns)": 41448959, "Mean latency (ns)": 12456331, "Min duration satisfied": "Yes", "Min latency (ns)": 6964140, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 80.16, "QPS w/o loadgen overhead": 80.28, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 18.886897, "characteristics.90th_percentile_latency_ns": 18886897.0, "characteristics.90th_percentile_latency_s": 0.018886897, "characteristics.90th_percentile_latency_us": 18886.897, "characteristics.accuracy": 68.834, "characteristics.good": 34417, "characteristics.power": 0.17061216444972818, "characteristics.power.normalized_per_core": 0.0014217680370810682, "characteristics.power.normalized_per_processor": 0.17061216444972818, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-192-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-0.75-192-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.75_192.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 83.3333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "391a0dc41fdba8d9", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 29522296, "90.00 percentile latency (ns)": 39275905, "90th percentile latency (ns)": 39275905, "95.00 percentile latency (ns)": 42337042, "97.00 percentile latency (ns)": 45395133, "99.00 percentile latency (ns)": 53001585, "99.90 percentile latency (ns)": 64958075, "Max latency (ns)": 77029680, "Mean latency (ns)": 32111771, "Min duration satisfied": "Yes", "Min latency (ns)": 27315107, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 31.13, "QPS w/o loadgen overhead": 31.14, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 39.275905, "characteristics.90th_percentile_latency_ns": 39275905.0, "characteristics.90th_percentile_latency_s": 0.039275905, "characteristics.90th_percentile_latency_us": 39275.905, "characteristics.accuracy": 71.254, "characteristics.good": 35627, "characteristics.power": 0.6394172542846585, "characteristics.power.normalized_per_core": 0.00532847711903882, "characteristics.power.normalized_per_processor": 0.6394172542846585, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite0-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "efficientnet-lite0-quantized", "input_data_types": "uint8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite0.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 66.6667, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "9e8f29e44458931c", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 27083021, "90.00 percentile latency (ns)": 49307993, "90th percentile latency (ns)": 49307993, "95.00 percentile latency (ns)": 51988858, "97.00 percentile latency (ns)": 54509321, "99.00 percentile latency (ns)": 59493648, "99.90 percentile latency (ns)": 66443721, "Max latency (ns)": 84040221, "Mean latency (ns)": 34796353, "Min duration satisfied": "Yes", "Min latency (ns)": 25253254, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 28.72, "QPS w/o loadgen overhead": 28.74, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 49.307993, "characteristics.90th_percentile_latency_ns": 49307993.0, "characteristics.90th_percentile_latency_s": 0.049307993, "characteristics.90th_percentile_latency_us": 49307.993, "characteristics.accuracy": 79.268, "characteristics.good": 39634, "characteristics.power": 0.6955684443717224, "characteristics.power.normalized_per_core": 0.005796403703097686, "characteristics.power.normalized_per_processor": 0.6955684443717224, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite3-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "efficientnet-lite3-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite3.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 66.6667, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "eebf44121a23747c", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 11700949, "90.00 percentile latency (ns)": 14226560, "90th percentile latency (ns)": 14226560, "95.00 percentile latency (ns)": 14928734, "97.00 percentile latency (ns)": 15892207, "99.00 percentile latency (ns)": 19714517, "99.90 percentile latency (ns)": 26789574, "Max latency (ns)": 38274528, "Mean latency (ns)": 11396542, "Min duration satisfied": "Yes", "Min latency (ns)": 8118944, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 87.64, "QPS w/o loadgen overhead": 87.75, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 14.22656, "characteristics.90th_percentile_latency_ns": 14226560.0, "characteristics.90th_percentile_latency_s": 0.01422656, "characteristics.90th_percentile_latency_us": 14226.56, "characteristics.accuracy": 66.216, "characteristics.good": 33108, "characteristics.power": 0.16715047561233956, "characteristics.power.normalized_per_core": 0.0013929206301028297, "characteristics.power.normalized_per_processor": 0.16715047561233956, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-small_224_0.75_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v3-small_224_0.75_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-small_224_0.75_float.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 100, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "c943058b35adb709", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 87686447, "90.00 percentile latency (ns)": 104488814, "90th percentile latency (ns)": 104488814, "95.00 percentile latency (ns)": 110928094, "97.00 percentile latency (ns)": 118204491, "99.00 percentile latency (ns)": 134703492, "99.90 percentile latency (ns)": 149362659, "Max latency (ns)": 162126919, "Mean latency (ns)": 92041210, "Min duration satisfied": "Yes", "Min latency (ns)": 85916368, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 10.86, "QPS w/o loadgen overhead": 10.86, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 104.488814, "characteristics.90th_percentile_latency_ns": 104488814.0, "characteristics.90th_percentile_latency_s": 0.104488814, "characteristics.90th_percentile_latency_us": 104488.814, "characteristics.accuracy": 76.348, "characteristics.good": 38174, "characteristics.power": 1.8549569950873448, "characteristics.power.normalized_per_core": 0.015457974959061207, "characteristics.power.normalized_per_processor": 1.8549569950873448, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite3-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "efficientnet-lite3-quantized", "input_data_types": "uint8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite3.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 66.6667, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "c9d1cc41e689aaf5", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 10295678, "90.00 percentile latency (ns)": 17612079, "90th percentile latency (ns)": 17612079, "95.00 percentile latency (ns)": 19377658, "97.00 percentile latency (ns)": 20335198, "99.00 percentile latency (ns)": 21876453, "99.90 percentile latency (ns)": 27738730, "Max latency (ns)": 39381539, "Mean latency (ns)": 11158406, "Min duration satisfied": "Yes", "Min latency (ns)": 6066265, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 89.48, "QPS w/o loadgen overhead": 89.62, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 17.612079, "characteristics.90th_percentile_latency_ns": 17612079.0, "characteristics.90th_percentile_latency_s": 0.017612079, "characteristics.90th_percentile_latency_us": 17612.079, "characteristics.accuracy": 54.504, "characteristics.good": 27252, "characteristics.power": 0.12058235949954044, "characteristics.power.normalized_per_core": 0.0010048529958295036, "characteristics.power.normalized_per_processor": 0.12058235949954044, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-160-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-0.35-160-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_160_35.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 111.111, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "b69a7acff24f89d9", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 4850387, "90.00 percentile latency (ns)": 7905178, "90th percentile latency (ns)": 7905178, "95.00 percentile latency (ns)": 8778825, "97.00 percentile latency (ns)": 9332885, "99.00 percentile latency (ns)": 10518793, "99.90 percentile latency (ns)": 16128796, "Max latency (ns)": 25272009, "Mean latency (ns)": 5305515, "Min duration satisfied": "Yes", "Min latency (ns)": 2809721, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 187.98, "QPS w/o loadgen overhead": 188.48, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 7.905178, "characteristics.90th_percentile_latency_ns": 7905178.0, "characteristics.90th_percentile_latency_s": 0.007905178, "characteristics.90th_percentile_latency_us": 7905.178, "characteristics.accuracy": 49.478, "characteristics.good": 24739, "characteristics.power": 0.05896867785213476, "characteristics.power.normalized_per_core": 0.0004914056487677897, "characteristics.power.normalized_per_processor": 0.05896867785213476, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.25-192-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-0.25-192-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.25_192.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 200, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "644adf859ef4e973", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 12600869, "90.00 percentile latency (ns)": 20808840, "90th percentile latency (ns)": 20808840, "95.00 percentile latency (ns)": 22081478, "97.00 percentile latency (ns)": 23060815, "99.00 percentile latency (ns)": 25536764, "99.90 percentile latency (ns)": 31097420, "Max latency (ns)": 42036796, "Mean latency (ns)": 14913722, "Min duration satisfied": "Yes", "Min latency (ns)": 11160210, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 67.0, "QPS w/o loadgen overhead": 67.05, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 20.80884, "characteristics.90th_percentile_latency_ns": 20808840.0, "characteristics.90th_percentile_latency_s": 0.02080884, "characteristics.90th_percentile_latency_us": 20808.84, "characteristics.accuracy": 68.124, "characteristics.good": 34062, "characteristics.power": 0.24051813089989313, "characteristics.power.normalized_per_core": 0.0020043177574991093, "characteristics.power.normalized_per_processor": 0.24051813089989313, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.75-224-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-0.75-224-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.75_224_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 66.6667, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "1b41febe67092c1e", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 14847537, "90.00 percentile latency (ns)": 23767686, "90th percentile latency (ns)": 23767686, "95.00 percentile latency (ns)": 25586518, "97.00 percentile latency (ns)": 27621324, "99.00 percentile latency (ns)": 31785471, "99.90 percentile latency (ns)": 38084326, "Max latency (ns)": 49048020, "Mean latency (ns)": 18236892, "Min duration satisfied": "Yes", "Min latency (ns)": 13029893, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 54.79, "QPS w/o loadgen overhead": 54.83, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 23.767686, "characteristics.90th_percentile_latency_ns": 23767686.0, "characteristics.90th_percentile_latency_s": 0.023767686, "characteristics.90th_percentile_latency_us": 23767.686, "characteristics.accuracy": 75.76, "characteristics.good": 37880, "characteristics.power": 0.30125536250242607, "characteristics.power.normalized_per_core": 0.002510461354186884, "characteristics.power.normalized_per_processor": 0.30125536250242607, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-large_224_1.0_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v3-large_224_1.0_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-large_224_1.0_float.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 100, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "4ed59d93fa4222a0", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 11799930, "90.00 percentile latency (ns)": 20075981, "90th percentile latency (ns)": 20075981, "95.00 percentile latency (ns)": 21976575, "97.00 percentile latency (ns)": 23093602, "99.00 percentile latency (ns)": 25017296, "99.90 percentile latency (ns)": 30699357, "Max latency (ns)": 48894558, "Mean latency (ns)": 12554551, "Min duration satisfied": "Yes", "Min latency (ns)": 6036492, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 79.51, "QPS w/o loadgen overhead": 79.65, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 20.075981, "characteristics.90th_percentile_latency_ns": 20075981.0, "characteristics.90th_percentile_latency_s": 0.020075981, "characteristics.90th_percentile_latency_us": 20075.981, "characteristics.accuracy": 65.75, "characteristics.good": 32875, "characteristics.power": 0.14585342929929998, "characteristics.power.normalized_per_core": 0.0012154452441608332, "characteristics.power.normalized_per_processor": 0.14585342929929998, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-0.5-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.5_224.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 100, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "71ca8674066ba096", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 12408211, "90.00 percentile latency (ns)": 14734168, "90th percentile latency (ns)": 14734168, "95.00 percentile latency (ns)": 15848200, "97.00 percentile latency (ns)": 16659306, "99.00 percentile latency (ns)": 19002830, "99.90 percentile latency (ns)": 24906860, "Max latency (ns)": 32794974, "Mean latency (ns)": 12467659, "Min duration satisfied": "Yes", "Min latency (ns)": 7373053, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 80.13, "QPS w/o loadgen overhead": 80.21, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 14.734168, "characteristics.90th_percentile_latency_ns": 14734168.0, "characteristics.90th_percentile_latency_s": 0.014734168, "characteristics.90th_percentile_latency_us": 14734.168, "characteristics.accuracy": 64.766, "characteristics.good": 32383, "characteristics.power": 0.17309241809168824, "characteristics.power.normalized_per_core": 0.0014424368174307354, "characteristics.power.normalized_per_processor": 0.17309241809168824, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-1.0-128-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-1.0-128-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_1.0_128_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 76.9231, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "e7a4078be59f381a", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 13889707, "90.00 percentile latency (ns)": 19743511, "90th percentile latency (ns)": 19743511, "95.00 percentile latency (ns)": 21708109, "97.00 percentile latency (ns)": 23020953, "99.00 percentile latency (ns)": 25914324, "99.90 percentile latency (ns)": 32189641, "Max latency (ns)": 40929992, "Mean latency (ns)": 14088362, "Min duration satisfied": "Yes", "Min latency (ns)": 8254116, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 70.89, "QPS w/o loadgen overhead": 70.98, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 19.743511, "characteristics.90th_percentile_latency_ns": 19743511.0, "characteristics.90th_percentile_latency_s": 0.019743511, "characteristics.90th_percentile_latency_us": 19743.511, "characteristics.accuracy": 70.122, "characteristics.good": 35061, "characteristics.power": 0.210257694269882, "characteristics.power.normalized_per_core": 0.0017521474522490166, "characteristics.power.normalized_per_processor": 0.210257694269882, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-0.75-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.75_224.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 76.9231, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "1c9b540139a4d863", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 10883087, "90.00 percentile latency (ns)": 12784177, "90th percentile latency (ns)": 12784177, "95.00 percentile latency (ns)": 13809394, "97.00 percentile latency (ns)": 14669286, "99.00 percentile latency (ns)": 17163106, "99.90 percentile latency (ns)": 23151734, "Max latency (ns)": 26638585, "Mean latency (ns)": 10170743, "Min duration satisfied": "Yes", "Min latency (ns)": 6828408, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 98.23, "QPS w/o loadgen overhead": 98.32, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 12.784177, "characteristics.90th_percentile_latency_ns": 12784177.0, "characteristics.90th_percentile_latency_s": 0.012784177, "characteristics.90th_percentile_latency_us": 12784.177, "characteristics.accuracy": 64.128, "characteristics.good": 32064, "characteristics.power": 0.1494889615768468, "characteristics.power.normalized_per_core": 0.0012457413464737233, "characteristics.power.normalized_per_processor": 0.1494889615768468, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.75-160-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-0.75-160-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.75_160_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 83.3333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "04a8aefa4a268d92", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 9645589, "90.00 percentile latency (ns)": 17905724, "90th percentile latency (ns)": 17905724, "95.00 percentile latency (ns)": 19645245, "97.00 percentile latency (ns)": 20643895, "99.00 percentile latency (ns)": 22260366, "99.90 percentile latency (ns)": 27634674, "Max latency (ns)": 37594544, "Mean latency (ns)": 10766854, "Min duration satisfied": "Yes", "Min latency (ns)": 5336570, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 92.7, "QPS w/o loadgen overhead": 92.88, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 17.905724, "characteristics.90th_percentile_latency_ns": 17905724.0, "characteristics.90th_percentile_latency_s": 0.017905724, "characteristics.90th_percentile_latency_us": 17905.724, "characteristics.accuracy": 64.282, "characteristics.good": 32141, "characteristics.power": 0.12264577707920471, "characteristics.power.normalized_per_core": 0.001022048142326706, "characteristics.power.normalized_per_processor": 0.12264577707920471, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-192-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-0.5-192-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.5_192.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 125, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "149679227c5b0299", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 12386914, "90.00 percentile latency (ns)": 15087873, "90th percentile latency (ns)": 15087873, "95.00 percentile latency (ns)": 15962956, "97.00 percentile latency (ns)": 16917449, "99.00 percentile latency (ns)": 20194603, "99.90 percentile latency (ns)": 26137350, "Max latency (ns)": 35598802, "Mean latency (ns)": 12353549, "Min duration satisfied": "Yes", "Min latency (ns)": 7862671, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 80.84, "QPS w/o loadgen overhead": 80.95, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 15.087873, "characteristics.90th_percentile_latency_ns": 15087873.0, "characteristics.90th_percentile_latency_s": 0.015087873, "characteristics.90th_percentile_latency_us": 15087.873, "characteristics.accuracy": 72.678, "characteristics.good": 36339, "characteristics.power": 0.19631371598178712, "characteristics.power.normalized_per_core": 0.0016359476331815593, "characteristics.power.normalized_per_processor": 0.19631371598178712, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-large-minimalistic_224_1.0_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v3-large-minimalistic_224_1.0_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-large-minimalistic_224_1.0_float.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 100, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "0b0304d4b95920dc", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 12596121, "90.00 percentile latency (ns)": 15290958, "90th percentile latency (ns)": 15290958, "95.00 percentile latency (ns)": 16760870, "97.00 percentile latency (ns)": 18043262, "99.00 percentile latency (ns)": 21356477, "99.90 percentile latency (ns)": 27168513, "Max latency (ns)": 40830782, "Mean latency (ns)": 12029284, "Min duration satisfied": "Yes", "Min latency (ns)": 8415734, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 83.04, "QPS w/o loadgen overhead": 83.13, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 15.290958, "characteristics.90th_percentile_latency_ns": 15290958.0, "characteristics.90th_percentile_latency_s": 0.015290958, "characteristics.90th_percentile_latency_us": 15290.958, "characteristics.accuracy": 65.004, "characteristics.good": 32502, "characteristics.power": 0.1731687119901192, "characteristics.power.normalized_per_core": 0.0014430725999176601, "characteristics.power.normalized_per_processor": 0.1731687119901192, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-160-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-0.75-160-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_160_75.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 76.9231, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "b4d936ff4cceb48c", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 14655680, "90.00 percentile latency (ns)": 19421984, "90th percentile latency (ns)": 19421984, "95.00 percentile latency (ns)": 21406057, "97.00 percentile latency (ns)": 22819220, "99.00 percentile latency (ns)": 25854705, "99.90 percentile latency (ns)": 31995960, "Max latency (ns)": 44052452, "Mean latency (ns)": 14823898, "Min duration satisfied": "Yes", "Min latency (ns)": 9186931, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 67.39, "QPS w/o loadgen overhead": 67.46, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 19.421984, "characteristics.90th_percentile_latency_ns": 19421984.0, "characteristics.90th_percentile_latency_s": 0.019421984, "characteristics.90th_percentile_latency_us": 19421.984, "characteristics.accuracy": 71.77, "characteristics.good": 35885, "characteristics.power": 0.240555960346633, "characteristics.power.normalized_per_core": 0.0020046330028886086, "characteristics.power.normalized_per_processor": 0.240555960346633, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-1.0-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_1.0_224.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 66.6667, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "1471247e49d3e1af", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 10183070, "90.00 percentile latency (ns)": 17300442, "90th percentile latency (ns)": 17300442, "95.00 percentile latency (ns)": 19605475, "97.00 percentile latency (ns)": 21083219, "99.00 percentile latency (ns)": 23597920, "99.90 percentile latency (ns)": 29291756, "Max latency (ns)": 36881120, "Mean latency (ns)": 10983925, "Min duration satisfied": "Yes", "Min latency (ns)": 5810252, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 90.89, "QPS w/o loadgen overhead": 91.04, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 17.300442, "characteristics.90th_percentile_latency_ns": 17300442.0, "characteristics.90th_percentile_latency_s": 0.017300442, "characteristics.90th_percentile_latency_us": 17300.442, "characteristics.accuracy": 66.75, "characteristics.good": 33375, "characteristics.power": 0.14151065534839616, "characteristics.power.normalized_per_core": 0.0011792554612366348, "characteristics.power.normalized_per_processor": 0.14151065534839616, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-160-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-0.75-160-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.75_160.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 100, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "c589e69a2950dc9d", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 6093970, "90.00 percentile latency (ns)": 10891093, "90th percentile latency (ns)": 10891093, "95.00 percentile latency (ns)": 11635021, "97.00 percentile latency (ns)": 12051141, "99.00 percentile latency (ns)": 12974913, "99.90 percentile latency (ns)": 20249160, "Max latency (ns)": 39859328, "Mean latency (ns)": 6777900, "Min duration satisfied": "Yes", "Min latency (ns)": 3185683, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 147.09, "QPS w/o loadgen overhead": 147.54, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 10.891093, "characteristics.90th_percentile_latency_ns": 10891093.0, "characteristics.90th_percentile_latency_s": 0.010891093, "characteristics.90th_percentile_latency_us": 10891.093, "characteristics.accuracy": 47.14, "characteristics.good": 23570, "characteristics.power": 0.06778703867368253, "characteristics.power.normalized_per_core": 0.0005648919889473544, "characteristics.power.normalized_per_processor": 0.06778703867368253, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-96-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-0.35-96-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.35_96.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 200, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "9eeacbe0412fb0bb", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 7857212, "90.00 percentile latency (ns)": 13487044, "90th percentile latency (ns)": 13487044, "95.00 percentile latency (ns)": 15007938, "97.00 percentile latency (ns)": 15813474, "99.00 percentile latency (ns)": 17269725, "99.90 percentile latency (ns)": 23649727, "Max latency (ns)": 32825460, "Mean latency (ns)": 8684085, "Min duration satisfied": "Yes", "Min latency (ns)": 4324721, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 114.88, "QPS w/o loadgen overhead": 115.15, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 13.487044, "characteristics.90th_percentile_latency_ns": 13487044.0, "characteristics.90th_percentile_latency_s": 0.013487044, "characteristics.90th_percentile_latency_us": 13487.044, "characteristics.accuracy": 56.988, "characteristics.good": 28494, "characteristics.power": 0.09406033384689932, "characteristics.power.normalized_per_core": 0.0007838361153908277, "characteristics.power.normalized_per_processor": 0.09406033384689932, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-160-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-0.35-160-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.35_160.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 166.667, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "51e71b13cc73469f", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 6050816, "90.00 percentile latency (ns)": 9564182, "90th percentile latency (ns)": 9564182, "95.00 percentile latency (ns)": 10878509, "97.00 percentile latency (ns)": 11809780, "99.00 percentile latency (ns)": 13629473, "99.90 percentile latency (ns)": 19156490, "Max latency (ns)": 27042139, "Mean latency (ns)": 6402536, "Min duration satisfied": "Yes", "Min latency (ns)": 3183430, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 155.76, "QPS w/o loadgen overhead": 156.19, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 9.564182, "characteristics.90th_percentile_latency_ns": 9564182.0, "characteristics.90th_percentile_latency_s": 0.009564182, "characteristics.90th_percentile_latency_us": 9564.182, "characteristics.accuracy": 63.716, "characteristics.good": 31858, "characteristics.power": 0.0838335591036811, "characteristics.power.normalized_per_core": 0.0006986129925306757, "characteristics.power.normalized_per_processor": 0.0838335591036811, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.75-128-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-0.75-128-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.75_128.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 166.667, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "72cbe0eb44bb794c", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 9420405, "90.00 percentile latency (ns)": 16005155, "90th percentile latency (ns)": 16005155, "95.00 percentile latency (ns)": 17550499, "97.00 percentile latency (ns)": 18343318, "99.00 percentile latency (ns)": 19564749, "99.90 percentile latency (ns)": 25011149, "Max latency (ns)": 34015626, "Mean latency (ns)": 10219255, "Min duration satisfied": "Yes", "Min latency (ns)": 5425590, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 97.69, "QPS w/o loadgen overhead": 97.85, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 16.005155, "characteristics.90th_percentile_latency_ns": 16005155.0, "characteristics.90th_percentile_latency_s": 0.016005155, "characteristics.90th_percentile_latency_us": 16005.155, "characteristics.accuracy": 55.51, "characteristics.good": 27755, "characteristics.power": 0.10617015395954478, "characteristics.power.normalized_per_core": 0.0008847512829962065, "characteristics.power.normalized_per_processor": 0.10617015395954478, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-128-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-0.5-128-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_128_50.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 125, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "34519b3553f57cc1", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 8415385, "90.00 percentile latency (ns)": 14793222, "90th percentile latency (ns)": 14793222, "95.00 percentile latency (ns)": 16483995, "97.00 percentile latency (ns)": 17565591, "99.00 percentile latency (ns)": 19298008, "99.90 percentile latency (ns)": 25717747, "Max latency (ns)": 35524418, "Mean latency (ns)": 9349264, "Min duration satisfied": "Yes", "Min latency (ns)": 4930188, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 106.74, "QPS w/o loadgen overhead": 106.96, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 14.793222, "characteristics.90th_percentile_latency_ns": 14793222.0, "characteristics.90th_percentile_latency_s": 0.014793222, "characteristics.90th_percentile_latency_us": 14793.222, "characteristics.accuracy": 59.322, "characteristics.good": 29661, "characteristics.power": 0.10577332658784426, "characteristics.power.normalized_per_core": 0.0008814443882320355, "characteristics.power.normalized_per_processor": 0.10577332658784426, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-192-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-0.35-192-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.35_192.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 125, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "d43928b28087b0c1", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 5935910, "90.00 percentile latency (ns)": 8821082, "90th percentile latency (ns)": 8821082, "95.00 percentile latency (ns)": 10439943, "97.00 percentile latency (ns)": 11471101, "99.00 percentile latency (ns)": 14846180, "99.90 percentile latency (ns)": 63162865, "Max latency (ns)": 77892953, "Mean latency (ns)": 6800045, "Min duration satisfied": "Yes", "Min latency (ns)": 5453908, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 146.65, "QPS w/o loadgen overhead": 147.06, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 8.821082, "characteristics.90th_percentile_latency_ns": 8821082.0, "characteristics.90th_percentile_latency_s": 0.008821082, "characteristics.90th_percentile_latency_us": 8821.082, "characteristics.accuracy": 68.242, "characteristics.good": 34121, "characteristics.power": 0.17531582273014484, "characteristics.power.normalized_per_core": 0.0014609651894178738, "characteristics.power.normalized_per_processor": 0.17531582273014484, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.75-192-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-0.75-192-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.75_192.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 200, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "12f3e4b579af00ca", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 7387225, "90.00 percentile latency (ns)": 11862205, "90th percentile latency (ns)": 11862205, "95.00 percentile latency (ns)": 13461935, "97.00 percentile latency (ns)": 14389471, "99.00 percentile latency (ns)": 21674194, "99.90 percentile latency (ns)": 80755131, "Max latency (ns)": 134672284, "Mean latency (ns)": 8704766, "Min duration satisfied": "Yes", "Min latency (ns)": 6555471, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 114.61, "QPS w/o loadgen overhead": 114.88, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 11.862205, "characteristics.90th_percentile_latency_ns": 11862205.0, "characteristics.90th_percentile_latency_s": 0.011862205, "characteristics.90th_percentile_latency_us": 11862.205, "characteristics.accuracy": 70.738, "characteristics.good": 35369, "characteristics.power": 0.21944090581227585, "characteristics.power.normalized_per_core": 0.0018286742151022988, "characteristics.power.normalized_per_processor": 0.21944090581227585, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-192-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-1.0-192-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_1.0_192.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "db8be5f90945b22b", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 75243435, "90.00 percentile latency (ns)": 86725299, "90th percentile latency (ns)": 86725299, "95.00 percentile latency (ns)": 89973198, "97.00 percentile latency (ns)": 93919483, "99.00 percentile latency (ns)": 109025993, "99.90 percentile latency (ns)": 152441451, "Max latency (ns)": 167181661, "Mean latency (ns)": 78134307, "Min duration satisfied": "Yes", "Min latency (ns)": 68546254, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 12.8, "QPS w/o loadgen overhead": 12.8, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 86.725299, "characteristics.90th_percentile_latency_ns": 86725299.0, "characteristics.90th_percentile_latency_s": 0.086725299, "characteristics.90th_percentile_latency_us": 86725.299, "characteristics.accuracy": 78.514, "characteristics.good": 39257, "characteristics.power": 1.6603526755178284, "characteristics.power.normalized_per_core": 0.013836272295981904, "characteristics.power.normalized_per_processor": 1.6603526755178284, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite4-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "efficientnet-lite4-quantized", "input_data_types": "uint8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite4.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 50, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "2ab6143e794b0c57", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 6774996, "90.00 percentile latency (ns)": 10172041, "90th percentile latency (ns)": 10172041, "95.00 percentile latency (ns)": 12683409, "97.00 percentile latency (ns)": 13761691, "99.00 percentile latency (ns)": 16649121, "99.90 percentile latency (ns)": 68859475, "Max latency (ns)": 132311713, "Mean latency (ns)": 7716165, "Min duration satisfied": "Yes", "Min latency (ns)": 5969775, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 129.44, "QPS w/o loadgen overhead": 129.6, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 10.172041, "characteristics.90th_percentile_latency_ns": 10172041.0, "characteristics.90th_percentile_latency_s": 0.010172041, "characteristics.90th_percentile_latency_us": 10172.041, "characteristics.accuracy": 63.542, "characteristics.good": 31771, "characteristics.power": 0.15697650464035962, "characteristics.power.normalized_per_core": 0.0013081375386696634, "characteristics.power.normalized_per_processor": 0.15697650464035962, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-224-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-0.5-224-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_224_50.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "d1945c3b910fa71e", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 2004023, "90.00 percentile latency (ns)": 2303044, "90th percentile latency (ns)": 2303044, "95.00 percentile latency (ns)": 2830940, "97.00 percentile latency (ns)": 3460407, "99.00 percentile latency (ns)": 5508911, "99.90 percentile latency (ns)": 24756120, "Max latency (ns)": 138200814, "Mean latency (ns)": 2206973, "Min duration satisfied": "Yes", "Min latency (ns)": 1673640, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 451.37, "QPS w/o loadgen overhead": 453.11, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 2.303044, "characteristics.90th_percentile_latency_ns": 2303044.0, "characteristics.90th_percentile_latency_s": 0.002303044, "characteristics.90th_percentile_latency_us": 2303.044, "characteristics.accuracy": 52.172, "characteristics.good": 26086, "characteristics.power": 0.05008112375415777, "characteristics.power.normalized_per_core": 0.00041734269795131476, "characteristics.power.normalized_per_processor": 0.05008112375415777, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-128-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-0.35-128-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.35_128.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "42458a2f243385e8", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 2312751, "90.00 percentile latency (ns)": 2690979, "90th percentile latency (ns)": 2690979, "95.00 percentile latency (ns)": 3341601, "97.00 percentile latency (ns)": 4109281, "99.00 percentile latency (ns)": 6640792, "99.90 percentile latency (ns)": 27254171, "Max latency (ns)": 135076480, "Mean latency (ns)": 2559402, "Min duration satisfied": "Yes", "Min latency (ns)": 1979805, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 388.89, "QPS w/o loadgen overhead": 390.72, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 2.690979, "characteristics.90th_percentile_latency_ns": 2690979.0, "characteristics.90th_percentile_latency_s": 0.002690979, "characteristics.90th_percentile_latency_us": 2690.979, "characteristics.accuracy": 58.402, "characteristics.good": 29201, "characteristics.power": 0.059463551778375, "characteristics.power.normalized_per_core": 0.000495529598153125, "characteristics.power.normalized_per_processor": 0.059463551778375, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-128-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-0.5-128-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.5_128.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "268f3245a4789b1d", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 4347462, "90.00 percentile latency (ns)": 5140074, "90th percentile latency (ns)": 5140074, "95.00 percentile latency (ns)": 6157370, "97.00 percentile latency (ns)": 7285293, "99.00 percentile latency (ns)": 10902964, "99.90 percentile latency (ns)": 46317558, "Max latency (ns)": 142162752, "Mean latency (ns)": 4747547, "Min duration satisfied": "Yes", "Min latency (ns)": 3890001, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 209.84, "QPS w/o loadgen overhead": 210.64, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 5.140074, "characteristics.90th_percentile_latency_ns": 5140074.0, "characteristics.90th_percentile_latency_s": 0.005140074, "characteristics.90th_percentile_latency_us": 5140.074, "characteristics.accuracy": 60.976, "characteristics.good": 30488, "characteristics.power": 0.11321546856012765, "characteristics.power.normalized_per_core": 0.0009434622380010638, "characteristics.power.normalized_per_processor": 0.11321546856012765, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-0.35-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.35_224.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "d7a04e46b291e834", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 2678012, "90.00 percentile latency (ns)": 3148048, "90th percentile latency (ns)": 3148048, "95.00 percentile latency (ns)": 3924948, "97.00 percentile latency (ns)": 4699321, "99.00 percentile latency (ns)": 7627039, "99.90 percentile latency (ns)": 35090875, "Max latency (ns)": 75700786, "Mean latency (ns)": 2948521, "Min duration satisfied": "Yes", "Min latency (ns)": 2251909, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 338.44, "QPS w/o loadgen overhead": 339.15, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 3.148048, "characteristics.90th_percentile_latency_ns": 3148048.0, "characteristics.90th_percentile_latency_s": 0.003148048, "characteristics.90th_percentile_latency_us": 3148.048, "characteristics.accuracy": 48.162, "characteristics.good": 24081, "characteristics.power": 0.05846142178675759, "characteristics.power.normalized_per_core": 0.0004871785148896466, "characteristics.power.normalized_per_processor": 0.05846142178675759, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.25-192-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-0.25-192-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.25_192_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 500, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "72259daf4f8b9f54", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 12049130, "90.00 percentile latency (ns)": 14287235, "90th percentile latency (ns)": 14287235, "95.00 percentile latency (ns)": 18307725, "97.00 percentile latency (ns)": 19320947, "99.00 percentile latency (ns)": 26441360, "99.90 percentile latency (ns)": 68461158, "Max latency (ns)": 117024350, "Mean latency (ns)": 12725958, "Min duration satisfied": "Yes", "Min latency (ns)": 9931690, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 78.46, "QPS w/o loadgen overhead": 78.58, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 14.287235, "characteristics.90th_percentile_latency_ns": 14287235.0, "characteristics.90th_percentile_latency_s": 0.014287235, "characteristics.90th_percentile_latency_us": 14287.235, "characteristics.accuracy": 75.068, "characteristics.good": 37534, "characteristics.power": 0.3385805714334268, "characteristics.power.normalized_per_core": 0.0028215047619452233, "characteristics.power.normalized_per_processor": 0.3385805714334268, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite0-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "efficientnet-lite0-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite0.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 50, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "3ec4b84a17bb9c10", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 3086158, "90.00 percentile latency (ns)": 3818800, "90th percentile latency (ns)": 3818800, "95.00 percentile latency (ns)": 4862211, "97.00 percentile latency (ns)": 5905551, "99.00 percentile latency (ns)": 8764824, "99.90 percentile latency (ns)": 42552336, "Max latency (ns)": 80273167, "Mean latency (ns)": 3402604, "Min duration satisfied": "Yes", "Min latency (ns)": 2585241, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 293.41, "QPS w/o loadgen overhead": 293.89, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 3.8188, "characteristics.90th_percentile_latency_ns": 3818800.0, "characteristics.90th_percentile_latency_s": 0.0038188, "characteristics.90th_percentile_latency_us": 3818.8, "characteristics.accuracy": 50.242, "characteristics.good": 25121, "characteristics.power": 0.06820041352828235, "characteristics.power.normalized_per_core": 0.0005683367794023529, "characteristics.power.normalized_per_processor": 0.06820041352828235, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.25-224-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-0.25-224-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.25_224_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 500, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "c20354009957a58a", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 2825661, "90.00 percentile latency (ns)": 3094634, "90th percentile latency (ns)": 3094634, "95.00 percentile latency (ns)": 3338741, "97.00 percentile latency (ns)": 4025266, "99.00 percentile latency (ns)": 6713771, "99.90 percentile latency (ns)": 30102933, "Max latency (ns)": 88748386, "Mean latency (ns)": 3032182, "Min duration satisfied": "Yes", "Min latency (ns)": 2574322, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 328.37, "QPS w/o loadgen overhead": 329.8, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 3.094634, "characteristics.90th_percentile_latency_ns": 3094634.0, "characteristics.90th_percentile_latency_s": 0.003094634, "characteristics.90th_percentile_latency_us": 3094.634, "characteristics.accuracy": 60.842, "characteristics.good": 30421, "characteristics.power": 0.07566949172328459, "characteristics.power.normalized_per_core": 0.0006305790976940382, "characteristics.power.normalized_per_processor": 0.07566949172328459, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.5-160-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-0.5-160-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.5_160.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 200, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "a47328cde011d0dd", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 5749243, "90.00 percentile latency (ns)": 6680630, "90th percentile latency (ns)": 6680630, "95.00 percentile latency (ns)": 7778289, "97.00 percentile latency (ns)": 9178566, "99.00 percentile latency (ns)": 13542223, "99.90 percentile latency (ns)": 67815831, "Max latency (ns)": 129020392, "Mean latency (ns)": 6237201, "Min duration satisfied": "Yes", "Min latency (ns)": 5069019, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 159.86, "QPS w/o loadgen overhead": 160.33, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 6.68063, "characteristics.90th_percentile_latency_ns": 6680630.0, "characteristics.90th_percentile_latency_s": 0.00668063, "characteristics.90th_percentile_latency_us": 6680.63, "characteristics.accuracy": 69.016, "characteristics.good": 34508, "characteristics.power": 0.1592659201801576, "characteristics.power.normalized_per_core": 0.0013272160015013132, "characteristics.power.normalized_per_processor": 0.1592659201801576, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-160-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-1.0-160-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_1.0_160.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "f384e48d498ab40b", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 21024352, "90.00 percentile latency (ns)": 29427836, "90th percentile latency (ns)": 29427836, "95.00 percentile latency (ns)": 31514149, "97.00 percentile latency (ns)": 33240893, "99.00 percentile latency (ns)": 41130339, "99.90 percentile latency (ns)": 88365544, "Max latency (ns)": 123857685, "Mean latency (ns)": 23467361, "Min duration satisfied": "Yes", "Min latency (ns)": 19119026, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 42.58, "QPS w/o loadgen overhead": 42.61, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 29.427836, "characteristics.90th_percentile_latency_ns": 29427836.0, "characteristics.90th_percentile_latency_s": 0.029427836, "characteristics.90th_percentile_latency_us": 29427.836, "characteristics.accuracy": 74.098, "characteristics.good": 37049, "characteristics.power": 0.492756550102975, "characteristics.power.normalized_per_core": 0.004106304584191458, "characteristics.power.normalized_per_processor": 0.492756550102975, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite1-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "efficientnet-lite1-quantized", "input_data_types": "uint8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite1.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 50, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "61368c0ebc4f9db9", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 5403260, "90.00 percentile latency (ns)": 7857300, "90th percentile latency (ns)": 7857300, "95.00 percentile latency (ns)": 9893930, "97.00 percentile latency (ns)": 11460684, "99.00 percentile latency (ns)": 13595318, "99.90 percentile latency (ns)": 67005467, "Max latency (ns)": 145301465, "Mean latency (ns)": 6190484, "Min duration satisfied": "Yes", "Min latency (ns)": 4762398, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 161.32, "QPS w/o loadgen overhead": 161.54, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 7.8573, "characteristics.90th_percentile_latency_ns": 7857300.0, "characteristics.90th_percentile_latency_s": 0.0078573, "characteristics.90th_percentile_latency_us": 7857.3, "characteristics.accuracy": 61.924, "characteristics.good": 30962, "characteristics.power": 0.12303955600737235, "characteristics.power.normalized_per_core": 0.0010253296333947695, "characteristics.power.normalized_per_processor": 0.12303955600737235, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-192-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-0.5-192-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_192_50.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "c540a762c4a10be3", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 5363837, "90.00 percentile latency (ns)": 7716829, "90th percentile latency (ns)": 7716829, "95.00 percentile latency (ns)": 10594927, "97.00 percentile latency (ns)": 11688218, "99.00 percentile latency (ns)": 13198615, "99.90 percentile latency (ns)": 31086166, "Max latency (ns)": 75871605, "Mean latency (ns)": 6051837, "Min duration satisfied": "Yes", "Min latency (ns)": 4992792, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 165.05, "QPS w/o loadgen overhead": 165.24, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 7.716829, "characteristics.90th_percentile_latency_ns": 7716829.0, "characteristics.90th_percentile_latency_s": 0.007716829, "characteristics.90th_percentile_latency_us": 7716.829, "characteristics.accuracy": 62.298, "characteristics.good": 31149, "characteristics.power": 0.12267514071237748, "characteristics.power.normalized_per_core": 0.0010222928392698122, "characteristics.power.normalized_per_processor": 0.12267514071237748, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.5-224-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-0.5-224-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.5_224_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 200, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "1997d8dc56a877fb", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 2733655, "90.00 percentile latency (ns)": 3013443, "90th percentile latency (ns)": 3013443, "95.00 percentile latency (ns)": 3697602, "97.00 percentile latency (ns)": 4309789, "99.00 percentile latency (ns)": 6514749, "99.90 percentile latency (ns)": 29527467, "Max latency (ns)": 117642041, "Mean latency (ns)": 2970037, "Min duration satisfied": "Yes", "Min latency (ns)": 2353831, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 335.94, "QPS w/o loadgen overhead": 336.7, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 3.013443, "characteristics.90th_percentile_latency_ns": 3013443.0, "characteristics.90th_percentile_latency_s": 0.003013443, "characteristics.90th_percentile_latency_us": 3013.443, "characteristics.accuracy": 49.12, "characteristics.good": 24560, "characteristics.power": 0.05786226146250081, "characteristics.power.normalized_per_core": 0.0004821855121875067, "characteristics.power.normalized_per_processor": 0.05786226146250081, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-128-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-0.35-128-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_128_35.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "355787fb48e39204", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 22366278, "90.00 percentile latency (ns)": 29945726, "90th percentile latency (ns)": 29945726, "95.00 percentile latency (ns)": 32811952, "97.00 percentile latency (ns)": 36115874, "99.00 percentile latency (ns)": 45489653, "99.90 percentile latency (ns)": 121180285, "Max latency (ns)": 144259273, "Mean latency (ns)": 24517861, "Min duration satisfied": "Yes", "Min latency (ns)": 18789759, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 40.76, "QPS w/o loadgen overhead": 40.79, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 29.945726, "characteristics.90th_percentile_latency_ns": 29945726.0, "characteristics.90th_percentile_latency_s": 0.029945726, "characteristics.90th_percentile_latency_us": 29945.726, "characteristics.accuracy": 73.584, "characteristics.good": 36792, "characteristics.power": 0.49949908936491116, "characteristics.power.normalized_per_core": 0.00416249241137426, "characteristics.power.normalized_per_processor": 0.49949908936491116, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.4-224-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-1.4-224-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_224_140.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "f47d09fc7a961206", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 15252679, "90.00 percentile latency (ns)": 16077069, "90th percentile latency (ns)": 16077069, "95.00 percentile latency (ns)": 20072509, "97.00 percentile latency (ns)": 21181903, "99.00 percentile latency (ns)": 28763583, "99.90 percentile latency (ns)": 62522182, "Max latency (ns)": 92075146, "Mean latency (ns)": 15886903, "Min duration satisfied": "Yes", "Min latency (ns)": 13921162, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 62.89, "QPS w/o loadgen overhead": 62.94, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 16.077069, "characteristics.90th_percentile_latency_ns": 16077069.0, "characteristics.90th_percentile_latency_s": 0.016077069, "characteristics.90th_percentile_latency_us": 16077.069, "characteristics.accuracy": 70.772, "characteristics.good": 35386, "characteristics.power": 0.32702793383146855, "characteristics.power.normalized_per_core": 0.0027252327819289046, "characteristics.power.normalized_per_processor": 0.32702793383146855, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-1.0-224-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-1.0-224-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_1.0_224_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 200, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "186155d86e94dfba", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 1797659, "90.00 percentile latency (ns)": 1980312, "90th percentile latency (ns)": 1980312, "95.00 percentile latency (ns)": 2217748, "97.00 percentile latency (ns)": 2738703, "99.00 percentile latency (ns)": 3926381, "99.90 percentile latency (ns)": 24750498, "Max latency (ns)": 79677783, "Mean latency (ns)": 1946044, "Min duration satisfied": "Yes", "Min latency (ns)": 1534979, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 512.4, "QPS w/o loadgen overhead": 513.86, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 1.980312, "characteristics.90th_percentile_latency_ns": 1980312.0, "characteristics.90th_percentile_latency_s": 0.001980312, "characteristics.90th_percentile_latency_us": 1980.312, "characteristics.accuracy": 47.808, "characteristics.good": 23904, "characteristics.power": 0.04418067430524521, "characteristics.power.normalized_per_core": 0.0003681722858770434, "characteristics.power.normalized_per_processor": 0.04418067430524521, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.25-160-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-0.25-160-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.25_160.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 500, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "ae2c542b89f67a57", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 3559861, "90.00 percentile latency (ns)": 5586185, "90th percentile latency (ns)": 5586185, "95.00 percentile latency (ns)": 7035301, "97.00 percentile latency (ns)": 8251032, "99.00 percentile latency (ns)": 10847462, "99.90 percentile latency (ns)": 49331373, "Max latency (ns)": 141421723, "Mean latency (ns)": 4196199, "Min duration satisfied": "Yes", "Min latency (ns)": 2889305, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 237.22, "QPS w/o loadgen overhead": 238.31, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 5.586185, "characteristics.90th_percentile_latency_ns": 5586185.0, "characteristics.90th_percentile_latency_s": 0.005586185, "characteristics.90th_percentile_latency_us": 5586.185, "characteristics.accuracy": 64.038, "characteristics.good": 32019, "characteristics.power": 0.10130546340051402, "characteristics.power.normalized_per_core": 0.0008442121950042836, "characteristics.power.normalized_per_processor": 0.10130546340051402, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-128-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-0.75-128-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.75_128.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "ecdee4eaf8b1cb0f", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 2975319, "90.00 percentile latency (ns)": 3358053, "90th percentile latency (ns)": 3358053, "95.00 percentile latency (ns)": 4072648, "97.00 percentile latency (ns)": 4849000, "99.00 percentile latency (ns)": 7074087, "99.90 percentile latency (ns)": 32321754, "Max latency (ns)": 88145684, "Mean latency (ns)": 3234955, "Min duration satisfied": "Yes", "Min latency (ns)": 2635076, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 308.4, "QPS w/o loadgen overhead": 309.12, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 3.358053, "characteristics.90th_percentile_latency_ns": 3358053.0, "characteristics.90th_percentile_latency_s": 0.003358053, "characteristics.90th_percentile_latency_us": 3358.053, "characteristics.accuracy": 51.848, "characteristics.good": 25924, "characteristics.power": 0.07497716732111338, "characteristics.power.normalized_per_core": 0.0006248097276759448, "characteristics.power.normalized_per_processor": 0.07497716732111338, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.25-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-0.25-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.25_224.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 500, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "1b2526894fee449f", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 4763392, "90.00 percentile latency (ns)": 5540407, "90th percentile latency (ns)": 5540407, "95.00 percentile latency (ns)": 6670829, "97.00 percentile latency (ns)": 7855555, "99.00 percentile latency (ns)": 11655924, "99.90 percentile latency (ns)": 43443844, "Max latency (ns)": 140267059, "Mean latency (ns)": 5145735, "Min duration satisfied": "Yes", "Min latency (ns)": 3944274, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 194.02, "QPS w/o loadgen overhead": 194.34, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 5.540407, "characteristics.90th_percentile_latency_ns": 5540407.0, "characteristics.90th_percentile_latency_s": 0.005540407, "characteristics.90th_percentile_latency_us": 5540.407, "characteristics.accuracy": 59.226, "characteristics.good": 29613, "characteristics.power": 0.10114249390097256, "characteristics.power.normalized_per_core": 0.000842854115841438, "characteristics.power.normalized_per_processor": 0.10114249390097256, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-160-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-0.5-160-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_160_50.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "ae41589987e1a11d", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 9034290, "90.00 percentile latency (ns)": 11048492, "90th percentile latency (ns)": 11048492, "95.00 percentile latency (ns)": 13453560, "97.00 percentile latency (ns)": 15148707, "99.00 percentile latency (ns)": 23208907, "99.90 percentile latency (ns)": 67778382, "Max latency (ns)": 85158901, "Mean latency (ns)": 9800484, "Min duration satisfied": "Yes", "Min latency (ns)": 8152619, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 101.93, "QPS w/o loadgen overhead": 102.04, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 11.048492, "characteristics.90th_percentile_latency_ns": 11048492.0, "characteristics.90th_percentile_latency_s": 0.011048492, "characteristics.90th_percentile_latency_us": 11048.492, "characteristics.accuracy": 68.248, "characteristics.good": 34124, "characteristics.power": 0.19924232019411275, "characteristics.power.normalized_per_core": 0.001660352668284273, "characteristics.power.normalized_per_processor": 0.19924232019411275, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-1.0-160-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-1.0-160-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_1.0_160_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 200, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "f2681f0793e46e88", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 4157071, "90.00 percentile latency (ns)": 5701501, "90th percentile latency (ns)": 5701501, "95.00 percentile latency (ns)": 7414766, "97.00 percentile latency (ns)": 9101941, "99.00 percentile latency (ns)": 11934770, "99.90 percentile latency (ns)": 46184673, "Max latency (ns)": 129686422, "Mean latency (ns)": 4726920, "Min duration satisfied": "Yes", "Min latency (ns)": 3546571, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 211.23, "QPS w/o loadgen overhead": 211.55, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 5.701501, "characteristics.90th_percentile_latency_ns": 5701501.0, "characteristics.90th_percentile_latency_s": 0.005701501, "characteristics.90th_percentile_latency_us": 5701.501, "characteristics.accuracy": 59.12, "characteristics.good": 29560, "characteristics.power": 0.09315231165207719, "characteristics.power.normalized_per_core": 0.0007762692637673099, "characteristics.power.normalized_per_processor": 0.09315231165207719, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-96-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-1.0-96-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_96_100.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "2b12e4209a88dbcf", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 4275801, "90.00 percentile latency (ns)": 5040253, "90th percentile latency (ns)": 5040253, "95.00 percentile latency (ns)": 6141320, "97.00 percentile latency (ns)": 7345539, "99.00 percentile latency (ns)": 10978463, "99.90 percentile latency (ns)": 46601220, "Max latency (ns)": 77244039, "Mean latency (ns)": 4704346, "Min duration satisfied": "Yes", "Min latency (ns)": 3764706, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 212.24, "QPS w/o loadgen overhead": 212.57, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 5.040253, "characteristics.90th_percentile_latency_ns": 5040253.0, "characteristics.90th_percentile_latency_s": 0.005040253, "characteristics.90th_percentile_latency_us": 5040.253, "characteristics.accuracy": 58.46, "characteristics.good": 29230, "characteristics.power": 0.09534599195878868, "characteristics.power.normalized_per_core": 0.0007945499329899057, "characteristics.power.normalized_per_processor": 0.09534599195878868, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.75-128-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-0.75-128-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.75_128_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 200, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "4886a3b44c18f830", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 11896158, "90.00 percentile latency (ns)": 17880815, "90th percentile latency (ns)": 17880815, "95.00 percentile latency (ns)": 19362835, "97.00 percentile latency (ns)": 20917369, "99.00 percentile latency (ns)": 29810765, "99.90 percentile latency (ns)": 87706362, "Max latency (ns)": 127367813, "Mean latency (ns)": 13335248, "Min duration satisfied": "Yes", "Min latency (ns)": 10722184, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 74.9, "QPS w/o loadgen overhead": 74.99, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 17.880815, "characteristics.90th_percentile_latency_ns": 17880815.0, "characteristics.90th_percentile_latency_s": 0.017880815, "characteristics.90th_percentile_latency_us": 17880.815, "characteristics.accuracy": 72.91, "characteristics.good": 36455, "characteristics.power": 0.27666902080048605, "characteristics.power.normalized_per_core": 0.0023055751733373838, "characteristics.power.normalized_per_processor": 0.27666902080048605, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-large_224_1.0_uint8", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v3-large_224_1.0_uint8", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-large_224_1.0_uint8.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 166.667, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "8fc57f8a4520939b", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 12990045, "90.00 percentile latency (ns)": 19475194, "90th percentile latency (ns)": 19475194, "95.00 percentile latency (ns)": 20714974, "97.00 percentile latency (ns)": 22275665, "99.00 percentile latency (ns)": 31295369, "99.90 percentile latency (ns)": 91441790, "Max latency (ns)": 127955318, "Mean latency (ns)": 14685748, "Min duration satisfied": "Yes", "Min latency (ns)": 11428565, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 68.04, "QPS w/o loadgen overhead": 68.09, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 19.475194, "characteristics.90th_percentile_latency_ns": 19475194.0, "characteristics.90th_percentile_latency_s": 0.019475194, "characteristics.90th_percentile_latency_us": 19475.194, "characteristics.accuracy": 70.542, "characteristics.good": 35271, "characteristics.power": 0.3004288943696957, "characteristics.power.normalized_per_core": 0.0025035741197474643, "characteristics.power.normalized_per_processor": 0.3004288943696957, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-224-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-1.0-224-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_224_100.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "4ba9d585443a9dd5", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 4492967, "90.00 percentile latency (ns)": 5186470, "90th percentile latency (ns)": 5186470, "95.00 percentile latency (ns)": 6061646, "97.00 percentile latency (ns)": 6953301, "99.00 percentile latency (ns)": 10901157, "99.90 percentile latency (ns)": 45914866, "Max latency (ns)": 120802112, "Mean latency (ns)": 4868536, "Min duration satisfied": "Yes", "Min latency (ns)": 4032179, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 205.05, "QPS w/o loadgen overhead": 205.4, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 5.18647, "characteristics.90th_percentile_latency_ns": 5186470.0, "characteristics.90th_percentile_latency_s": 0.00518647, "characteristics.90th_percentile_latency_us": 5186.47, "characteristics.accuracy": 56.594, "characteristics.good": 28297, "characteristics.power": 0.09591689100438282, "characteristics.power.normalized_per_core": 0.0007993074250365235, "characteristics.power.normalized_per_processor": 0.09591689100438282, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-192-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-0.35-192-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_192_35.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "49950294400b037a", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 7687393, "90.00 percentile latency (ns)": 12927143, "90th percentile latency (ns)": 12927143, "95.00 percentile latency (ns)": 14700340, "97.00 percentile latency (ns)": 15407179, "99.00 percentile latency (ns)": 20440892, "99.90 percentile latency (ns)": 79000104, "Max latency (ns)": 127473706, "Mean latency (ns)": 8832296, "Min duration satisfied": "Yes", "Min latency (ns)": 6603108, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 113.1, "QPS w/o loadgen overhead": 113.22, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 12.927143, "characteristics.90th_percentile_latency_ns": 12927143.0, "characteristics.90th_percentile_latency_s": 0.012927143, "characteristics.90th_percentile_latency_us": 12927.143, "characteristics.accuracy": 67.82, "characteristics.good": 33910, "characteristics.power": 0.17916353530262985, "characteristics.power.normalized_per_core": 0.0014930294608552488, "characteristics.power.normalized_per_processor": 0.17916353530262985, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-160-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-1.0-160-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_160_100.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "51a809f354677a0b", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 1352226, "90.00 percentile latency (ns)": 1490246, "90th percentile latency (ns)": 1490246, "95.00 percentile latency (ns)": 1613261, "97.00 percentile latency (ns)": 1972829, "99.00 percentile latency (ns)": 2908395, "99.90 percentile latency (ns)": 21150298, "Max latency (ns)": 74481020, "Mean latency (ns)": 1462121, "Min duration satisfied": "Yes", "Min latency (ns)": 1166743, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 682.05, "QPS w/o loadgen overhead": 683.94, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 1.490246, "characteristics.90th_percentile_latency_ns": 1490246.0, "characteristics.90th_percentile_latency_s": 0.001490246, "characteristics.90th_percentile_latency_us": 1490.246, "characteristics.accuracy": 44.116, "characteristics.good": 22058, "characteristics.power": 0.031754423776451386, "characteristics.power.normalized_per_core": 0.00026462019813709486, "characteristics.power.normalized_per_processor": 0.031754423776451386, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.25-128-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-0.25-128-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.25_128.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 500, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "894c87afaa46c7e0", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 1887665, "90.00 percentile latency (ns)": 2278209, "90th percentile latency (ns)": 2278209, "95.00 percentile latency (ns)": 3088678, "97.00 percentile latency (ns)": 3843623, "99.00 percentile latency (ns)": 6087306, "99.90 percentile latency (ns)": 28873225, "Max latency (ns)": 76294812, "Mean latency (ns)": 2139917, "Min duration satisfied": "Yes", "Min latency (ns)": 1650791, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 466.54, "QPS w/o loadgen overhead": 467.31, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 2.278209, "characteristics.90th_percentile_latency_ns": 2278209.0, "characteristics.90th_percentile_latency_s": 0.002278209, "characteristics.90th_percentile_latency_us": 2278.209, "characteristics.accuracy": 45.494, "characteristics.good": 22747, "characteristics.power": 0.04322627639181518, "characteristics.power.normalized_per_core": 0.0003602189699317932, "characteristics.power.normalized_per_processor": 0.04322627639181518, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.25-160-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-0.25-160-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.25_160_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 500, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "bb50cadfda4ee2b2", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 9006575, "90.00 percentile latency (ns)": 10921764, "90th percentile latency (ns)": 10921764, "95.00 percentile latency (ns)": 13687999, "97.00 percentile latency (ns)": 15144896, "99.00 percentile latency (ns)": 21287504, "99.90 percentile latency (ns)": 70129956, "Max latency (ns)": 97232185, "Mean latency (ns)": 9986350, "Min duration satisfied": "Yes", "Min latency (ns)": 8223020, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 99.91, "QPS w/o loadgen overhead": 100.14, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 10.921764, "characteristics.90th_percentile_latency_ns": 10921764.0, "characteristics.90th_percentile_latency_s": 0.010921764, "characteristics.90th_percentile_latency_us": 10921.764, "characteristics.accuracy": 70.626, "characteristics.good": 35313, "characteristics.power": 0.267898566753444, "characteristics.power.normalized_per_core": 0.0022324880562787, "characteristics.power.normalized_per_processor": 0.267898566753444, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-1.0-192-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-1.0-192-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_1.0_192.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 200, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "1df93e7afc6d4ae9", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 5975110, "90.00 percentile latency (ns)": 9023916, "90th percentile latency (ns)": 9023916, "95.00 percentile latency (ns)": 11250711, "97.00 percentile latency (ns)": 12575766, "99.00 percentile latency (ns)": 14732254, "99.90 percentile latency (ns)": 70569658, "Max latency (ns)": 121054480, "Mean latency (ns)": 6880608, "Min duration satisfied": "Yes", "Min latency (ns)": 5176086, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 145.12, "QPS w/o loadgen overhead": 145.34, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 9.023916, "characteristics.90th_percentile_latency_ns": 9023916.0, "characteristics.90th_percentile_latency_s": 0.009023916, "characteristics.90th_percentile_latency_us": 9023.916, "characteristics.accuracy": 63.454, "characteristics.good": 31727, "characteristics.power": 0.13725244283962015, "characteristics.power.normalized_per_core": 0.0011437703569968346, "characteristics.power.normalized_per_processor": 0.13725244283962015, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-128-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-1.0-128-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_128_100.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "2a664d084117aea0", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 11422922, "90.00 percentile latency (ns)": 13050674, "90th percentile latency (ns)": 13050674, "95.00 percentile latency (ns)": 14170082, "97.00 percentile latency (ns)": 16386707, "99.00 percentile latency (ns)": 26609148, "99.90 percentile latency (ns)": 72188969, "Max latency (ns)": 90822857, "Mean latency (ns)": 12091516, "Min duration satisfied": "Yes", "Min latency (ns)": 10337465, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 82.61, "QPS w/o loadgen overhead": 82.7, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 13.050674, "characteristics.90th_percentile_latency_ns": 13050674.0, "characteristics.90th_percentile_latency_s": 0.013050674, "characteristics.90th_percentile_latency_us": 13050.674, "characteristics.accuracy": 70.04, "characteristics.good": 35020, "characteristics.power": 0.25027649767725774, "characteristics.power.normalized_per_core": 0.0020856374806438147, "characteristics.power.normalized_per_processor": 0.25027649767725774, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-1.0-192-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-1.0-192-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_1.0_192_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 200, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "1501a7561539427a", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 27689468, "90.00 percentile latency (ns)": 40099248, "90th percentile latency (ns)": 40099248, "95.00 percentile latency (ns)": 45296254, "97.00 percentile latency (ns)": 49511439, "99.00 percentile latency (ns)": 53797086, "99.90 percentile latency (ns)": 94966591, "Max latency (ns)": 131743916, "Mean latency (ns)": 31335580, "Min duration satisfied": "Yes", "Min latency (ns)": 25825962, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 31.9, "QPS w/o loadgen overhead": 31.91, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 40.099248, "characteristics.90th_percentile_latency_ns": 40099248.0, "characteristics.90th_percentile_latency_s": 0.040099248, "characteristics.90th_percentile_latency_us": 40099.248, "characteristics.accuracy": 74.124, "characteristics.good": 37062, "characteristics.power": 0.6592394729169214, "characteristics.power.normalized_per_core": 0.005493662274307679, "characteristics.power.normalized_per_processor": 0.6592394729169214, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite2-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "efficientnet-lite2-quantized", "input_data_types": "uint8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite2.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 50, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "45b4525963d9269f", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 3362741, "90.00 percentile latency (ns)": 3778665, "90th percentile latency (ns)": 3778665, "95.00 percentile latency (ns)": 5394035, "97.00 percentile latency (ns)": 6858773, "99.00 percentile latency (ns)": 9602024, "99.90 percentile latency (ns)": 39363655, "Max latency (ns)": 79693809, "Mean latency (ns)": 3712467, "Min duration satisfied": "Yes", "Min latency (ns)": 2913794, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 268.98, "QPS w/o loadgen overhead": 269.36, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 3.778665, "characteristics.90th_percentile_latency_ns": 3778665.0, "characteristics.90th_percentile_latency_s": 0.003778665, "characteristics.90th_percentile_latency_us": 3778.665, "characteristics.accuracy": 59.444, "characteristics.good": 29722, "characteristics.power": 0.07542725430786104, "characteristics.power.normalized_per_core": 0.0006285604525655086, "characteristics.power.normalized_per_processor": 0.07542725430786104, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.5-160-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-0.5-160-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.5_160_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 200, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "a2e483c875be0642", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 4340208, "90.00 percentile latency (ns)": 4831943, "90th percentile latency (ns)": 4831943, "95.00 percentile latency (ns)": 6739688, "97.00 percentile latency (ns)": 8492073, "99.00 percentile latency (ns)": 11164128, "99.90 percentile latency (ns)": 28509981, "Max latency (ns)": 75223883, "Mean latency (ns)": 4719617, "Min duration satisfied": "Yes", "Min latency (ns)": 3946038, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 211.58, "QPS w/o loadgen overhead": 211.88, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 4.831943, "characteristics.90th_percentile_latency_ns": 4831943.0, "characteristics.90th_percentile_latency_s": 0.004831943, "characteristics.90th_percentile_latency_us": 4831.943, "characteristics.accuracy": 61.456, "characteristics.good": 30728, "characteristics.power": 0.09543183794615834, "characteristics.power.normalized_per_core": 0.0007952653162179861, "characteristics.power.normalized_per_processor": 0.09543183794615834, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.5-192-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-0.5-192-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.5_192_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 200, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "da686d873486bac9", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 5642449, "90.00 percentile latency (ns)": 6821245, "90th percentile latency (ns)": 6821245, "95.00 percentile latency (ns)": 8666315, "97.00 percentile latency (ns)": 10812701, "99.00 percentile latency (ns)": 13665247, "99.90 percentile latency (ns)": 63989948, "Max latency (ns)": 111954722, "Mean latency (ns)": 6201014, "Min duration satisfied": "Yes", "Min latency (ns)": 4956459, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 161.04, "QPS w/o loadgen overhead": 161.26, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 6.821245, "characteristics.90th_percentile_latency_ns": 6821245.0, "characteristics.90th_percentile_latency_s": 0.006821245, "characteristics.90th_percentile_latency_us": 6821.245, "characteristics.accuracy": 58.528, "characteristics.good": 29264, "characteristics.power": 0.12400526166539348, "characteristics.power.normalized_per_core": 0.0010333771805449458, "characteristics.power.normalized_per_processor": 0.12400526166539348, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-224-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-0.35-224-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_224_35.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "ef97e99e97f89c4c", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 4098168, "90.00 percentile latency (ns)": 6067120, "90th percentile latency (ns)": 6067120, "95.00 percentile latency (ns)": 7576725, "97.00 percentile latency (ns)": 8756522, "99.00 percentile latency (ns)": 11505188, "99.90 percentile latency (ns)": 48980883, "Max latency (ns)": 136063475, "Mean latency (ns)": 4746816, "Min duration satisfied": "Yes", "Min latency (ns)": 3586722, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 209.88, "QPS w/o loadgen overhead": 210.67, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 6.06712, "characteristics.90th_percentile_latency_ns": 6067120.0, "characteristics.90th_percentile_latency_s": 0.00606712, "characteristics.90th_percentile_latency_us": 6067.12, "characteristics.accuracy": 66.036, "characteristics.good": 33018, "characteristics.power": 0.11695651483387338, "characteristics.power.normalized_per_core": 0.0009746376236156115, "characteristics.power.normalized_per_processor": 0.11695651483387338, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-128-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-1.0-128-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_1.0_128.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "7baaadc697dd771c", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 16788660, "90.00 percentile latency (ns)": 21488871, "90th percentile latency (ns)": 21488871, "95.00 percentile latency (ns)": 23942219, "97.00 percentile latency (ns)": 24711608, "99.00 percentile latency (ns)": 33368065, "99.90 percentile latency (ns)": 83772813, "Max latency (ns)": 129348687, "Mean latency (ns)": 17594625, "Min duration satisfied": "Yes", "Min latency (ns)": 14104111, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 56.77, "QPS w/o loadgen overhead": 56.84, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 21.488871, "characteristics.90th_percentile_latency_ns": 21488871.0, "characteristics.90th_percentile_latency_s": 0.021488871, "characteristics.90th_percentile_latency_us": 21488.871, "characteristics.accuracy": 76.642, "characteristics.good": 38321, "characteristics.power": 0.4705830893862166, "characteristics.power.normalized_per_core": 0.003921525744885138, "characteristics.power.normalized_per_processor": 0.4705830893862166, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite1-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "efficientnet-lite1-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite1.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 50, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "5f8a4ad99a7b1c38", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 10068923, "90.00 percentile latency (ns)": 16896820, "90th percentile latency (ns)": 16896820, "95.00 percentile latency (ns)": 18957921, "97.00 percentile latency (ns)": 20346252, "99.00 percentile latency (ns)": 26969356, "99.90 percentile latency (ns)": 91451293, "Max latency (ns)": 132020057, "Mean latency (ns)": 11687638, "Min duration satisfied": "Yes", "Min latency (ns)": 8694860, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 85.48, "QPS w/o loadgen overhead": 85.56, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 16.89682, "characteristics.90th_percentile_latency_ns": 16896820.0, "characteristics.90th_percentile_latency_s": 0.01689682, "characteristics.90th_percentile_latency_us": 16896.82, "characteristics.accuracy": 69.604, "characteristics.good": 34802, "characteristics.power": 0.23702480099423917, "characteristics.power.normalized_per_core": 0.001975206674951993, "characteristics.power.normalized_per_processor": 0.23702480099423917, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-192-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-1.0-192-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_192_100.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "d004d9e888782a02", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 9077702, "90.00 percentile latency (ns)": 11225873, "90th percentile latency (ns)": 11225873, "95.00 percentile latency (ns)": 13691482, "97.00 percentile latency (ns)": 15085603, "99.00 percentile latency (ns)": 22884901, "99.90 percentile latency (ns)": 69236771, "Max latency (ns)": 97011245, "Mean latency (ns)": 9514962, "Min duration satisfied": "Yes", "Min latency (ns)": 7612679, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 104.87, "QPS w/o loadgen overhead": 105.1, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 11.225873, "characteristics.90th_percentile_latency_ns": 11225873.0, "characteristics.90th_percentile_latency_s": 0.011225873, "characteristics.90th_percentile_latency_us": 11225.873, "characteristics.accuracy": 69.262, "characteristics.good": 34631, "characteristics.power": 0.2425895377221756, "characteristics.power.normalized_per_core": 0.0020215794810181298, "characteristics.power.normalized_per_processor": 0.2425895377221756, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.75-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-0.75-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.75_224.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 200, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "f746fdacf8b91433", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 11130326, "90.00 percentile latency (ns)": 17121202, "90th percentile latency (ns)": 17121202, "95.00 percentile latency (ns)": 18429414, "97.00 percentile latency (ns)": 19261134, "99.00 percentile latency (ns)": 28785963, "99.90 percentile latency (ns)": 91108410, "Max latency (ns)": 122111849, "Mean latency (ns)": 12573505, "Min duration satisfied": "Yes", "Min latency (ns)": 9572222, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 79.46, "QPS w/o loadgen overhead": 79.53, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 17.121202, "characteristics.90th_percentile_latency_ns": 17121202.0, "characteristics.90th_percentile_latency_s": 0.017121202, "characteristics.90th_percentile_latency_us": 17121.202, "characteristics.accuracy": 68.734, "characteristics.good": 34367, "characteristics.power": 0.2568031448630435, "characteristics.power.normalized_per_core": 0.0021400262071920293, "characteristics.power.normalized_per_processor": 0.2568031448630435, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-224-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-0.75-224-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_224_75.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "91ca54a79b1c914e", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 3643170, "90.00 percentile latency (ns)": 4146295, "90th percentile latency (ns)": 4146295, "95.00 percentile latency (ns)": 4849714, "97.00 percentile latency (ns)": 5695161, "99.00 percentile latency (ns)": 8902408, "99.90 percentile latency (ns)": 41693477, "Max latency (ns)": 111844487, "Mean latency (ns)": 3948045, "Min duration satisfied": "Yes", "Min latency (ns)": 3175085, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 252.23, "QPS w/o loadgen overhead": 253.29, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 4.146295, "characteristics.90th_percentile_latency_ns": 4146295.0, "characteristics.90th_percentile_latency_s": 0.004146295, "characteristics.90th_percentile_latency_us": 4146.295, "characteristics.accuracy": 63.33, "characteristics.good": 31665, "characteristics.power": 0.09158473151701596, "characteristics.power.normalized_per_core": 0.000763206095975133, "characteristics.power.normalized_per_processor": 0.09158473151701596, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-small-minimalistic_224_1.0_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v3-small-minimalistic_224_1.0_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-small-minimalistic_224_1.0_float.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 166.667, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "442afb80b06e1cd3", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 1961159, "90.00 percentile latency (ns)": 2230709, "90th percentile latency (ns)": 2230709, "95.00 percentile latency (ns)": 2512715, "97.00 percentile latency (ns)": 3075935, "99.00 percentile latency (ns)": 4424100, "99.90 percentile latency (ns)": 25260456, "Max latency (ns)": 79646906, "Mean latency (ns)": 2142206, "Min duration satisfied": "Yes", "Min latency (ns)": 1749051, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 465.05, "QPS w/o loadgen overhead": 466.81, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 2.230709, "characteristics.90th_percentile_latency_ns": 2230709.0, "characteristics.90th_percentile_latency_s": 0.002230709, "characteristics.90th_percentile_latency_us": 2230.709, "characteristics.accuracy": 57.918, "characteristics.good": 28959, "characteristics.power": 0.052892413002186195, "characteristics.power.normalized_per_core": 0.00044077010835155163, "characteristics.power.normalized_per_processor": 0.052892413002186195, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.5-128-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-0.5-128-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.5_128.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 500, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "cf74602bfdfc48c2", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 12181186, "90.00 percentile latency (ns)": 15314498, "90th percentile latency (ns)": 15314498, "95.00 percentile latency (ns)": 17713044, "97.00 percentile latency (ns)": 18957131, "99.00 percentile latency (ns)": 26293749, "99.90 percentile latency (ns)": 66273194, "Max latency (ns)": 86073327, "Mean latency (ns)": 13343739, "Min duration satisfied": "Yes", "Min latency (ns)": 11153917, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 74.83, "QPS w/o loadgen overhead": 74.94, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 15.314498, "characteristics.90th_percentile_latency_ns": 15314498.0, "characteristics.90th_percentile_latency_s": 0.015314498, "characteristics.90th_percentile_latency_us": 15314.498, "characteristics.accuracy": 71.676, "characteristics.good": 35838, "characteristics.power": 0.35377465018354415, "characteristics.power.normalized_per_core": 0.002948122084862868, "characteristics.power.normalized_per_processor": 0.35377465018354415, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-1.0-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-1.0-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_1.0_224.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 200, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "555417f4fc7ae893", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 1938673, "90.00 percentile latency (ns)": 2145877, "90th percentile latency (ns)": 2145877, "95.00 percentile latency (ns)": 2668495, "97.00 percentile latency (ns)": 3316480, "99.00 percentile latency (ns)": 4958059, "99.90 percentile latency (ns)": 26086114, "Max latency (ns)": 98213600, "Mean latency (ns)": 2127361, "Min duration satisfied": "Yes", "Min latency (ns)": 1684550, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 469.29, "QPS w/o loadgen overhead": 470.07, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 2.145877, "characteristics.90th_percentile_latency_ns": 2145877.0, "characteristics.90th_percentile_latency_s": 0.002145877, "characteristics.90th_percentile_latency_us": 2145.877, "characteristics.accuracy": 43.468, "characteristics.good": 21734, "characteristics.power": 0.04211669142042535, "characteristics.power.normalized_per_core": 0.0003509724285035446, "characteristics.power.normalized_per_processor": 0.04211669142042535, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-96-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-0.35-96-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_96_35.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "74f17b4269fa9403", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 52390715, "90.00 percentile latency (ns)": 67754253, "90th percentile latency (ns)": 67754253, "95.00 percentile latency (ns)": 70348269, "97.00 percentile latency (ns)": 73303283, "99.00 percentile latency (ns)": 82868245, "99.90 percentile latency (ns)": 135484751, "Max latency (ns)": 168887474, "Mean latency (ns)": 56749943, "Min duration satisfied": "Yes", "Min latency (ns)": 48470052, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 17.62, "QPS w/o loadgen overhead": 17.62, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 67.754253, "characteristics.90th_percentile_latency_ns": 67754253.0, "characteristics.90th_percentile_latency_s": 0.067754253, "characteristics.90th_percentile_latency_us": 67754.253, "characteristics.accuracy": 80.676, "characteristics.good": 40338, "characteristics.power": 1.5957546841665073, "characteristics.power.normalized_per_core": 0.013297955701387561, "characteristics.power.normalized_per_processor": 1.5957546841665073, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite4-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "efficientnet-lite4-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite4.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 50, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "2874bef9b97dfa09", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 10116552, "90.00 percentile latency (ns)": 16051294, "90th percentile latency (ns)": 16051294, "95.00 percentile latency (ns)": 17369116, "97.00 percentile latency (ns)": 18169298, "99.00 percentile latency (ns)": 26397666, "99.90 percentile latency (ns)": 79916187, "Max latency (ns)": 121147232, "Mean latency (ns)": 11469463, "Min duration satisfied": "Yes", "Min latency (ns)": 8864854, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 87.11, "QPS w/o loadgen overhead": 87.19, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 16.051294, "characteristics.90th_percentile_latency_ns": 16051294.0, "characteristics.90th_percentile_latency_s": 0.016051294, "characteristics.90th_percentile_latency_us": 16051.294, "characteristics.accuracy": 70.43, "characteristics.good": 35215, "characteristics.power": 0.2321617850880917, "characteristics.power.normalized_per_core": 0.0019346815424007642, "characteristics.power.normalized_per_processor": 0.2321617850880917, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-large-minimalistic_224_1.0_uint8", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v3-large-minimalistic_224_1.0_uint8", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-large-minimalistic_224_1.0_uint8.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 166.667, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "9c8dd58556c10401", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 8010390, "90.00 percentile latency (ns)": 10347189, "90th percentile latency (ns)": 10347189, "95.00 percentile latency (ns)": 14184363, "97.00 percentile latency (ns)": 15420046, "99.00 percentile latency (ns)": 19839660, "99.90 percentile latency (ns)": 74003003, "Max latency (ns)": 137014167, "Mean latency (ns)": 8904344, "Min duration satisfied": "Yes", "Min latency (ns)": 7315348, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 112.19, "QPS w/o loadgen overhead": 112.3, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 10.347189, "characteristics.90th_percentile_latency_ns": 10347189.0, "characteristics.90th_percentile_latency_s": 0.010347189, "characteristics.90th_percentile_latency_us": 10347.189, "characteristics.accuracy": 67.474, "characteristics.good": 33737, "characteristics.power": 0.17992637621220758, "characteristics.power.normalized_per_core": 0.0014993864684350632, "characteristics.power.normalized_per_processor": 0.17992637621220758, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-192-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-0.75-192-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_192_75.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "62e1449aab80aa2f", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 8205284, "90.00 percentile latency (ns)": 9930068, "90th percentile latency (ns)": 9930068, "95.00 percentile latency (ns)": 12211031, "97.00 percentile latency (ns)": 14017437, "99.00 percentile latency (ns)": 20770704, "99.90 percentile latency (ns)": 66929746, "Max latency (ns)": 81404605, "Mean latency (ns)": 8897915, "Min duration satisfied": "Yes", "Min latency (ns)": 7318556, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 112.27, "QPS w/o loadgen overhead": 112.39, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 9.930068, "characteristics.90th_percentile_latency_ns": 9930068.0, "characteristics.90th_percentile_latency_s": 0.009930068, "characteristics.90th_percentile_latency_us": 9930.068, "characteristics.accuracy": 67.24, "characteristics.good": 33620, "characteristics.power": 0.1799292492043132, "characteristics.power.normalized_per_core": 0.0014994104100359432, "characteristics.power.normalized_per_processor": 0.1799292492043132, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.75-192-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-0.75-192-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.75_192_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 200, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "8986754720fcf863", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 4970164, "90.00 percentile latency (ns)": 6809054, "90th percentile latency (ns)": 6809054, "95.00 percentile latency (ns)": 8479048, "97.00 percentile latency (ns)": 9828545, "99.00 percentile latency (ns)": 12153351, "99.90 percentile latency (ns)": 30156229, "Max latency (ns)": 87896476, "Mean latency (ns)": 5525220, "Min duration satisfied": "Yes", "Min latency (ns)": 4416349, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 180.42, "QPS w/o loadgen overhead": 180.99, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 6.809054, "characteristics.90th_percentile_latency_ns": 6809054.0, "characteristics.90th_percentile_latency_s": 0.006809054, "characteristics.90th_percentile_latency_us": 6809.054, "characteristics.accuracy": 64.348, "characteristics.good": 32174, "characteristics.power": 0.1381320577628, "characteristics.power.normalized_per_core": 0.0011511004813566665, "characteristics.power.normalized_per_processor": 0.1381320577628, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.5-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-0.5-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.5_224.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 200, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "256a7067664c102a", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 3898617, "90.00 percentile latency (ns)": 5422324, "90th percentile latency (ns)": 5422324, "95.00 percentile latency (ns)": 6852940, "97.00 percentile latency (ns)": 7960887, "99.00 percentile latency (ns)": 10340725, "99.90 percentile latency (ns)": 28495932, "Max latency (ns)": 74529157, "Mean latency (ns)": 4374770, "Min duration satisfied": "Yes", "Min latency (ns)": 3441063, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 227.57, "QPS w/o loadgen overhead": 228.58, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 5.422324, "characteristics.90th_percentile_latency_ns": 5422324.0, "characteristics.90th_percentile_latency_s": 0.005422324, "characteristics.90th_percentile_latency_us": 5422.324, "characteristics.accuracy": 63.246, "characteristics.good": 31623, "characteristics.power": 0.10825317449506157, "characteristics.power.normalized_per_core": 0.0009021097874588464, "characteristics.power.normalized_per_processor": 0.10825317449506157, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.5-192-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-0.5-192-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.5_192.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 200, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "cc69d44e089de40d", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 3294329, "90.00 percentile latency (ns)": 4155685, "90th percentile latency (ns)": 4155685, "95.00 percentile latency (ns)": 5188377, "97.00 percentile latency (ns)": 6214183, "99.00 percentile latency (ns)": 9453212, "99.90 percentile latency (ns)": 36187142, "Max latency (ns)": 130500545, "Mean latency (ns)": 3673477, "Min duration satisfied": "Yes", "Min latency (ns)": 2833923, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 271.4, "QPS w/o loadgen overhead": 272.22, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 4.155685, "characteristics.90th_percentile_latency_ns": 4155685.0, "characteristics.90th_percentile_latency_s": 0.004155685, "characteristics.90th_percentile_latency_us": 4155.685, "characteristics.accuracy": 61.668, "characteristics.good": 30834, "characteristics.power": 0.08711558183950821, "characteristics.power.normalized_per_core": 0.0007259631819959018, "characteristics.power.normalized_per_processor": 0.08711558183950821, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-160-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-0.5-160-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.5_160.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "50f24aa5c4cee861", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 4816120, "90.00 percentile latency (ns)": 6940885, "90th percentile latency (ns)": 6940885, "95.00 percentile latency (ns)": 8608322, "97.00 percentile latency (ns)": 9725812, "99.00 percentile latency (ns)": 12230500, "99.90 percentile latency (ns)": 55170538, "Max latency (ns)": 75521201, "Mean latency (ns)": 5497462, "Min duration satisfied": "Yes", "Min latency (ns)": 4333634, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 181.27, "QPS w/o loadgen overhead": 181.9, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 6.940885, "characteristics.90th_percentile_latency_ns": 6940885.0, "characteristics.90th_percentile_latency_s": 0.006940885, "characteristics.90th_percentile_latency_us": 6940.885, "characteristics.accuracy": 66.384, "characteristics.good": 33192, "characteristics.power": 0.1397018828163358, "characteristics.power.normalized_per_core": 0.0011641823568027984, "characteristics.power.normalized_per_processor": 0.1397018828163358, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.75-160-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-0.75-160-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.75_160.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 200, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "2b113638744b1bfc", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 2476397, "90.00 percentile latency (ns)": 3066855, "90th percentile latency (ns)": 3066855, "95.00 percentile latency (ns)": 4063474, "97.00 percentile latency (ns)": 4811541, "99.00 percentile latency (ns)": 7659186, "99.90 percentile latency (ns)": 30138862, "Max latency (ns)": 106838091, "Mean latency (ns)": 2788294, "Min duration satisfied": "Yes", "Min latency (ns)": 2187072, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 357.98, "QPS w/o loadgen overhead": 358.64, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 3.066855, "characteristics.90th_percentile_latency_ns": 3066855.0, "characteristics.90th_percentile_latency_s": 0.003066855, "characteristics.90th_percentile_latency_us": 3066.855, "characteristics.accuracy": 49.11, "characteristics.good": 24555, "characteristics.power": 0.054944568907561483, "characteristics.power.normalized_per_core": 0.00045787140756301236, "characteristics.power.normalized_per_processor": 0.054944568907561483, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-96-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-0.5-96-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_96_50.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "37d9351bf91c73cf", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 4910176, "90.00 percentile latency (ns)": 5958194, "90th percentile latency (ns)": 5958194, "95.00 percentile latency (ns)": 7338965, "97.00 percentile latency (ns)": 9296754, "99.00 percentile latency (ns)": 12669668, "99.90 percentile latency (ns)": 56919452, "Max latency (ns)": 122619405, "Mean latency (ns)": 5429563, "Min duration satisfied": "Yes", "Min latency (ns)": 4342984, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 183.91, "QPS w/o loadgen overhead": 184.18, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 5.958194, "characteristics.90th_percentile_latency_ns": 5958194.0, "characteristics.90th_percentile_latency_s": 0.005958194, "characteristics.90th_percentile_latency_us": 5958.194, "characteristics.accuracy": 62.07, "characteristics.good": 31035, "characteristics.power": 0.10830995284027668, "characteristics.power.normalized_per_core": 0.000902582940335639, "characteristics.power.normalized_per_processor": 0.10830995284027668, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-128-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-0.75-128-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_128_75.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "f940a8a71192728d", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 3212719, "90.00 percentile latency (ns)": 5168166, "90th percentile latency (ns)": 5168166, "95.00 percentile latency (ns)": 6475809, "97.00 percentile latency (ns)": 7534417, "99.00 percentile latency (ns)": 10119203, "99.90 percentile latency (ns)": 34414402, "Max latency (ns)": 123172729, "Mean latency (ns)": 3803621, "Min duration satisfied": "Yes", "Min latency (ns)": 2660439, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 261.73, "QPS w/o loadgen overhead": 262.91, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 5.168166, "characteristics.90th_percentile_latency_ns": 5168166.0, "characteristics.90th_percentile_latency_s": 0.005168166, "characteristics.90th_percentile_latency_us": 5168.166, "characteristics.accuracy": 61.224, "characteristics.good": 30612, "characteristics.power": 0.09203588230948904, "characteristics.power.normalized_per_core": 0.0007669656859124087, "characteristics.power.normalized_per_processor": 0.09203588230948904, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-96-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-1.0-96-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_1.0_96.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "492d64cf69350c29", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 1612615, "90.00 percentile latency (ns)": 1802060, "90th percentile latency (ns)": 1802060, "95.00 percentile latency (ns)": 2370600, "97.00 percentile latency (ns)": 2789019, "99.00 percentile latency (ns)": 4093457, "99.90 percentile latency (ns)": 22684358, "Max latency (ns)": 75931763, "Mean latency (ns)": 1768185, "Min duration satisfied": "Yes", "Min latency (ns)": 1273560, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 564.44, "QPS w/o loadgen overhead": 565.55, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 1.80206, "characteristics.90th_percentile_latency_ns": 1802060.0, "characteristics.90th_percentile_latency_s": 0.00180206, "characteristics.90th_percentile_latency_us": 1802.06, "characteristics.accuracy": 42.384, "characteristics.good": 21192, "characteristics.power": 0.034206939478871726, "characteristics.power.normalized_per_core": 0.0002850578289905977, "characteristics.power.normalized_per_processor": 0.034206939478871726, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.25-128-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-0.25-128-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.25_128_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 500, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "11095288452b968e", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 13330121, "90.00 percentile latency (ns)": 19891031, "90th percentile latency (ns)": 19891031, "95.00 percentile latency (ns)": 20889930, "97.00 percentile latency (ns)": 21914047, "99.00 percentile latency (ns)": 32638019, "99.90 percentile latency (ns)": 111747019, "Max latency (ns)": 136531740, "Mean latency (ns)": 15456335, "Min duration satisfied": "Yes", "Min latency (ns)": 12122155, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 64.61, "QPS w/o loadgen overhead": 64.7, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 19.891031, "characteristics.90th_percentile_latency_ns": 19891031.0, "characteristics.90th_percentile_latency_s": 0.019891031, "characteristics.90th_percentile_latency_us": 19891.031, "characteristics.accuracy": 75.012, "characteristics.good": 37506, "characteristics.power": 0.4054171458169853, "characteristics.power.normalized_per_core": 0.003378476215141544, "characteristics.power.normalized_per_processor": 0.4054171458169853, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.3-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-1.3-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_1.3_224.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "cab198a8183e7b7d", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 4850903, "90.00 percentile latency (ns)": 5897061, "90th percentile latency (ns)": 5897061, "95.00 percentile latency (ns)": 7375624, "97.00 percentile latency (ns)": 8889925, "99.00 percentile latency (ns)": 12105911, "99.90 percentile latency (ns)": 43993932, "Max latency (ns)": 112061141, "Mean latency (ns)": 5344462, "Min duration satisfied": "Yes", "Min latency (ns)": 4349247, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 186.8, "QPS w/o loadgen overhead": 187.11, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 5.897061, "characteristics.90th_percentile_latency_ns": 5897061.0, "characteristics.90th_percentile_latency_s": 0.005897061, "characteristics.90th_percentile_latency_us": 5897.061, "characteristics.accuracy": 64.486, "characteristics.good": 32243, "characteristics.power": 0.11193423017831604, "characteristics.power.normalized_per_core": 0.000932785251485967, "characteristics.power.normalized_per_processor": 0.11193423017831604, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-small_224_1.0_uint8", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v3-small_224_1.0_uint8", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-small_224_1.0_uint8.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 166.667, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "3628456ea840a717", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 20342460, "90.00 percentile latency (ns)": 27726474, "90th percentile latency (ns)": 27726474, "95.00 percentile latency (ns)": 29065095, "97.00 percentile latency (ns)": 30234588, "99.00 percentile latency (ns)": 39332282, "99.90 percentile latency (ns)": 86504020, "Max latency (ns)": 118384094, "Mean latency (ns)": 22009131, "Min duration satisfied": "Yes", "Min latency (ns)": 19306924, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 45.39, "QPS w/o loadgen overhead": 45.44, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 27.726474, "characteristics.90th_percentile_latency_ns": 27726474.0, "characteristics.90th_percentile_latency_s": 0.027726474, "characteristics.90th_percentile_latency_us": 27726.474, "characteristics.accuracy": 77.542, "characteristics.good": 38771, "characteristics.power": 0.6037751021712061, "characteristics.power.normalized_per_core": 0.005031459184760051, "characteristics.power.normalized_per_processor": 0.6037751021712061, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite2-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "efficientnet-lite2-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite2.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 50, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "ef9ba73c5cff8dd1", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 2606485, "90.00 percentile latency (ns)": 2818686, "90th percentile latency (ns)": 2818686, "95.00 percentile latency (ns)": 3019527, "97.00 percentile latency (ns)": 3919727, "99.00 percentile latency (ns)": 6331067, "99.90 percentile latency (ns)": 22142716, "Max latency (ns)": 71836983, "Mean latency (ns)": 2775435, "Min duration satisfied": "Yes", "Min latency (ns)": 2334537, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 359.72, "QPS w/o loadgen overhead": 360.3, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 2.818686, "characteristics.90th_percentile_latency_ns": 2818686.0, "characteristics.90th_percentile_latency_s": 0.002818686, "characteristics.90th_percentile_latency_us": 2818.686, "characteristics.accuracy": 56.75, "characteristics.good": 28375, "characteristics.power": 0.054590986212539376, "characteristics.power.normalized_per_core": 0.0004549248851044948, "characteristics.power.normalized_per_processor": 0.054590986212539376, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.5-128-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-0.5-128-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.5_128_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 200, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "c4953bb8e4b42679", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 3443321, "90.00 percentile latency (ns)": 4885464, "90th percentile latency (ns)": 4885464, "95.00 percentile latency (ns)": 6511652, "97.00 percentile latency (ns)": 7859807, "99.00 percentile latency (ns)": 10664085, "99.90 percentile latency (ns)": 36329778, "Max latency (ns)": 117415463, "Mean latency (ns)": 3965685, "Min duration satisfied": "Yes", "Min latency (ns)": 2999878, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 251.76, "QPS w/o loadgen overhead": 252.16, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 4.885464, "characteristics.90th_percentile_latency_ns": 4885464.0, "characteristics.90th_percentile_latency_s": 0.004885464, "characteristics.90th_percentile_latency_us": 4885.464, "characteristics.accuracy": 57.002, "characteristics.good": 28501, "characteristics.power": 0.07876951105356056, "characteristics.power.normalized_per_core": 0.0006564125921130047, "characteristics.power.normalized_per_processor": 0.07876951105356056, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-96-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-0.75-96-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_96_75.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "e6438b3314aa3a65", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 15796054, "90.00 percentile latency (ns)": 21690501, "90th percentile latency (ns)": 21690501, "95.00 percentile latency (ns)": 23132942, "97.00 percentile latency (ns)": 24169136, "99.00 percentile latency (ns)": 34124798, "99.90 percentile latency (ns)": 127934583, "Max latency (ns)": 154512302, "Mean latency (ns)": 17285338, "Min duration satisfied": "Yes", "Min latency (ns)": 13343500, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 57.78, "QPS w/o loadgen overhead": 57.85, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 21.690501, "characteristics.90th_percentile_latency_ns": 21690501.0, "characteristics.90th_percentile_latency_s": 0.021690501, "characteristics.90th_percentile_latency_us": 21690.501, "characteristics.accuracy": 75.69, "characteristics.good": 37845, "characteristics.power": 0.45689485088472276, "characteristics.power.normalized_per_core": 0.003807457090706023, "characteristics.power.normalized_per_processor": 0.45689485088472276, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.4-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-1.4-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_1.4_224.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "a7ff1d432c420f99", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 1793200, "90.00 percentile latency (ns)": 2078708, "90th percentile latency (ns)": 2078708, "95.00 percentile latency (ns)": 2604874, "97.00 percentile latency (ns)": 3208292, "99.00 percentile latency (ns)": 5023074, "99.90 percentile latency (ns)": 25801481, "Max latency (ns)": 99697130, "Mean latency (ns)": 1999008, "Min duration satisfied": "Yes", "Min latency (ns)": 1538143, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 498.19, "QPS w/o loadgen overhead": 500.25, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 2.078708, "characteristics.90th_percentile_latency_ns": 2078708.0, "characteristics.90th_percentile_latency_s": 0.002078708, "characteristics.90th_percentile_latency_us": 2078.708, "characteristics.accuracy": 52.446, "characteristics.good": 26223, "characteristics.power": 0.04598345892028677, "characteristics.power.normalized_per_core": 0.00038319549100238975, "characteristics.power.normalized_per_processor": 0.04598345892028677, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-96-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-0.5-96-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.5_96.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "dd5afad93e4dcdba", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 7663810, "90.00 percentile latency (ns)": 9368466, "90th percentile latency (ns)": 9368466, "95.00 percentile latency (ns)": 11834601, "97.00 percentile latency (ns)": 13890645, "99.00 percentile latency (ns)": 19110465, "99.90 percentile latency (ns)": 79740440, "Max latency (ns)": 125161946, "Mean latency (ns)": 8408980, "Min duration satisfied": "Yes", "Min latency (ns)": 7076032, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 118.68, "QPS w/o loadgen overhead": 118.92, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 9.368466, "characteristics.90th_percentile_latency_ns": 9368466.0, "characteristics.90th_percentile_latency_s": 0.009368466, "characteristics.90th_percentile_latency_us": 9368.466, "characteristics.accuracy": 73.724, "characteristics.good": 36862, "characteristics.power": 0.20973861826638668, "characteristics.power.normalized_per_core": 0.0017478218188865557, "characteristics.power.normalized_per_processor": 0.20973861826638668, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-large_224_0.75_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v3-large_224_0.75_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-large_224_0.75_float.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 166.667, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "0a0453d8af8a9b45", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 4401970, "90.00 percentile latency (ns)": 5476482, "90th percentile latency (ns)": 5476482, "95.00 percentile latency (ns)": 6682179, "97.00 percentile latency (ns)": 7851161, "99.00 percentile latency (ns)": 10922436, "99.90 percentile latency (ns)": 54054283, "Max latency (ns)": 98608219, "Mean latency (ns)": 4863622, "Min duration satisfied": "Yes", "Min latency (ns)": 4018173, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 204.67, "QPS w/o loadgen overhead": 205.61, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 5.476482, "characteristics.90th_percentile_latency_ns": 5476482.0, "characteristics.90th_percentile_latency_s": 0.005476482, "characteristics.90th_percentile_latency_us": 5476.482, "characteristics.accuracy": 66.604, "characteristics.good": 33302, "characteristics.power": 0.13143401573264293, "characteristics.power.normalized_per_core": 0.0010952834644386911, "characteristics.power.normalized_per_processor": 0.13143401573264293, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-1.0-128-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-1.0-128-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_1.0_128.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 200, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "9a6bab9a6455cb50", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 6883796, "90.00 percentile latency (ns)": 8377014, "90th percentile latency (ns)": 8377014, "95.00 percentile latency (ns)": 10224424, "97.00 percentile latency (ns)": 12021752, "99.00 percentile latency (ns)": 16800749, "99.90 percentile latency (ns)": 65809241, "Max latency (ns)": 85384163, "Mean latency (ns)": 7544478, "Min duration satisfied": "Yes", "Min latency (ns)": 6297145, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 132.24, "QPS w/o loadgen overhead": 132.55, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 8.377014, "characteristics.90th_percentile_latency_ns": 8377014.0, "characteristics.90th_percentile_latency_s": 0.008377014, "characteristics.90th_percentile_latency_us": 8377.014, "characteristics.accuracy": 69.106, "characteristics.good": 34553, "characteristics.power": 0.19748860691852427, "characteristics.power.normalized_per_core": 0.0016457383909877022, "characteristics.power.normalized_per_processor": 0.19748860691852427, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-1.0-160-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-1.0-160-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_1.0_160.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 200, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "06f9bb8477fb082b", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 2700409, "90.00 percentile latency (ns)": 3094475, "90th percentile latency (ns)": 3094475, "95.00 percentile latency (ns)": 3756230, "97.00 percentile latency (ns)": 4688530, "99.00 percentile latency (ns)": 7412361, "99.90 percentile latency (ns)": 31629666, "Max latency (ns)": 129703256, "Mean latency (ns)": 2986152, "Min duration satisfied": "Yes", "Min latency (ns)": 2375146, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 333.41, "QPS w/o loadgen overhead": 334.88, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 3.094475, "characteristics.90th_percentile_latency_ns": 3094475.0, "characteristics.90th_percentile_latency_s": 0.003094475, "characteristics.90th_percentile_latency_us": 3094.475, "characteristics.accuracy": 59.822, "characteristics.good": 29911, "characteristics.power": 0.06978711151901237, "characteristics.power.normalized_per_core": 0.0005815592626584365, "characteristics.power.normalized_per_processor": 0.06978711151901237, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-96-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-0.75-96-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.75_96.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "1b89af5c5d598997", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 4619376, "90.00 percentile latency (ns)": 5305251, "90th percentile latency (ns)": 5305251, "95.00 percentile latency (ns)": 6239929, "97.00 percentile latency (ns)": 7514482, "99.00 percentile latency (ns)": 11782674, "99.90 percentile latency (ns)": 52385660, "Max latency (ns)": 114098887, "Mean latency (ns)": 5022017, "Min duration satisfied": "Yes", "Min latency (ns)": 4153645, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 198.35, "QPS w/o loadgen overhead": 199.12, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 5.305251, "characteristics.90th_percentile_latency_ns": 5305251.0, "characteristics.90th_percentile_latency_s": 0.005305251, "characteristics.90th_percentile_latency_us": 5305.251, "characteristics.accuracy": 68.336, "characteristics.good": 34168, "characteristics.power": 0.11993390404743177, "characteristics.power.normalized_per_core": 0.0009994492003952647, "characteristics.power.normalized_per_processor": 0.11993390404743177, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-small_224_1.0_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v3-small_224_1.0_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-small_224_1.0_float.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 166.667, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "a38a7744dc38f27e", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 6408609, "90.00 percentile latency (ns)": 10233899, "90th percentile latency (ns)": 10233899, "95.00 percentile latency (ns)": 11816274, "97.00 percentile latency (ns)": 12850753, "99.00 percentile latency (ns)": 16243416, "99.90 percentile latency (ns)": 75792104, "Max latency (ns)": 131115531, "Mean latency (ns)": 7547977, "Min duration satisfied": "Yes", "Min latency (ns)": 5532409, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 132.12, "QPS w/o loadgen overhead": 132.49, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 10.233899, "characteristics.90th_percentile_latency_ns": 10233899.0, "characteristics.90th_percentile_latency_s": 0.010233899, "characteristics.90th_percentile_latency_us": 10233.899, "characteristics.accuracy": 68.834, "characteristics.good": 34417, "characteristics.power": 0.18461318196152654, "characteristics.power.normalized_per_core": 0.001538443183012721, "characteristics.power.normalized_per_processor": 0.18461318196152654, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-192-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-0.75-192-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.75_192.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "d0d444cf4c4717b7", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 13813975, "90.00 percentile latency (ns)": 20706785, "90th percentile latency (ns)": 20706785, "95.00 percentile latency (ns)": 21374353, "97.00 percentile latency (ns)": 21940975, "99.00 percentile latency (ns)": 30072408, "99.90 percentile latency (ns)": 76406162, "Max latency (ns)": 105469132, "Mean latency (ns)": 15895506, "Min duration satisfied": "Yes", "Min latency (ns)": 12737234, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 62.86, "QPS w/o loadgen overhead": 62.91, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 20.706785, "characteristics.90th_percentile_latency_ns": 20706785.0, "characteristics.90th_percentile_latency_s": 0.020706785, "characteristics.90th_percentile_latency_us": 20706.785, "characteristics.accuracy": 71.19, "characteristics.good": 35595, "characteristics.power": 0.33310636384269976, "characteristics.power.normalized_per_core": 0.0027758863653558315, "characteristics.power.normalized_per_processor": 0.33310636384269976, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite0-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "efficientnet-lite0-quantized", "input_data_types": "uint8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite0.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 50, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "8a54cb0413dbf4d1", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 31470866, "90.00 percentile latency (ns)": 42720272, "90th percentile latency (ns)": 42720272, "95.00 percentile latency (ns)": 46836714, "97.00 percentile latency (ns)": 48511990, "99.00 percentile latency (ns)": 56649510, "99.90 percentile latency (ns)": 102651561, "Max latency (ns)": 147487515, "Mean latency (ns)": 34598096, "Min duration satisfied": "Yes", "Min latency (ns)": 28584271, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 28.89, "QPS w/o loadgen overhead": 28.9, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 42.720272, "characteristics.90th_percentile_latency_ns": 42720272.0, "characteristics.90th_percentile_latency_s": 0.042720272, "characteristics.90th_percentile_latency_us": 42720.272, "characteristics.accuracy": 79.268, "characteristics.good": 39634, "characteristics.power": 0.958766485155427, "characteristics.power.normalized_per_core": 0.007989720709628558, "characteristics.power.normalized_per_processor": 0.958766485155427, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite3-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "efficientnet-lite3-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite3.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 50, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "90c448fbab575c79", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 4190750, "90.00 percentile latency (ns)": 4911710, "90th percentile latency (ns)": 4911710, "95.00 percentile latency (ns)": 5879947, "97.00 percentile latency (ns)": 7038303, "99.00 percentile latency (ns)": 10796201, "99.90 percentile latency (ns)": 48957002, "Max latency (ns)": 115493842, "Mean latency (ns)": 4571596, "Min duration satisfied": "Yes", "Min latency (ns)": 3687015, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 217.88, "QPS w/o loadgen overhead": 218.74, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 4.91171, "characteristics.90th_percentile_latency_ns": 4911710.0, "characteristics.90th_percentile_latency_s": 0.00491171, "characteristics.90th_percentile_latency_us": 4911.71, "characteristics.accuracy": 66.216, "characteristics.good": 33108, "characteristics.power": 0.10671707552149078, "characteristics.power.normalized_per_core": 0.0008893089626790898, "characteristics.power.normalized_per_processor": 0.10671707552149078, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-small_224_0.75_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v3-small_224_0.75_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-small_224_0.75_float.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 166.667, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "f074e9ba8f508a41", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 43414374, "90.00 percentile latency (ns)": 54639225, "90th percentile latency (ns)": 54639225, "95.00 percentile latency (ns)": 57335837, "97.00 percentile latency (ns)": 59572022, "99.00 percentile latency (ns)": 69197931, "99.90 percentile latency (ns)": 114044467, "Max latency (ns)": 180294879, "Mean latency (ns)": 46167418, "Min duration satisfied": "Yes", "Min latency (ns)": 39070500, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 21.65, "QPS w/o loadgen overhead": 21.66, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 54.639225, "characteristics.90th_percentile_latency_ns": 54639225.0, "characteristics.90th_percentile_latency_s": 0.054639225, "characteristics.90th_percentile_latency_us": 54639.225, "characteristics.accuracy": 76.344, "characteristics.good": 38172, "characteristics.power": 0.9798505532669538, "characteristics.power.normalized_per_core": 0.008165421277224616, "characteristics.power.normalized_per_processor": 0.9798505532669538, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite3-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "efficientnet-lite3-quantized", "input_data_types": "uint8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite3.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 50, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "9231d44c19a4a2dc", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 3613564, "90.00 percentile latency (ns)": 4697962, "90th percentile latency (ns)": 4697962, "95.00 percentile latency (ns)": 5982688, "97.00 percentile latency (ns)": 7432318, "99.00 percentile latency (ns)": 10462111, "99.90 percentile latency (ns)": 41091962, "Max latency (ns)": 118523831, "Mean latency (ns)": 4072582, "Min duration satisfied": "Yes", "Min latency (ns)": 3177287, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 245.08, "QPS w/o loadgen overhead": 245.54, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 4.697962, "characteristics.90th_percentile_latency_ns": 4697962.0, "characteristics.90th_percentile_latency_s": 0.004697962, "characteristics.90th_percentile_latency_us": 4697.962, "characteristics.accuracy": 54.568, "characteristics.good": 27284, "characteristics.power": 0.08097747438973307, "characteristics.power.normalized_per_core": 0.0006748122865811089, "characteristics.power.normalized_per_processor": 0.08097747438973307, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-160-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-0.35-160-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_160_35.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "8e9ac748eb825354", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 2457198, "90.00 percentile latency (ns)": 2711065, "90th percentile latency (ns)": 2711065, "95.00 percentile latency (ns)": 3340437, "97.00 percentile latency (ns)": 3802250, "99.00 percentile latency (ns)": 5780354, "99.90 percentile latency (ns)": 33881325, "Max latency (ns)": 77816860, "Mean latency (ns)": 2671392, "Min duration satisfied": "Yes", "Min latency (ns)": 2100317, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 373.46, "QPS w/o loadgen overhead": 374.34, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 2.711065, "characteristics.90th_percentile_latency_ns": 2711065.0, "characteristics.90th_percentile_latency_s": 0.002711065, "characteristics.90th_percentile_latency_us": 2711.065, "characteristics.accuracy": 49.478, "characteristics.good": 24739, "characteristics.power": 0.06124889100720644, "characteristics.power.normalized_per_core": 0.0005104074250600536, "characteristics.power.normalized_per_processor": 0.06124889100720644, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.25-192-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-0.25-192-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.25_192.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 500, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "9e75938b4b4d4c9c", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 9988839, "90.00 percentile latency (ns)": 12320530, "90th percentile latency (ns)": 12320530, "95.00 percentile latency (ns)": 15244269, "97.00 percentile latency (ns)": 16586074, "99.00 percentile latency (ns)": 24837705, "99.90 percentile latency (ns)": 70659830, "Max latency (ns)": 96220956, "Mean latency (ns)": 10877151, "Min duration satisfied": "Yes", "Min latency (ns)": 9148035, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 91.85, "QPS w/o loadgen overhead": 91.94, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 12.32053, "characteristics.90th_percentile_latency_ns": 12320530.0, "characteristics.90th_percentile_latency_s": 0.01232053, "characteristics.90th_percentile_latency_us": 12320.53, "characteristics.accuracy": 68.126, "characteristics.good": 34063, "characteristics.power": 0.2224353816600375, "characteristics.power.normalized_per_core": 0.0018536281805003126, "characteristics.power.normalized_per_processor": 0.2224353816600375, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.75-224-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-0.75-224-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.75_224_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 200, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "3959e116c4e909be", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 9259048, "90.00 percentile latency (ns)": 11655958, "90th percentile latency (ns)": 11655958, "95.00 percentile latency (ns)": 14440246, "97.00 percentile latency (ns)": 16079392, "99.00 percentile latency (ns)": 24294201, "99.90 percentile latency (ns)": 84365622, "Max latency (ns)": 123385970, "Mean latency (ns)": 10177933, "Min duration satisfied": "Yes", "Min latency (ns)": 8653804, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 98.09, "QPS w/o loadgen overhead": 98.25, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 11.655958, "characteristics.90th_percentile_latency_ns": 11655958.0, "characteristics.90th_percentile_latency_s": 0.011655958, "characteristics.90th_percentile_latency_us": 11655.958, "characteristics.accuracy": 75.76, "characteristics.good": 37880, "characteristics.power": 0.2562544326195942, "characteristics.power.normalized_per_core": 0.0021354536051632848, "characteristics.power.normalized_per_processor": 0.2562544326195942, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-large_224_1.0_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v3-large_224_1.0_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-large_224_1.0_float.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 166.667, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "b478bb49d131fcc6", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 5683855, "90.00 percentile latency (ns)": 7933582, "90th percentile latency (ns)": 7933582, "95.00 percentile latency (ns)": 9762811, "97.00 percentile latency (ns)": 11147510, "99.00 percentile latency (ns)": 13908586, "99.90 percentile latency (ns)": 73532353, "Max latency (ns)": 148892361, "Mean latency (ns)": 6439037, "Min duration satisfied": "Yes", "Min latency (ns)": 4987603, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 154.84, "QPS w/o loadgen overhead": 155.3, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 7.933582, "characteristics.90th_percentile_latency_ns": 7933582.0, "characteristics.90th_percentile_latency_s": 0.007933582, "characteristics.90th_percentile_latency_us": 7933.582, "characteristics.accuracy": 65.75, "characteristics.good": 32875, "characteristics.power": 0.15582741324377872, "characteristics.power.normalized_per_core": 0.0012985617770314892, "characteristics.power.normalized_per_processor": 0.15582741324377872, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-0.5-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.5_224.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "45bbfdad2ab23164", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 6701845, "90.00 percentile latency (ns)": 8383554, "90th percentile latency (ns)": 8383554, "95.00 percentile latency (ns)": 9979500, "97.00 percentile latency (ns)": 11779352, "99.00 percentile latency (ns)": 16705667, "99.90 percentile latency (ns)": 64145641, "Max latency (ns)": 81521707, "Mean latency (ns)": 7312294, "Min duration satisfied": "Yes", "Min latency (ns)": 6026582, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 136.57, "QPS w/o loadgen overhead": 136.76, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 8.383554, "characteristics.90th_percentile_latency_ns": 8383554.0, "characteristics.90th_percentile_latency_s": 0.008383554, "characteristics.90th_percentile_latency_us": 8383.554, "characteristics.accuracy": 64.768, "characteristics.good": 32384, "characteristics.power": 0.1476243824810107, "characteristics.power.normalized_per_core": 0.0012302031873417558, "characteristics.power.normalized_per_processor": 0.1476243824810107, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-1.0-128-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-1.0-128-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_1.0_128_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 200, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "f28ac02f8a464cb0", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 8247874, "90.00 percentile latency (ns)": 13254307, "90th percentile latency (ns)": 13254307, "95.00 percentile latency (ns)": 14718119, "97.00 percentile latency (ns)": 15486069, "99.00 percentile latency (ns)": 23594050, "99.90 percentile latency (ns)": 82583648, "Max latency (ns)": 131854820, "Mean latency (ns)": 9658512, "Min duration satisfied": "Yes", "Min latency (ns)": 7160239, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 103.33, "QPS w/o loadgen overhead": 103.54, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 13.254307, "characteristics.90th_percentile_latency_ns": 13254307.0, "characteristics.90th_percentile_latency_s": 0.013254307, "characteristics.90th_percentile_latency_us": 13254.307, "characteristics.accuracy": 70.122, "characteristics.good": 35061, "characteristics.power": 0.2393135139145611, "characteristics.power.normalized_per_core": 0.0019942792826213424, "characteristics.power.normalized_per_processor": 0.2393135139145611, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-0.75-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.75_224.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "da308149bea5bea7", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 6202502, "90.00 percentile latency (ns)": 7734703, "90th percentile latency (ns)": 7734703, "95.00 percentile latency (ns)": 9641347, "97.00 percentile latency (ns)": 11474500, "99.00 percentile latency (ns)": 14579694, "99.90 percentile latency (ns)": 60247568, "Max latency (ns)": 79071759, "Mean latency (ns)": 6806530, "Min duration satisfied": "Yes", "Min latency (ns)": 5503369, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 146.71, "QPS w/o loadgen overhead": 146.92, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 7.734703, "characteristics.90th_percentile_latency_ns": 7734703.0, "characteristics.90th_percentile_latency_s": 0.007734703, "characteristics.90th_percentile_latency_us": 7734.703, "characteristics.accuracy": 64.08, "characteristics.good": 32040, "characteristics.power": 0.13822183598586846, "characteristics.power.normalized_per_core": 0.0011518486332155705, "characteristics.power.normalized_per_processor": 0.13822183598586846, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.75-160-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-0.75-160-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.75_160_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 200, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "8a01f54127f7959b", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 4272020, "90.00 percentile latency (ns)": 5016693, "90th percentile latency (ns)": 5016693, "95.00 percentile latency (ns)": 5979871, "97.00 percentile latency (ns)": 7222096, "99.00 percentile latency (ns)": 11026353, "99.90 percentile latency (ns)": 45941030, "Max latency (ns)": 129411756, "Mean latency (ns)": 4662841, "Min duration satisfied": "Yes", "Min latency (ns)": 3737115, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 213.77, "QPS w/o loadgen overhead": 214.46, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 5.016693, "characteristics.90th_percentile_latency_ns": 5016693.0, "characteristics.90th_percentile_latency_s": 0.005016693, "characteristics.90th_percentile_latency_us": 5016.693, "characteristics.accuracy": 64.282, "characteristics.good": 32141, "characteristics.power": 0.11072741731767792, "characteristics.power.normalized_per_core": 0.000922728477647316, "characteristics.power.normalized_per_processor": 0.11072741731767792, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-192-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-0.5-192-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.5_192.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "835c4c1f8ce7ebfc", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 7446929, "90.00 percentile latency (ns)": 9102716, "90th percentile latency (ns)": 9102716, "95.00 percentile latency (ns)": 11797846, "97.00 percentile latency (ns)": 13773039, "99.00 percentile latency (ns)": 18643532, "99.90 percentile latency (ns)": 78123440, "Max latency (ns)": 124748973, "Mean latency (ns)": 8213634, "Min duration satisfied": "Yes", "Min latency (ns)": 6851446, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 121.43, "QPS w/o loadgen overhead": 121.75, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 9.102716, "characteristics.90th_percentile_latency_ns": 9102716.0, "characteristics.90th_percentile_latency_s": 0.009102716, "characteristics.90th_percentile_latency_us": 9102.716, "characteristics.accuracy": 72.678, "characteristics.good": 36339, "characteristics.power": 0.2078457289839437, "characteristics.power.normalized_per_core": 0.0017320477415328642, "characteristics.power.normalized_per_processor": 0.2078457289839437, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-large-minimalistic_224_1.0_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v3-large-minimalistic_224_1.0_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-large-minimalistic_224_1.0_float.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 166.667, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "f5ad4433413444fd", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 6349189, "90.00 percentile latency (ns)": 9507336, "90th percentile latency (ns)": 9507336, "95.00 percentile latency (ns)": 12269780, "97.00 percentile latency (ns)": 13384653, "99.00 percentile latency (ns)": 16090393, "99.90 percentile latency (ns)": 74508995, "Max latency (ns)": 134802278, "Mean latency (ns)": 7270800, "Min duration satisfied": "Yes", "Min latency (ns)": 5648289, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 137.37, "QPS w/o loadgen overhead": 137.54, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 9.507336, "characteristics.90th_percentile_latency_ns": 9507336.0, "characteristics.90th_percentile_latency_s": 0.009507336, "characteristics.90th_percentile_latency_us": 9507.336, "characteristics.accuracy": 64.972, "characteristics.good": 32486, "characteristics.power": 0.14546201256945954, "characteristics.power.normalized_per_core": 0.0012121834380788294, "characteristics.power.normalized_per_processor": 0.14546201256945954, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-160-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-0.75-160-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_160_75.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "1cf4c04839a00d13", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 9166415, "90.00 percentile latency (ns)": 13995445, "90th percentile latency (ns)": 13995445, "95.00 percentile latency (ns)": 15629134, "97.00 percentile latency (ns)": 16509242, "99.00 percentile latency (ns)": 25462351, "99.90 percentile latency (ns)": 86192017, "Max latency (ns)": 127894700, "Mean latency (ns)": 10510643, "Min duration satisfied": "Yes", "Min latency (ns)": 8293926, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 94.97, "QPS w/o loadgen overhead": 95.14, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 13.995445, "characteristics.90th_percentile_latency_ns": 13995445.0, "characteristics.90th_percentile_latency_s": 0.013995445, "characteristics.90th_percentile_latency_us": 13995.445, "characteristics.accuracy": 71.77, "characteristics.good": 35885, "characteristics.power": 0.2707006995412441, "characteristics.power.normalized_per_core": 0.0022558391628437007, "characteristics.power.normalized_per_processor": 0.2707006995412441, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-1.0-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_1.0_224.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "f5873483db8739bf", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 4933922, "90.00 percentile latency (ns)": 7797315, "90th percentile latency (ns)": 7797315, "95.00 percentile latency (ns)": 9506099, "97.00 percentile latency (ns)": 10729883, "99.00 percentile latency (ns)": 12885174, "99.90 percentile latency (ns)": 68088157, "Max latency (ns)": 129310893, "Mean latency (ns)": 5789391, "Min duration satisfied": "Yes", "Min latency (ns)": 4143552, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 172.14, "QPS w/o loadgen overhead": 172.73, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 7.797315, "characteristics.90th_percentile_latency_ns": 7797315.0, "characteristics.90th_percentile_latency_s": 0.007797315, "characteristics.90th_percentile_latency_us": 7797.315, "characteristics.accuracy": 66.75, "characteristics.good": 33375, "characteristics.power": 0.14102882857762503, "characteristics.power.normalized_per_core": 0.0011752402381468752, "characteristics.power.normalized_per_processor": 0.14102882857762503, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-160-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-0.75-160-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.75_160.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "94a0d36b628e6a2c", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 1756273, "90.00 percentile latency (ns)": 2016892, "90th percentile latency (ns)": 2016892, "95.00 percentile latency (ns)": 2393389, "97.00 percentile latency (ns)": 2989833, "99.00 percentile latency (ns)": 4708728, "99.90 percentile latency (ns)": 23756256, "Max latency (ns)": 104490008, "Mean latency (ns)": 1919009, "Min duration satisfied": "Yes", "Min latency (ns)": 1310140, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 519.27, "QPS w/o loadgen overhead": 521.1, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 2.016892, "characteristics.90th_percentile_latency_ns": 2016892.0, "characteristics.90th_percentile_latency_s": 0.002016892, "characteristics.90th_percentile_latency_us": 2016.892, "characteristics.accuracy": 47.14, "characteristics.good": 23570, "characteristics.power": 0.04145386956918057, "characteristics.power.normalized_per_core": 0.00034544891307650475, "characteristics.power.normalized_per_processor": 0.04145386956918057, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-96-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-0.35-96-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.35_96.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "f31435499984a478", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 2918155, "90.00 percentile latency (ns)": 3288427, "90th percentile latency (ns)": 3288427, "95.00 percentile latency (ns)": 3887513, "97.00 percentile latency (ns)": 4458859, "99.00 percentile latency (ns)": 6813340, "99.90 percentile latency (ns)": 33989565, "Max latency (ns)": 127548628, "Mean latency (ns)": 3159451, "Min duration satisfied": "Yes", "Min latency (ns)": 2424800, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 315.22, "QPS w/o loadgen overhead": 316.51, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 3.288427, "characteristics.90th_percentile_latency_ns": 3288427.0, "characteristics.90th_percentile_latency_s": 0.003288427, "characteristics.90th_percentile_latency_us": 3288.427, "characteristics.accuracy": 56.988, "characteristics.good": 28494, "characteristics.power": 0.07223318454882977, "characteristics.power.normalized_per_core": 0.0006019432045735813, "characteristics.power.normalized_per_processor": 0.07223318454882977, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-160-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-0.35-160-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.35_160.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "8c48adacc95334f9", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 3073165, "90.00 percentile latency (ns)": 3740908, "90th percentile latency (ns)": 3740908, "95.00 percentile latency (ns)": 4767984, "97.00 percentile latency (ns)": 5522192, "99.00 percentile latency (ns)": 8243549, "99.90 percentile latency (ns)": 39900496, "Max latency (ns)": 80866685, "Mean latency (ns)": 3405683, "Min duration satisfied": "Yes", "Min latency (ns)": 2764482, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 292.48, "QPS w/o loadgen overhead": 293.63, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 3.740908, "characteristics.90th_percentile_latency_ns": 3740908.0, "characteristics.90th_percentile_latency_s": 0.003740908, "characteristics.90th_percentile_latency_us": 3740.908, "characteristics.accuracy": 63.716, "characteristics.good": 31858, "characteristics.power": 0.08846718431420815, "characteristics.power.normalized_per_core": 0.0007372265359517346, "characteristics.power.normalized_per_processor": 0.08846718431420815, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.75-128-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v1-0.75-128-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.75_128.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 200, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "3519eedc512975fe", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 3314159, "90.00 percentile latency (ns)": 3877601, "90th percentile latency (ns)": 3877601, "95.00 percentile latency (ns)": 4813913, "97.00 percentile latency (ns)": 5623902, "99.00 percentile latency (ns)": 9230497, "99.90 percentile latency (ns)": 34872865, "Max latency (ns)": 128444115, "Mean latency (ns)": 3648134, "Min duration satisfied": "Yes", "Min latency (ns)": 2894146, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 273.68, "QPS w/o loadgen overhead": 274.11, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 3.877601, "characteristics.90th_percentile_latency_ns": 3877601.0, "characteristics.90th_percentile_latency_s": 0.003877601, "characteristics.90th_percentile_latency_us": 3877.601, "characteristics.accuracy": 55.54, "characteristics.good": 27770, "characteristics.power": 0.07152873945403994, "characteristics.power.normalized_per_core": 0.0005960728287836662, "characteristics.power.normalized_per_processor": 0.07152873945403994, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-128-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-0.5-128-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_128_50.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "a9764ee99c90c3e0", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 3589285, "90.00 percentile latency (ns)": 4380112, "90th percentile latency (ns)": 4380112, "95.00 percentile latency (ns)": 5313444, "97.00 percentile latency (ns)": 6337879, "99.00 percentile latency (ns)": 9495915, "99.90 percentile latency (ns)": 36858415, "Max latency (ns)": 133198777, "Mean latency (ns)": 3955704, "Min duration satisfied": "Yes", "Min latency (ns)": 3099381, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 251.71, "QPS w/o loadgen overhead": 252.8, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 4.380112, "characteristics.90th_percentile_latency_ns": 4380112.0, "characteristics.90th_percentile_latency_s": 0.004380112, "characteristics.90th_percentile_latency_us": 4380.112, "characteristics.accuracy": 59.322, "characteristics.good": 29661, "characteristics.power": 0.0926330488812611, "characteristics.power.normalized_per_core": 0.0007719420740105092, "characteristics.power.normalized_per_processor": 0.0926330488812611, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-192-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 120, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "mobilenet-v2-0.35-192-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.35_192.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "0cba94daf145a98c", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 34532907, "90.00 percentile latency (ns)": 39326003, "90th percentile latency (ns)": 39326003, "95.00 percentile latency (ns)": 45953876, "97.00 percentile latency (ns)": 54877565, "99.00 percentile latency (ns)": 98724154, "99.90 percentile latency (ns)": 120949711, "Max latency (ns)": 136593332, "Mean latency (ns)": 36664927, "Min duration satisfied": "Yes", "Min latency (ns)": 33392916, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 27.26, "QPS w/o loadgen overhead": 27.27, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 39.326003, "characteristics.90th_percentile_latency_ns": 39326003.0, "characteristics.90th_percentile_latency_s": 0.039326003, "characteristics.90th_percentile_latency_us": 39326.003, "characteristics.accuracy": 68.242, "characteristics.good": 34121, "characteristics.power": 0.2528117437152317, "characteristics.power.normalized_per_core": 0.002106764530960264, "characteristics.power.normalized_per_processor": 0.2528117437152317, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.75-192-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.75-192-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.75_192.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 27.027, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "ce21ccb4644c1a9a", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 43773134, "90.00 percentile latency (ns)": 51124924, "90th percentile latency (ns)": 51124924, "95.00 percentile latency (ns)": 59814121, "97.00 percentile latency (ns)": 66967734, "99.00 percentile latency (ns)": 123343971, "99.90 percentile latency (ns)": 169708038, "Max latency (ns)": 191882174, "Mean latency (ns)": 46643029, "Min duration satisfied": "Yes", "Min latency (ns)": 42852081, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 21.43, "QPS w/o loadgen overhead": 21.44, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 51.124924, "characteristics.90th_percentile_latency_ns": 51124924.0, "characteristics.90th_percentile_latency_s": 0.051124924, "characteristics.90th_percentile_latency_us": 51124.924, "characteristics.accuracy": 70.738, "characteristics.good": 35369, "characteristics.power": 0.3136123944187765, "characteristics.power.normalized_per_core": 0.0026134366201564707, "characteristics.power.normalized_per_processor": 0.3136123944187765, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-192-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-1.0-192-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_1.0_192.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 22.2222, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "4310842e08f4dc27", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 162527843, "90.00 percentile latency (ns)": 182276944, "90th percentile latency (ns)": 182276944, "95.00 percentile latency (ns)": 184623681, "97.00 percentile latency (ns)": 186921712, "99.00 percentile latency (ns)": 200297956, "99.90 percentile latency (ns)": 313507522, "Max latency (ns)": 323690308, "Mean latency (ns)": 167799895, "Min duration satisfied": "Yes", "Min latency (ns)": 160589951, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 5.96, "QPS w/o loadgen overhead": 5.96, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 182.276944, "characteristics.90th_percentile_latency_ns": 182276944.0, "characteristics.90th_percentile_latency_s": 0.182276944, "characteristics.90th_percentile_latency_us": 182276.944, "characteristics.accuracy": 78.514, "characteristics.good": 39257, "characteristics.power": 1.2648425428983519, "characteristics.power.normalized_per_core": 0.010540354524152933, "characteristics.power.normalized_per_processor": 1.2648425428983519, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite4-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "efficientnet-lite4-quantized", "input_data_types": "uint8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite4.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 5.91716, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "d4bf586825e4c17c", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 12007086, "90.00 percentile latency (ns)": 12854829, "90th percentile latency (ns)": 12854829, "95.00 percentile latency (ns)": 15280328, "97.00 percentile latency (ns)": 18836620, "99.00 percentile latency (ns)": 36646158, "99.90 percentile latency (ns)": 127101501, "Max latency (ns)": 149966587, "Mean latency (ns)": 13009009, "Min duration satisfied": "Yes", "Min latency (ns)": 11189312, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 76.6, "QPS w/o loadgen overhead": 76.87, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 12.854829, "characteristics.90th_percentile_latency_ns": 12854829.0, "characteristics.90th_percentile_latency_s": 0.012854829, "characteristics.90th_percentile_latency_us": 12854.829, "characteristics.accuracy": 63.542, "characteristics.good": 31771, "characteristics.power": 0.09363496595460033, "characteristics.power.normalized_per_core": 0.0007802913829550028, "characteristics.power.normalized_per_processor": 0.09363496595460033, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-224-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.5-224-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_224_50.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 76.9231, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "1edf6f8ff4f1b831", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 8576081, "90.00 percentile latency (ns)": 9265739, "90th percentile latency (ns)": 9265739, "95.00 percentile latency (ns)": 9942817, "97.00 percentile latency (ns)": 12766893, "99.00 percentile latency (ns)": 27992931, "99.90 percentile latency (ns)": 113449609, "Max latency (ns)": 133533685, "Mean latency (ns)": 9296090, "Min duration satisfied": "Yes", "Min latency (ns)": 7714359, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 106.79, "QPS w/o loadgen overhead": 107.57, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 9.265739, "characteristics.90th_percentile_latency_ns": 9265739.0, "characteristics.90th_percentile_latency_s": 0.009265739, "characteristics.90th_percentile_latency_us": 9265.739, "characteristics.accuracy": 52.172, "characteristics.good": 26086, "characteristics.power": 0.06213402377206775, "characteristics.power.normalized_per_core": 0.0005177835314338979, "characteristics.power.normalized_per_processor": 0.06213402377206775, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-128-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.35-128-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.35_128.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 111.111, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "cb3745e6d7e8e395", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 10270733, "90.00 percentile latency (ns)": 11133435, "90th percentile latency (ns)": 11133435, "95.00 percentile latency (ns)": 12503942, "97.00 percentile latency (ns)": 15686092, "99.00 percentile latency (ns)": 33600912, "99.90 percentile latency (ns)": 117713711, "Max latency (ns)": 191092379, "Mean latency (ns)": 11184176, "Min duration satisfied": "Yes", "Min latency (ns)": 9476083, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 89.04, "QPS w/o loadgen overhead": 89.41, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 11.133435, "characteristics.90th_percentile_latency_ns": 11133435.0, "characteristics.90th_percentile_latency_s": 0.011133435, "characteristics.90th_percentile_latency_us": 11133.435, "characteristics.accuracy": 58.402, "characteristics.good": 29201, "characteristics.power": 0.07523764705177627, "characteristics.power.normalized_per_core": 0.0006269803920981356, "characteristics.power.normalized_per_processor": 0.07523764705177627, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-128-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.5-128-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.5_128.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 90.9091, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "a943c174334b59ed", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 22509615, "90.00 percentile latency (ns)": 23396379, "90th percentile latency (ns)": 23396379, "95.00 percentile latency (ns)": 27682763, "97.00 percentile latency (ns)": 32576571, "99.00 percentile latency (ns)": 49340640, "99.90 percentile latency (ns)": 138339465, "Max latency (ns)": 154939383, "Mean latency (ns)": 23898280, "Min duration satisfied": "Yes", "Min latency (ns)": 21913670, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 41.78, "QPS w/o loadgen overhead": 41.84, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 23.396379, "characteristics.90th_percentile_latency_ns": 23396379.0, "characteristics.90th_percentile_latency_s": 0.023396379, "characteristics.90th_percentile_latency_us": 23396.379, "characteristics.accuracy": 60.976, "characteristics.good": 30488, "characteristics.power": 0.1519611010983697, "characteristics.power.normalized_per_core": 0.0012663425091530808, "characteristics.power.normalized_per_processor": 0.1519611010983697, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.35-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.35_224.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 43.4783, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "8d92983dff1fdc18", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 3881768, "90.00 percentile latency (ns)": 4595420, "90th percentile latency (ns)": 4595420, "95.00 percentile latency (ns)": 4803786, "97.00 percentile latency (ns)": 4998022, "99.00 percentile latency (ns)": 12090695, "99.90 percentile latency (ns)": 62218277, "Max latency (ns)": 97802116, "Mean latency (ns)": 4300641, "Min duration satisfied": "Yes", "Min latency (ns)": 3348335, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 230.48, "QPS w/o loadgen overhead": 232.52, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 4.59542, "characteristics.90th_percentile_latency_ns": 4595420.0, "characteristics.90th_percentile_latency_s": 0.00459542, "characteristics.90th_percentile_latency_us": 4595.42, "characteristics.accuracy": 48.162, "characteristics.good": 24081, "characteristics.power": 0.031002854886715673, "characteristics.power.normalized_per_core": 0.0002583571240559639, "characteristics.power.normalized_per_processor": 0.031002854886715673, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.25-192-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.25-192-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.25_192_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 250, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "6b58894736a2a0c9", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 68114293, "90.00 percentile latency (ns)": 78796789, "90th percentile latency (ns)": 78796789, "95.00 percentile latency (ns)": 87000206, "97.00 percentile latency (ns)": 88519149, "99.00 percentile latency (ns)": 93004031, "99.90 percentile latency (ns)": 167370756, "Max latency (ns)": 205512779, "Mean latency (ns)": 70434336, "Min duration satisfied": "Yes", "Min latency (ns)": 66763035, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 14.19, "QPS w/o loadgen overhead": 14.2, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 78.796789, "characteristics.90th_percentile_latency_ns": 78796789.0, "characteristics.90th_percentile_latency_s": 0.078796789, "characteristics.90th_percentile_latency_us": 78796.789, "characteristics.accuracy": 75.068, "characteristics.good": 37534, "characteristics.power": 0.48549872002630456, "characteristics.power.normalized_per_core": 0.004045822666885871, "characteristics.power.normalized_per_processor": 0.48549872002630456, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite0-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "efficientnet-lite0-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite0.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 14.2857, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "e688b3ab236456a9", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 5010197, "90.00 percentile latency (ns)": 5623287, "90th percentile latency (ns)": 5623287, "95.00 percentile latency (ns)": 5872621, "97.00 percentile latency (ns)": 6443217, "99.00 percentile latency (ns)": 16735749, "99.90 percentile latency (ns)": 64558991, "Max latency (ns)": 108994418, "Mean latency (ns)": 5477952, "Min duration satisfied": "Yes", "Min latency (ns)": 4422893, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 181.1, "QPS w/o loadgen overhead": 182.55, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 5.623287, "characteristics.90th_percentile_latency_ns": 5623287.0, "characteristics.90th_percentile_latency_s": 0.005623287, "characteristics.90th_percentile_latency_us": 5623.287, "characteristics.accuracy": 50.242, "characteristics.good": 25121, "characteristics.power": 0.03940001325205407, "characteristics.power.normalized_per_core": 0.0003283334437671172, "characteristics.power.normalized_per_processor": 0.03940001325205407, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.25-224-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.25-224-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.25_224_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 142.857, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "f4057bb25f79447b", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 14008338, "90.00 percentile latency (ns)": 14763228, "90th percentile latency (ns)": 14763228, "95.00 percentile latency (ns)": 17497790, "97.00 percentile latency (ns)": 20131609, "99.00 percentile latency (ns)": 38395913, "99.90 percentile latency (ns)": 85823477, "Max latency (ns)": 113941198, "Mean latency (ns)": 14960283, "Min duration satisfied": "Yes", "Min latency (ns)": 13211273, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 66.73, "QPS w/o loadgen overhead": 66.84, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 14.763228, "characteristics.90th_percentile_latency_ns": 14763228.0, "characteristics.90th_percentile_latency_s": 0.014763228, "characteristics.90th_percentile_latency_us": 14763.228, "characteristics.accuracy": 60.842, "characteristics.good": 30421, "characteristics.power": 0.10272187646580154, "characteristics.power.normalized_per_core": 0.0008560156372150129, "characteristics.power.normalized_per_processor": 0.10272187646580154, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.5-160-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.5-160-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.5_160.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 66.6667, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "04a79bc4da482780", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 32675962, "90.00 percentile latency (ns)": 37019139, "90th percentile latency (ns)": 37019139, "95.00 percentile latency (ns)": 44514868, "97.00 percentile latency (ns)": 50852171, "99.00 percentile latency (ns)": 68343705, "99.90 percentile latency (ns)": 158531009, "Max latency (ns)": 171913564, "Mean latency (ns)": 34921442, "Min duration satisfied": "Yes", "Min latency (ns)": 31802194, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 28.61, "QPS w/o loadgen overhead": 28.64, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 37.019139, "characteristics.90th_percentile_latency_ns": 37019139.0, "characteristics.90th_percentile_latency_s": 0.037019139, "characteristics.90th_percentile_latency_us": 37019.139, "characteristics.accuracy": 69.016, "characteristics.good": 34508, "characteristics.power": 0.23622320636906985, "characteristics.power.normalized_per_core": 0.001968526719742249, "characteristics.power.normalized_per_processor": 0.23622320636906985, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-160-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-1.0-160-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_1.0_160.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 28.5714, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "51ce283f296d4b7d", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 47017344, "90.00 percentile latency (ns)": 52988872, "90th percentile latency (ns)": 52988872, "95.00 percentile latency (ns)": 65916160, "97.00 percentile latency (ns)": 69427968, "99.00 percentile latency (ns)": 73006935, "99.90 percentile latency (ns)": 174037873, "Max latency (ns)": 213172985, "Mean latency (ns)": 48963056, "Min duration satisfied": "Yes", "Min latency (ns)": 45652574, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 20.41, "QPS w/o loadgen overhead": 20.42, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 52.988872, "characteristics.90th_percentile_latency_ns": 52988872.0, "characteristics.90th_percentile_latency_s": 0.052988872, "characteristics.90th_percentile_latency_us": 52988.872, "characteristics.accuracy": 74.098, "characteristics.good": 37049, "characteristics.power": 0.36602038766942635, "characteristics.power.normalized_per_core": 0.0030501698972452197, "characteristics.power.normalized_per_processor": 0.36602038766942635, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite1-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "efficientnet-lite1-quantized", "input_data_types": "uint8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite1.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 20.4082, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "496c815ade3f4e73", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 8984906, "90.00 percentile latency (ns)": 9740225, "90th percentile latency (ns)": 9740225, "95.00 percentile latency (ns)": 10883906, "97.00 percentile latency (ns)": 13704323, "99.00 percentile latency (ns)": 30142370, "99.90 percentile latency (ns)": 122017957, "Max latency (ns)": 143097176, "Mean latency (ns)": 9728868, "Min duration satisfied": "Yes", "Min latency (ns)": 8429137, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 102.43, "QPS w/o loadgen overhead": 102.79, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 9.740225, "characteristics.90th_percentile_latency_ns": 9740225.0, "characteristics.90th_percentile_latency_s": 0.009740225, "characteristics.90th_percentile_latency_us": 9740.225, "characteristics.accuracy": 61.924, "characteristics.good": 30962, "characteristics.power": 0.06960576625827766, "characteristics.power.normalized_per_core": 0.0005800480521523138, "characteristics.power.normalized_per_processor": 0.06960576625827766, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-192-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.5-192-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_192_50.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 90.9091, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "1e4ab1dc0a4d2989", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 10276326, "90.00 percentile latency (ns)": 11014885, "90th percentile latency (ns)": 11014885, "95.00 percentile latency (ns)": 13102960, "97.00 percentile latency (ns)": 15888231, "99.00 percentile latency (ns)": 34197366, "99.90 percentile latency (ns)": 81389885, "Max latency (ns)": 124497129, "Mean latency (ns)": 11138885, "Min duration satisfied": "Yes", "Min latency (ns)": 9708112, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 89.5, "QPS w/o loadgen overhead": 89.78, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 11.014885, "characteristics.90th_percentile_latency_ns": 11014885.0, "characteristics.90th_percentile_latency_s": 0.011014885, "characteristics.90th_percentile_latency_us": 11014.885, "characteristics.accuracy": 62.298, "characteristics.good": 31149, "characteristics.power": 0.0808651383001152, "characteristics.power.normalized_per_core": 0.00067387615250096, "characteristics.power.normalized_per_processor": 0.0808651383001152, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.5-224-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.5-224-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.5_224_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 76.9231, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "0bcf1f1ced3d43ed", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 4138835, "90.00 percentile latency (ns)": 5018704, "90th percentile latency (ns)": 5018704, "95.00 percentile latency (ns)": 5212422, "97.00 percentile latency (ns)": 5422752, "99.00 percentile latency (ns)": 11750595, "99.90 percentile latency (ns)": 93535491, "Max latency (ns)": 132905439, "Mean latency (ns)": 4644423, "Min duration satisfied": "Yes", "Min latency (ns)": 3725641, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 213.31, "QPS w/o loadgen overhead": 215.31, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 5.018704, "characteristics.90th_percentile_latency_ns": 5018704.0, "characteristics.90th_percentile_latency_s": 0.005018704, "characteristics.90th_percentile_latency_us": 5018.704, "characteristics.accuracy": 49.12, "characteristics.good": 24560, "characteristics.power": 0.032919926804151206, "characteristics.power.normalized_per_core": 0.0002743327233679267, "characteristics.power.normalized_per_processor": 0.032919926804151206, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-128-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.35-128-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_128_35.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 200, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "7082d1449b1a952b", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 39765424, "90.00 percentile latency (ns)": 46728142, "90th percentile latency (ns)": 46728142, "95.00 percentile latency (ns)": 56157089, "97.00 percentile latency (ns)": 62053207, "99.00 percentile latency (ns)": 88323106, "99.90 percentile latency (ns)": 170060321, "Max latency (ns)": 181621239, "Mean latency (ns)": 42294699, "Min duration satisfied": "Yes", "Min latency (ns)": 38417804, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 23.63, "QPS w/o loadgen overhead": 23.64, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 46.728142, "characteristics.90th_percentile_latency_ns": 46728142.0, "characteristics.90th_percentile_latency_s": 0.046728142, "characteristics.90th_percentile_latency_us": 46728.142, "characteristics.accuracy": 73.584, "characteristics.good": 36792, "characteristics.power": 0.31140696103075344, "characteristics.power.normalized_per_core": 0.002595058008589612, "characteristics.power.normalized_per_processor": 0.31140696103075344, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.4-224-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-1.4-224-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_224_140.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 24.3902, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "945c4c5d4b8da323", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 28526194, "90.00 percentile latency (ns)": 32052356, "90th percentile latency (ns)": 32052356, "95.00 percentile latency (ns)": 39998975, "97.00 percentile latency (ns)": 47701080, "99.00 percentile latency (ns)": 74037843, "99.90 percentile latency (ns)": 117582515, "Max latency (ns)": 128979463, "Mean latency (ns)": 30419910, "Min duration satisfied": "Yes", "Min latency (ns)": 27629770, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 32.84, "QPS w/o loadgen overhead": 32.87, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 32.052356, "characteristics.90th_percentile_latency_ns": 32052356.0, "characteristics.90th_percentile_latency_s": 0.032052356, "characteristics.90th_percentile_latency_us": 32052.356, "characteristics.accuracy": 70.772, "characteristics.good": 35386, "characteristics.power": 0.22406147743973226, "characteristics.power.normalized_per_core": 0.0018671789786644355, "characteristics.power.normalized_per_processor": 0.22406147743973226, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-1.0-224-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-1.0-224-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_1.0_224_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 32.2581, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "bb80b2b0372d84eb", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 7099370, "90.00 percentile latency (ns)": 7383863, "90th percentile latency (ns)": 7383863, "95.00 percentile latency (ns)": 7712412, "97.00 percentile latency (ns)": 9051495, "99.00 percentile latency (ns)": 20210444, "99.90 percentile latency (ns)": 65845855, "Max latency (ns)": 87378124, "Mean latency (ns)": 7584050, "Min duration satisfied": "Yes", "Min latency (ns)": 6570139, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 131.55, "QPS w/o loadgen overhead": 131.86, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 7.383863, "characteristics.90th_percentile_latency_ns": 7383863.0, "characteristics.90th_percentile_latency_s": 0.007383863, "characteristics.90th_percentile_latency_us": 7383.863, "characteristics.accuracy": 47.808, "characteristics.good": 23904, "characteristics.power": 0.05026098678342653, "characteristics.power.normalized_per_core": 0.00041884155652855445, "characteristics.power.normalized_per_processor": 0.05026098678342653, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.25-160-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.25-160-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.25_160.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 125, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "f9627db16e4b1193", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 16839929, "90.00 percentile latency (ns)": 17821295, "90th percentile latency (ns)": 17821295, "95.00 percentile latency (ns)": 21972200, "97.00 percentile latency (ns)": 27797716, "99.00 percentile latency (ns)": 43438713, "99.90 percentile latency (ns)": 134727386, "Max latency (ns)": 169433832, "Mean latency (ns)": 18144616, "Min duration satisfied": "Yes", "Min latency (ns)": 15903748, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 54.99, "QPS w/o loadgen overhead": 55.11, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 17.821295, "characteristics.90th_percentile_latency_ns": 17821295.0, "characteristics.90th_percentile_latency_s": 0.017821295, "characteristics.90th_percentile_latency_us": 17821.295, "characteristics.accuracy": 64.038, "characteristics.good": 32019, "characteristics.power": 0.12244880020562364, "characteristics.power.normalized_per_core": 0.001020406668380197, "characteristics.power.normalized_per_processor": 0.12244880020562364, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-128-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.75-128-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.75_128.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 55.5556, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "8548c43d604503b9", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 13245614, "90.00 percentile latency (ns)": 13646700, "90th percentile latency (ns)": 13646700, "95.00 percentile latency (ns)": 14244816, "97.00 percentile latency (ns)": 16398472, "99.00 percentile latency (ns)": 38559352, "99.90 percentile latency (ns)": 83205152, "Max latency (ns)": 100191371, "Mean latency (ns)": 14007950, "Min duration satisfied": "Yes", "Min latency (ns)": 12576368, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 71.27, "QPS w/o loadgen overhead": 71.39, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 13.6467, "characteristics.90th_percentile_latency_ns": 13646700.0, "characteristics.90th_percentile_latency_s": 0.0136467, "characteristics.90th_percentile_latency_us": 13646.7, "characteristics.accuracy": 51.848, "characteristics.good": 25924, "characteristics.power": 0.08824521206117691, "characteristics.power.normalized_per_core": 0.0007353767671764743, "characteristics.power.normalized_per_processor": 0.08824521206117691, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.25-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.25-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.25_224.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 71.4286, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "3873e8a4170b61da", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 6977163, "90.00 percentile latency (ns)": 7320877, "90th percentile latency (ns)": 7320877, "95.00 percentile latency (ns)": 7654554, "97.00 percentile latency (ns)": 10741339, "99.00 percentile latency (ns)": 21305293, "99.90 percentile latency (ns)": 111350419, "Max latency (ns)": 137543602, "Mean latency (ns)": 7512169, "Min duration satisfied": "Yes", "Min latency (ns)": 6462432, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 132.79, "QPS w/o loadgen overhead": 133.12, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 7.320877, "characteristics.90th_percentile_latency_ns": 7320877.0, "characteristics.90th_percentile_latency_s": 0.007320877, "characteristics.90th_percentile_latency_us": 7320.877, "characteristics.accuracy": 59.226, "characteristics.good": 29613, "characteristics.power": 0.053534771640498524, "characteristics.power.normalized_per_core": 0.00044612309700415437, "characteristics.power.normalized_per_processor": 0.053534771640498524, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-160-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.5-160-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_160_50.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 125, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "d339011079e2d43c", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 15791993, "90.00 percentile latency (ns)": 16584791, "90th percentile latency (ns)": 16584791, "95.00 percentile latency (ns)": 20937862, "97.00 percentile latency (ns)": 26775939, "99.00 percentile latency (ns)": 41226422, "99.90 percentile latency (ns)": 88537686, "Max latency (ns)": 128347823, "Mean latency (ns)": 16971607, "Min duration satisfied": "Yes", "Min latency (ns)": 15018510, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 58.83, "QPS w/o loadgen overhead": 58.92, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 16.584791, "characteristics.90th_percentile_latency_ns": 16584791.0, "characteristics.90th_percentile_latency_s": 0.016584791, "characteristics.90th_percentile_latency_us": 16584.791, "characteristics.accuracy": 68.248, "characteristics.good": 34124, "characteristics.power": 0.1246548782774876, "characteristics.power.normalized_per_core": 0.0010387906523123967, "characteristics.power.normalized_per_processor": 0.1246548782774876, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-1.0-160-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-1.0-160-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_1.0_160_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 55.5556, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "5aaf5f478da9debc", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 6217528, "90.00 percentile latency (ns)": 6561392, "90th percentile latency (ns)": 6561392, "95.00 percentile latency (ns)": 6796458, "97.00 percentile latency (ns)": 9169612, "99.00 percentile latency (ns)": 17580889, "99.90 percentile latency (ns)": 113262179, "Max latency (ns)": 142245332, "Mean latency (ns)": 6700219, "Min duration satisfied": "Yes", "Min latency (ns)": 5747502, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 148.79, "QPS w/o loadgen overhead": 149.25, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 6.561392, "characteristics.90th_percentile_latency_ns": 6561392.0, "characteristics.90th_percentile_latency_s": 0.006561392, "characteristics.90th_percentile_latency_us": 6561.392, "characteristics.accuracy": 59.12, "characteristics.good": 29560, "characteristics.power": 0.04770806729842947, "characteristics.power.normalized_per_core": 0.0003975672274869122, "characteristics.power.normalized_per_processor": 0.04770806729842947, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-96-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-1.0-96-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_96_100.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 142.857, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "d11d40e4a5c75c62", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 6965805, "90.00 percentile latency (ns)": 7642010, "90th percentile latency (ns)": 7642010, "95.00 percentile latency (ns)": 7991353, "97.00 percentile latency (ns)": 10915038, "99.00 percentile latency (ns)": 24474601, "99.90 percentile latency (ns)": 70594598, "Max latency (ns)": 106032218, "Mean latency (ns)": 7613862, "Min duration satisfied": "Yes", "Min latency (ns)": 6437930, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 130.72, "QPS w/o loadgen overhead": 131.34, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 7.64201, "characteristics.90th_percentile_latency_ns": 7642010.0, "characteristics.90th_percentile_latency_s": 0.00764201, "characteristics.90th_percentile_latency_us": 7642.01, "characteristics.accuracy": 58.46, "characteristics.good": 29230, "characteristics.power": 0.05517774224887734, "characteristics.power.normalized_per_core": 0.0004598145187406445, "characteristics.power.normalized_per_processor": 0.05517774224887734, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.75-128-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.75-128-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.75_128_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 125, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "b40d59e416d84a3d", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 26134575, "90.00 percentile latency (ns)": 27921923, "90th percentile latency (ns)": 27921923, "95.00 percentile latency (ns)": 36715841, "97.00 percentile latency (ns)": 44841107, "99.00 percentile latency (ns)": 54223123, "99.90 percentile latency (ns)": 139575433, "Max latency (ns)": 159080482, "Mean latency (ns)": 27993647, "Min duration satisfied": "Yes", "Min latency (ns)": 25340018, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 35.68, "QPS w/o loadgen overhead": 35.72, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 27.921923, "characteristics.90th_percentile_latency_ns": 27921923.0, "characteristics.90th_percentile_latency_s": 0.027921923, "characteristics.90th_percentile_latency_us": 27921.923, "characteristics.accuracy": 72.91, "characteristics.good": 36455, "characteristics.power": 0.20234811662938576, "characteristics.power.normalized_per_core": 0.0016862343052448812, "characteristics.power.normalized_per_processor": 0.20234811662938576, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-large_224_1.0_uint8", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v3-large_224_1.0_uint8", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-large_224_1.0_uint8.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 35.7143, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "926e9e7d9aaf4856", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 24078488, "90.00 percentile latency (ns)": 25605844, "90th percentile latency (ns)": 25605844, "95.00 percentile latency (ns)": 33434938, "97.00 percentile latency (ns)": 41040640, "99.00 percentile latency (ns)": 51771559, "99.90 percentile latency (ns)": 146298114, "Max latency (ns)": 165208591, "Mean latency (ns)": 25872950, "Min duration satisfied": "Yes", "Min latency (ns)": 23325692, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 38.59, "QPS w/o loadgen overhead": 38.65, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 25.605844, "characteristics.90th_percentile_latency_ns": 25605844.0, "characteristics.90th_percentile_latency_s": 0.025605844, "characteristics.90th_percentile_latency_us": 25605.844, "characteristics.accuracy": 70.542, "characteristics.good": 35271, "characteristics.power": 0.18949786479819233, "characteristics.power.normalized_per_core": 0.0015791488733182695, "characteristics.power.normalized_per_processor": 0.18949786479819233, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-224-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-1.0-224-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_224_100.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 38.4615, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "3e27065f2e4afba9", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 7258242, "90.00 percentile latency (ns)": 7866320, "90th percentile latency (ns)": 7866320, "95.00 percentile latency (ns)": 8260962, "97.00 percentile latency (ns)": 10602765, "99.00 percentile latency (ns)": 22139822, "99.90 percentile latency (ns)": 117789005, "Max latency (ns)": 136487280, "Mean latency (ns)": 7851212, "Min duration satisfied": "Yes", "Min latency (ns)": 6617448, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 126.37, "QPS w/o loadgen overhead": 127.37, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 7.86632, "characteristics.90th_percentile_latency_ns": 7866320.0, "characteristics.90th_percentile_latency_s": 0.00786632, "characteristics.90th_percentile_latency_us": 7866.32, "characteristics.accuracy": 56.594, "characteristics.good": 28297, "characteristics.power": 0.056393628133704826, "characteristics.power.normalized_per_core": 0.0004699469011142069, "characteristics.power.normalized_per_processor": 0.056393628133704826, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-192-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.35-192-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_192_35.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 111.111, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "f468eb2f45ff418f", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 13587144, "90.00 percentile latency (ns)": 14392794, "90th percentile latency (ns)": 14392794, "95.00 percentile latency (ns)": 17830737, "97.00 percentile latency (ns)": 22235712, "99.00 percentile latency (ns)": 39318930, "99.90 percentile latency (ns)": 128975627, "Max latency (ns)": 163752265, "Mean latency (ns)": 14670262, "Min duration satisfied": "Yes", "Min latency (ns)": 12726887, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 67.99, "QPS w/o loadgen overhead": 68.17, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 14.392794, "characteristics.90th_percentile_latency_ns": 14392794.0, "characteristics.90th_percentile_latency_s": 0.014392794, "characteristics.90th_percentile_latency_us": 14392.794, "characteristics.accuracy": 67.82, "characteristics.good": 33910, "characteristics.power": 0.10643099222801893, "characteristics.power.normalized_per_core": 0.000886924935233491, "characteristics.power.normalized_per_processor": 0.10643099222801893, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-160-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-1.0-160-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_160_100.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 66.6667, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "2eb6f508c127425b", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 4743252, "90.00 percentile latency (ns)": 5373071, "90th percentile latency (ns)": 5373071, "95.00 percentile latency (ns)": 5660269, "97.00 percentile latency (ns)": 6284720, "99.00 percentile latency (ns)": 13852577, "99.90 percentile latency (ns)": 61487127, "Max latency (ns)": 82249947, "Mean latency (ns)": 5154507, "Min duration satisfied": "Yes", "Min latency (ns)": 4195226, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 192.2, "QPS w/o loadgen overhead": 194.0, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 5.373071, "characteristics.90th_percentile_latency_ns": 5373071.0, "characteristics.90th_percentile_latency_s": 0.005373071, "characteristics.90th_percentile_latency_us": 5373.071, "characteristics.accuracy": 44.116, "characteristics.good": 22058, "characteristics.power": 0.03535962913245717, "characteristics.power.normalized_per_core": 0.0002946635761038097, "characteristics.power.normalized_per_processor": 0.03535962913245717, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.25-128-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.25-128-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.25_128.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 200, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "0c0b540f14be497d", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 2929262, "90.00 percentile latency (ns)": 3529894, "90th percentile latency (ns)": 3529894, "95.00 percentile latency (ns)": 3756255, "97.00 percentile latency (ns)": 3926501, "99.00 percentile latency (ns)": 7906950, "99.90 percentile latency (ns)": 60054452, "Max latency (ns)": 113231978, "Mean latency (ns)": 3267606, "Min duration satisfied": "Yes", "Min latency (ns)": 2430200, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 302.15, "QPS w/o loadgen overhead": 306.03, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 3.529894, "characteristics.90th_percentile_latency_ns": 3529894.0, "characteristics.90th_percentile_latency_s": 0.003529894, "characteristics.90th_percentile_latency_us": 3529.894, "characteristics.accuracy": 45.494, "characteristics.good": 22747, "characteristics.power": 0.023578860970637328, "characteristics.power.normalized_per_core": 0.00019649050808864438, "characteristics.power.normalized_per_processor": 0.023578860970637328, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.25-160-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.25-160-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.25_160_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 250, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "fc07690fc45ce97b", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 53369721, "90.00 percentile latency (ns)": 62038220, "90th percentile latency (ns)": 62038220, "95.00 percentile latency (ns)": 69507677, "97.00 percentile latency (ns)": 74047876, "99.00 percentile latency (ns)": 127843216, "99.90 percentile latency (ns)": 146172466, "Max latency (ns)": 188733811, "Mean latency (ns)": 56337011, "Min duration satisfied": "Yes", "Min latency (ns)": 51446806, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 17.74, "QPS w/o loadgen overhead": 17.75, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 62.03822, "characteristics.90th_percentile_latency_ns": 62038220.0, "characteristics.90th_percentile_latency_s": 0.06203822, "characteristics.90th_percentile_latency_us": 62038.22, "characteristics.accuracy": 70.626, "characteristics.good": 35313, "characteristics.power": 0.3930650118736278, "characteristics.power.normalized_per_core": 0.003275541765613565, "characteristics.power.normalized_per_processor": 0.3930650118736278, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-1.0-192-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-1.0-192-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_1.0_192.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 17.8571, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "46c1ab90cb48852f", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 9132997, "90.00 percentile latency (ns)": 9970741, "90th percentile latency (ns)": 9970741, "95.00 percentile latency (ns)": 10807566, "97.00 percentile latency (ns)": 14134484, "99.00 percentile latency (ns)": 29819753, "99.90 percentile latency (ns)": 122209398, "Max latency (ns)": 145804861, "Mean latency (ns)": 9939874, "Min duration satisfied": "Yes", "Min latency (ns)": 8594025, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 100.12, "QPS w/o loadgen overhead": 100.6, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 9.970741, "characteristics.90th_percentile_latency_ns": 9970741.0, "characteristics.90th_percentile_latency_s": 0.009970741, "characteristics.90th_percentile_latency_us": 9970.741, "characteristics.accuracy": 63.454, "characteristics.good": 31727, "characteristics.power": 0.07192996474266115, "characteristics.power.normalized_per_core": 0.0005994163728555096, "characteristics.power.normalized_per_processor": 0.07192996474266115, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-128-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-1.0-128-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_128_100.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 90.9091, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "54064855af9a2053", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 21354059, "90.00 percentile latency (ns)": 22828359, "90th percentile latency (ns)": 22828359, "95.00 percentile latency (ns)": 29568653, "97.00 percentile latency (ns)": 35588204, "99.00 percentile latency (ns)": 48515621, "99.90 percentile latency (ns)": 104193507, "Max latency (ns)": 138614182, "Mean latency (ns)": 22802326, "Min duration satisfied": "Yes", "Min latency (ns)": 20445284, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 43.77, "QPS w/o loadgen overhead": 43.86, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 22.828359, "characteristics.90th_percentile_latency_ns": 22828359.0, "characteristics.90th_percentile_latency_s": 0.022828359, "characteristics.90th_percentile_latency_us": 22828.359, "characteristics.accuracy": 70.04, "characteristics.good": 35020, "characteristics.power": 0.1672839463861529, "characteristics.power.normalized_per_core": 0.0013940328865512741, "characteristics.power.normalized_per_processor": 0.1672839463861529, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-1.0-192-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-1.0-192-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_1.0_192_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 43.4783, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "2407f9dc86e41b66", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 64086092, "90.00 percentile latency (ns)": 76689744, "90th percentile latency (ns)": 76689744, "95.00 percentile latency (ns)": 85120458, "97.00 percentile latency (ns)": 86653321, "99.00 percentile latency (ns)": 90332165, "99.90 percentile latency (ns)": 185866436, "Max latency (ns)": 223747234, "Mean latency (ns)": 66580278, "Min duration satisfied": "Yes", "Min latency (ns)": 62847825, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 15.01, "QPS w/o loadgen overhead": 15.02, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 76.689744, "characteristics.90th_percentile_latency_ns": 76689744.0, "characteristics.90th_percentile_latency_s": 0.076689744, "characteristics.90th_percentile_latency_us": 76689.744, "characteristics.accuracy": 74.124, "characteristics.good": 37062, "characteristics.power": 0.4991164273472405, "characteristics.power.normalized_per_core": 0.004159303561227004, "characteristics.power.normalized_per_processor": 0.4991164273472405, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite2-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "efficientnet-lite2-quantized", "input_data_types": "uint8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite2.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 14.9254, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "8bb0762330c14a3b", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 5950737, "90.00 percentile latency (ns)": 6592612, "90th percentile latency (ns)": 6592612, "95.00 percentile latency (ns)": 6821533, "97.00 percentile latency (ns)": 8796007, "99.00 percentile latency (ns)": 20514546, "99.90 percentile latency (ns)": 66687941, "Max latency (ns)": 114782860, "Mean latency (ns)": 6500467, "Min duration satisfied": "Yes", "Min latency (ns)": 5345067, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 152.81, "QPS w/o loadgen overhead": 153.84, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 6.592612, "characteristics.90th_percentile_latency_ns": 6592612.0, "characteristics.90th_percentile_latency_s": 0.006592612, "characteristics.90th_percentile_latency_us": 6592.612, "characteristics.accuracy": 59.444, "characteristics.good": 29722, "characteristics.power": 0.04713712940724779, "characteristics.power.normalized_per_core": 0.0003928094117270649, "characteristics.power.normalized_per_processor": 0.04713712940724779, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.5-160-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.5-160-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.5_160_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 142.857, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "25a48089c9b135e2", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 7948122, "90.00 percentile latency (ns)": 8540090, "90th percentile latency (ns)": 8540090, "95.00 percentile latency (ns)": 9007118, "97.00 percentile latency (ns)": 12204989, "99.00 percentile latency (ns)": 28324605, "99.90 percentile latency (ns)": 71846772, "Max latency (ns)": 110721548, "Mean latency (ns)": 8620162, "Min duration satisfied": "Yes", "Min latency (ns)": 7315768, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 115.52, "QPS w/o loadgen overhead": 116.01, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 8.54009, "characteristics.90th_percentile_latency_ns": 8540090.0, "characteristics.90th_percentile_latency_s": 0.00854009, "characteristics.90th_percentile_latency_us": 8540.09, "characteristics.accuracy": 61.456, "characteristics.good": 30728, "characteristics.power": 0.062332929362880755, "characteristics.power.normalized_per_core": 0.0005194410780240062, "characteristics.power.normalized_per_processor": 0.062332929362880755, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.5-192-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.5-192-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.5_192_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 111.111, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "6667a748ee912a60", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 9326776, "90.00 percentile latency (ns)": 10030409, "90th percentile latency (ns)": 10030409, "95.00 percentile latency (ns)": 10898026, "97.00 percentile latency (ns)": 13847856, "99.00 percentile latency (ns)": 30398256, "99.90 percentile latency (ns)": 121367529, "Max latency (ns)": 207652511, "Mean latency (ns)": 10075047, "Min duration satisfied": "Yes", "Min latency (ns)": 8695978, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 98.7, "QPS w/o loadgen overhead": 99.26, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 10.030409, "characteristics.90th_percentile_latency_ns": 10030409.0, "characteristics.90th_percentile_latency_s": 0.010030409, "characteristics.90th_percentile_latency_us": 10030.409, "characteristics.accuracy": 58.528, "characteristics.good": 29264, "characteristics.power": 0.07223736862563526, "characteristics.power.normalized_per_core": 0.0006019780718802939, "characteristics.power.normalized_per_processor": 0.07223736862563526, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-224-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.35-224-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_224_35.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 90.9091, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "419bb82978ffc652", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 22602994, "90.00 percentile latency (ns)": 24193087, "90th percentile latency (ns)": 24193087, "95.00 percentile latency (ns)": 31625698, "97.00 percentile latency (ns)": 37766759, "99.00 percentile latency (ns)": 50554493, "99.90 percentile latency (ns)": 140755725, "Max latency (ns)": 160104617, "Mean latency (ns)": 24281553, "Min duration satisfied": "Yes", "Min latency (ns)": 21709733, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 41.08, "QPS w/o loadgen overhead": 41.18, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 24.193087, "characteristics.90th_percentile_latency_ns": 24193087.0, "characteristics.90th_percentile_latency_s": 0.024193087, "characteristics.90th_percentile_latency_us": 24193.087, "characteristics.accuracy": 66.036, "characteristics.good": 33018, "characteristics.power": 0.16333854278239698, "characteristics.power.normalized_per_core": 0.0013611545231866416, "characteristics.power.normalized_per_processor": 0.16333854278239698, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-128-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-1.0-128-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_1.0_128.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 43.4783, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "a881402392568502", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 97960768, "90.00 percentile latency (ns)": 115439688, "90th percentile latency (ns)": 115439688, "95.00 percentile latency (ns)": 118965386, "97.00 percentile latency (ns)": 121057450, "99.00 percentile latency (ns)": 128030163, "99.90 percentile latency (ns)": 242089420, "Max latency (ns)": 250956886, "Mean latency (ns)": 101354147, "Min duration satisfied": "Yes", "Min latency (ns)": 96379397, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 9.86, "QPS w/o loadgen overhead": 9.87, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 115.439688, "characteristics.90th_percentile_latency_ns": 115439688.0, "characteristics.90th_percentile_latency_s": 0.115439688, "characteristics.90th_percentile_latency_us": 115439.688, "characteristics.accuracy": 76.642, "characteristics.good": 38321, "characteristics.power": 0.7043324848336141, "characteristics.power.normalized_per_core": 0.005869437373613451, "characteristics.power.normalized_per_processor": 0.7043324848336141, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite1-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "efficientnet-lite1-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite1.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 10.101, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "77b88720ea94e8d5", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 18259725, "90.00 percentile latency (ns)": 19213259, "90th percentile latency (ns)": 19213259, "95.00 percentile latency (ns)": 24189772, "97.00 percentile latency (ns)": 30155406, "99.00 percentile latency (ns)": 44343796, "99.90 percentile latency (ns)": 139545153, "Max latency (ns)": 212642500, "Mean latency (ns)": 19651633, "Min duration satisfied": "Yes", "Min latency (ns)": 17592444, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 50.72, "QPS w/o loadgen overhead": 50.89, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 19.213259, "characteristics.90th_percentile_latency_ns": 19213259.0, "characteristics.90th_percentile_latency_s": 0.019213259, "characteristics.90th_percentile_latency_us": 19213.259, "characteristics.accuracy": 69.604, "characteristics.good": 34802, "characteristics.power": 0.1435184637487993, "characteristics.power.normalized_per_core": 0.001195987197906661, "characteristics.power.normalized_per_processor": 0.1435184637487993, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-192-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-1.0-192-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_192_100.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 52.6316, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "26c9ed64178351dc", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 45980817, "90.00 percentile latency (ns)": 52956286, "90th percentile latency (ns)": 52956286, "95.00 percentile latency (ns)": 61841836, "97.00 percentile latency (ns)": 67040577, "99.00 percentile latency (ns)": 118493914, "99.90 percentile latency (ns)": 135724867, "Max latency (ns)": 169987058, "Mean latency (ns)": 48658241, "Min duration satisfied": "Yes", "Min latency (ns)": 44826728, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 20.55, "QPS w/o loadgen overhead": 20.55, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 52.956286, "characteristics.90th_percentile_latency_ns": 52956286.0, "characteristics.90th_percentile_latency_s": 0.052956286, "characteristics.90th_percentile_latency_us": 52956.286, "characteristics.accuracy": 69.262, "characteristics.good": 34631, "characteristics.power": 0.3348259190758953, "characteristics.power.normalized_per_core": 0.002790215992299128, "characteristics.power.normalized_per_processor": 0.3348259190758953, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.75-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.75-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.75_224.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 20, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "f27dfc49a6800afa", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 19821783, "90.00 percentile latency (ns)": 20388364, "90th percentile latency (ns)": 20388364, "95.00 percentile latency (ns)": 26178361, "97.00 percentile latency (ns)": 32519657, "99.00 percentile latency (ns)": 45494375, "99.90 percentile latency (ns)": 138629103, "Max latency (ns)": 173660990, "Mean latency (ns)": 21226835, "Min duration satisfied": "Yes", "Min latency (ns)": 19057932, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 47.07, "QPS w/o loadgen overhead": 47.11, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 20.388364, "characteristics.90th_percentile_latency_ns": 20388364.0, "characteristics.90th_percentile_latency_s": 0.020388364, "characteristics.90th_percentile_latency_us": 20388.364, "characteristics.accuracy": 68.734, "characteristics.good": 34367, "characteristics.power": 0.15466304384002666, "characteristics.power.normalized_per_core": 0.0012888586986668888, "characteristics.power.normalized_per_processor": 0.15466304384002666, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-224-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.75-224-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_224_75.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 47.619, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "dfebb8af48579194", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 16347276, "90.00 percentile latency (ns)": 16836781, "90th percentile latency (ns)": 16836781, "95.00 percentile latency (ns)": 18620591, "97.00 percentile latency (ns)": 21462178, "99.00 percentile latency (ns)": 41224355, "99.90 percentile latency (ns)": 95788116, "Max latency (ns)": 111889290, "Mean latency (ns)": 17281828, "Min duration satisfied": "Yes", "Min latency (ns)": 15775379, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 57.79, "QPS w/o loadgen overhead": 57.86, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 16.836781, "characteristics.90th_percentile_latency_ns": 16836781.0, "characteristics.90th_percentile_latency_s": 0.016836781, "characteristics.90th_percentile_latency_us": 16836.781, "characteristics.accuracy": 63.33, "characteristics.good": 31665, "characteristics.power": 0.11011374268702233, "characteristics.power.normalized_per_core": 0.0009176145223918527, "characteristics.power.normalized_per_processor": 0.11011374268702233, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-small-minimalistic_224_1.0_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v3-small-minimalistic_224_1.0_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-small-minimalistic_224_1.0_float.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 58.8235, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "e1bfeba024d84b42", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 9394916, "90.00 percentile latency (ns)": 10055227, "90th percentile latency (ns)": 10055227, "95.00 percentile latency (ns)": 11281088, "97.00 percentile latency (ns)": 14857920, "99.00 percentile latency (ns)": 33912504, "99.90 percentile latency (ns)": 72943922, "Max latency (ns)": 98971866, "Mean latency (ns)": 10189164, "Min duration satisfied": "Yes", "Min latency (ns)": 8580731, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 97.81, "QPS w/o loadgen overhead": 98.14, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 10.055227, "characteristics.90th_percentile_latency_ns": 10055227.0, "characteristics.90th_percentile_latency_s": 0.010055227, "characteristics.90th_percentile_latency_us": 10055.227, "characteristics.accuracy": 57.918, "characteristics.good": 28959, "characteristics.power": 0.07066252238711854, "characteristics.power.normalized_per_core": 0.0005888543532259878, "characteristics.power.normalized_per_processor": 0.07066252238711854, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.5-128-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.5-128-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.5_128.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 100, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "3f1eda3a35496b89", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 67937619, "90.00 percentile latency (ns)": 78942707, "90th percentile latency (ns)": 78942707, "95.00 percentile latency (ns)": 86021029, "97.00 percentile latency (ns)": 93294868, "99.00 percentile latency (ns)": 147890276, "99.90 percentile latency (ns)": 167699131, "Max latency (ns)": 173680561, "Mean latency (ns)": 71510085, "Min duration satisfied": "Yes", "Min latency (ns)": 66088362, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 13.98, "QPS w/o loadgen overhead": 13.98, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 78.942707, "characteristics.90th_percentile_latency_ns": 78942707.0, "characteristics.90th_percentile_latency_s": 0.078942707, "characteristics.90th_percentile_latency_us": 78942.707, "characteristics.accuracy": 71.676, "characteristics.good": 35838, "characteristics.power": 0.5038913845889733, "characteristics.power.normalized_per_core": 0.004199094871574777, "characteristics.power.normalized_per_processor": 0.5038913845889733, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-1.0-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-1.0-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_1.0_224.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 14.0845, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "a486eb16903f7cec", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 3010062, "90.00 percentile latency (ns)": 3596198, "90th percentile latency (ns)": 3596198, "95.00 percentile latency (ns)": 3761915, "97.00 percentile latency (ns)": 3908357, "99.00 percentile latency (ns)": 7884633, "99.90 percentile latency (ns)": 54375709, "Max latency (ns)": 126305450, "Mean latency (ns)": 3331624, "Min duration satisfied": "Yes", "Min latency (ns)": 2460260, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 295.85, "QPS w/o loadgen overhead": 300.15, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 3.596198, "characteristics.90th_percentile_latency_ns": 3596198.0, "characteristics.90th_percentile_latency_s": 0.003596198, "characteristics.90th_percentile_latency_us": 3596.198, "characteristics.accuracy": 43.468, "characteristics.good": 21734, "characteristics.power": 0.023502287044405448, "characteristics.power.normalized_per_core": 0.00019585239203671206, "characteristics.power.normalized_per_processor": 0.023502287044405448, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-96-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.35-96-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_96_35.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 250, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "196accfb34cbf367", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 333924933, "90.00 percentile latency (ns)": 352801253, "90th percentile latency (ns)": 352801253, "95.00 percentile latency (ns)": 362539452, "97.00 percentile latency (ns)": 365196629, "99.00 percentile latency (ns)": 374068175, "99.90 percentile latency (ns)": 496080162, "Max latency (ns)": 505116722, "Mean latency (ns)": 341057531, "Min duration satisfied": "Yes", "Min latency (ns)": 328901548, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 2.93, "QPS w/o loadgen overhead": 2.93, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 352.801253, "characteristics.90th_percentile_latency_ns": 352801253.0, "characteristics.90th_percentile_latency_s": 0.352801253, "characteristics.90th_percentile_latency_us": 352801.253, "characteristics.accuracy": 80.676, "characteristics.good": 40338, "characteristics.power": 2.440523948083906, "characteristics.power.normalized_per_core": 0.02033769956736588, "characteristics.power.normalized_per_processor": 2.440523948083906, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite4-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "efficientnet-lite4-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite4.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 2.92398, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "586ad300f50124fd", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 18691472, "90.00 percentile latency (ns)": 19529162, "90th percentile latency (ns)": 19529162, "95.00 percentile latency (ns)": 24637301, "97.00 percentile latency (ns)": 30302573, "99.00 percentile latency (ns)": 43941439, "99.90 percentile latency (ns)": 126977153, "Max latency (ns)": 144543687, "Mean latency (ns)": 20039140, "Min duration satisfied": "Yes", "Min latency (ns)": 17962696, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 49.79, "QPS w/o loadgen overhead": 49.9, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 19.529162, "characteristics.90th_percentile_latency_ns": 19529162.0, "characteristics.90th_percentile_latency_s": 0.019529162, "characteristics.90th_percentile_latency_us": 19529.162, "characteristics.accuracy": 70.43, "characteristics.good": 35215, "characteristics.power": 0.14581885545419415, "characteristics.power.normalized_per_core": 0.0012151571287849514, "characteristics.power.normalized_per_processor": 0.14581885545419415, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-large-minimalistic_224_1.0_uint8", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v3-large-minimalistic_224_1.0_uint8", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-large-minimalistic_224_1.0_uint8.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 50, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "29e0a9668131b888", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 15124990, "90.00 percentile latency (ns)": 16032379, "90th percentile latency (ns)": 16032379, "95.00 percentile latency (ns)": 19827590, "97.00 percentile latency (ns)": 24885007, "99.00 percentile latency (ns)": 40224033, "99.90 percentile latency (ns)": 132115389, "Max latency (ns)": 149317204, "Mean latency (ns)": 16329790, "Min duration satisfied": "Yes", "Min latency (ns)": 14234105, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 61.09, "QPS w/o loadgen overhead": 61.24, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 16.032379, "characteristics.90th_percentile_latency_ns": 16032379.0, "characteristics.90th_percentile_latency_s": 0.016032379, "characteristics.90th_percentile_latency_us": 16032.379, "characteristics.accuracy": 67.474, "characteristics.good": 33737, "characteristics.power": 0.11843176411532354, "characteristics.power.normalized_per_core": 0.0009869313676276962, "characteristics.power.normalized_per_processor": 0.11843176411532354, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-192-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.75-192-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_192_75.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 62.5, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "ed0f6f64197a1e25", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 13639736, "90.00 percentile latency (ns)": 14444997, "90th percentile latency (ns)": 14444997, "95.00 percentile latency (ns)": 18159507, "97.00 percentile latency (ns)": 22849868, "99.00 percentile latency (ns)": 37835130, "99.90 percentile latency (ns)": 88483865, "Max latency (ns)": 133366342, "Mean latency (ns)": 14756086, "Min duration satisfied": "Yes", "Min latency (ns)": 12963288, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 67.61, "QPS w/o loadgen overhead": 67.77, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 14.444997, "characteristics.90th_percentile_latency_ns": 14444997.0, "characteristics.90th_percentile_latency_s": 0.014444997, "characteristics.90th_percentile_latency_us": 14444.997, "characteristics.accuracy": 67.24, "characteristics.good": 33620, "characteristics.power": 0.10839101369538845, "characteristics.power.normalized_per_core": 0.0009032584474615704, "characteristics.power.normalized_per_processor": 0.10839101369538845, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.75-192-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.75-192-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.75_192_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 66.6667, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "a6d776f446c847a0", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 25806272, "90.00 percentile latency (ns)": 27311020, "90th percentile latency (ns)": 27311020, "95.00 percentile latency (ns)": 33868249, "97.00 percentile latency (ns)": 41827418, "99.00 percentile latency (ns)": 77262259, "99.90 percentile latency (ns)": 101795999, "Max latency (ns)": 118290725, "Mean latency (ns)": 27398853, "Min duration satisfied": "Yes", "Min latency (ns)": 25105767, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 36.47, "QPS w/o loadgen overhead": 36.5, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 27.31102, "characteristics.90th_percentile_latency_ns": 27311020.0, "characteristics.90th_percentile_latency_s": 0.02731102, "characteristics.90th_percentile_latency_us": 27311.02, "characteristics.accuracy": 64.348, "characteristics.good": 32174, "characteristics.power": 0.1843145428152497, "characteristics.power.normalized_per_core": 0.001535954523460414, "characteristics.power.normalized_per_processor": 0.1843145428152497, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.5-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.5-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.5_224.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 35.7143, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "b82e5753c4892bb0", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 19053132, "90.00 percentile latency (ns)": 20049574, "90th percentile latency (ns)": 20049574, "95.00 percentile latency (ns)": 23356756, "97.00 percentile latency (ns)": 28000985, "99.00 percentile latency (ns)": 46920188, "99.90 percentile latency (ns)": 93180731, "Max latency (ns)": 112891740, "Mean latency (ns)": 20266661, "Min duration satisfied": "Yes", "Min latency (ns)": 18494481, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 49.28, "QPS w/o loadgen overhead": 49.34, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 20.049574, "characteristics.90th_percentile_latency_ns": 20049574.0, "characteristics.90th_percentile_latency_s": 0.020049574, "characteristics.90th_percentile_latency_us": 20049.574, "characteristics.accuracy": 63.246, "characteristics.good": 31623, "characteristics.power": 0.13709520311377585, "characteristics.power.normalized_per_core": 0.001142460025948132, "characteristics.power.normalized_per_processor": 0.13709520311377585, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.5-192-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.5-192-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.5_192.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 47.619, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "2841ac8b74dc59a7", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 14978895, "90.00 percentile latency (ns)": 15701303, "90th percentile latency (ns)": 15701303, "95.00 percentile latency (ns)": 18743257, "97.00 percentile latency (ns)": 21746505, "99.00 percentile latency (ns)": 39244511, "99.90 percentile latency (ns)": 130168525, "Max latency (ns)": 163110827, "Mean latency (ns)": 16062937, "Min duration satisfied": "Yes", "Min latency (ns)": 14658530, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 62.19, "QPS w/o loadgen overhead": 62.26, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 15.701303, "characteristics.90th_percentile_latency_ns": 15701303.0, "characteristics.90th_percentile_latency_s": 0.015701303, "characteristics.90th_percentile_latency_us": 15701.303, "characteristics.accuracy": 61.668, "characteristics.good": 30834, "characteristics.power": 0.1068006438365198, "characteristics.power.normalized_per_core": 0.0008900053653043316, "characteristics.power.normalized_per_processor": 0.1068006438365198, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-160-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.5-160-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.5_160.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 62.5, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "f914c0bb041b6ad9", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 26121054, "90.00 percentile latency (ns)": 28995621, "90th percentile latency (ns)": 28995621, "95.00 percentile latency (ns)": 35285101, "97.00 percentile latency (ns)": 41313167, "99.00 percentile latency (ns)": 83243512, "99.90 percentile latency (ns)": 102757433, "Max latency (ns)": 129375723, "Mean latency (ns)": 27798132, "Min duration satisfied": "Yes", "Min latency (ns)": 24852270, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 35.94, "QPS w/o loadgen overhead": 35.97, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 28.995621, "characteristics.90th_percentile_latency_ns": 28995621.0, "characteristics.90th_percentile_latency_s": 0.028995621, "characteristics.90th_percentile_latency_us": 28995.621, "characteristics.accuracy": 66.384, "characteristics.good": 33192, "characteristics.power": 0.1921003213287148, "characteristics.power.normalized_per_core": 0.0016008360110726233, "characteristics.power.normalized_per_processor": 0.1921003213287148, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.75-160-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.75-160-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.75_160.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 34.4828, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "780a2046e5c51337", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 3644033, "90.00 percentile latency (ns)": 4250890, "90th percentile latency (ns)": 4250890, "95.00 percentile latency (ns)": 4484292, "97.00 percentile latency (ns)": 4691639, "99.00 percentile latency (ns)": 9725181, "99.90 percentile latency (ns)": 80592131, "Max latency (ns)": 144056503, "Mean latency (ns)": 4030395, "Min duration satisfied": "Yes", "Min latency (ns)": 3073730, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 245.3, "QPS w/o loadgen overhead": 248.11, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 4.25089, "characteristics.90th_percentile_latency_ns": 4250890.0, "characteristics.90th_percentile_latency_s": 0.00425089, "characteristics.90th_percentile_latency_us": 4250.89, "characteristics.accuracy": 49.11, "characteristics.good": 24555, "characteristics.power": 0.02847242605094084, "characteristics.power.normalized_per_core": 0.00023727021709117366, "characteristics.power.normalized_per_processor": 0.02847242605094084, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-96-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.5-96-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_96_50.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 250, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "2e59ad4ac1aba789", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 7705480, "90.00 percentile latency (ns)": 8439592, "90th percentile latency (ns)": 8439592, "95.00 percentile latency (ns)": 8851510, "97.00 percentile latency (ns)": 11690486, "99.00 percentile latency (ns)": 23984859, "99.90 percentile latency (ns)": 119576659, "Max latency (ns)": 143654290, "Mean latency (ns)": 8361869, "Min duration satisfied": "Yes", "Min latency (ns)": 7137120, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 118.92, "QPS w/o loadgen overhead": 119.59, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 8.439592, "characteristics.90th_percentile_latency_ns": 8439592.0, "characteristics.90th_percentile_latency_s": 0.008439592, "characteristics.90th_percentile_latency_us": 8439.592, "characteristics.accuracy": 62.07, "characteristics.good": 31035, "characteristics.power": 0.059994954591321904, "characteristics.power.normalized_per_core": 0.0004999579549276825, "characteristics.power.normalized_per_processor": 0.059994954591321904, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-128-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.75-128-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_128_75.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 111.111, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "55d4b3f7c4d59ba6", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 15962593, "90.00 percentile latency (ns)": 16541048, "90th percentile latency (ns)": 16541048, "95.00 percentile latency (ns)": 21031589, "97.00 percentile latency (ns)": 25709727, "99.00 percentile latency (ns)": 41201123, "99.90 percentile latency (ns)": 131935496, "Max latency (ns)": 153152332, "Mean latency (ns)": 17171174, "Min duration satisfied": "Yes", "Min latency (ns)": 15072238, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 58.18, "QPS w/o loadgen overhead": 58.24, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 16.541048, "characteristics.90th_percentile_latency_ns": 16541048.0, "characteristics.90th_percentile_latency_s": 0.016541048, "characteristics.90th_percentile_latency_us": 16541.048, "characteristics.accuracy": 61.224, "characteristics.good": 30612, "characteristics.power": 0.11523717363666583, "characteristics.power.normalized_per_core": 0.0009603097803055486, "characteristics.power.normalized_per_processor": 0.11523717363666583, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-96-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-1.0-96-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_1.0_96.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 58.8235, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "8d4aa1a09894f701", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 2093582, "90.00 percentile latency (ns)": 2776067, "90th percentile latency (ns)": 2776067, "95.00 percentile latency (ns)": 2969504, "97.00 percentile latency (ns)": 3078039, "99.00 percentile latency (ns)": 5575948, "99.90 percentile latency (ns)": 55956867, "Max latency (ns)": 82219182, "Mean latency (ns)": 2414338, "Min duration satisfied": "Yes", "Min latency (ns)": 1633962, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 408.3, "QPS w/o loadgen overhead": 414.19, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 2.776067, "characteristics.90th_percentile_latency_ns": 2776067.0, "characteristics.90th_percentile_latency_s": 0.002776067, "characteristics.90th_percentile_latency_us": 2776.067, "characteristics.accuracy": 42.384, "characteristics.good": 21192, "characteristics.power": 0.017349537065383953, "characteristics.power.normalized_per_core": 0.00014457947554486627, "characteristics.power.normalized_per_processor": 0.017349537065383953, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.25-128-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.25-128-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.25_128_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 333.333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "128d178f4612b3ee", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 84459898, "90.00 percentile latency (ns)": 100162077, "90th percentile latency (ns)": 100162077, "95.00 percentile latency (ns)": 105328694, "97.00 percentile latency (ns)": 110138384, "99.00 percentile latency (ns)": 197134373, "99.90 percentile latency (ns)": 223498136, "Max latency (ns)": 254658903, "Mean latency (ns)": 89179746, "Min duration satisfied": "Yes", "Min latency (ns)": 82869505, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 11.21, "QPS w/o loadgen overhead": 11.21, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 100.162077, "characteristics.90th_percentile_latency_ns": 100162077.0, "characteristics.90th_percentile_latency_s": 0.100162077, "characteristics.90th_percentile_latency_us": 100162.077, "characteristics.accuracy": 75.012, "characteristics.good": 37506, "characteristics.power": 0.6094566190089696, "characteristics.power.normalized_per_core": 0.0050788051584080805, "characteristics.power.normalized_per_processor": 0.6094566190089696, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.3-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-1.3-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_1.3_224.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 11.6279, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "d15f70d00d641a38", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 10406777, "90.00 percentile latency (ns)": 11100370, "90th percentile latency (ns)": 11100370, "95.00 percentile latency (ns)": 12772587, "97.00 percentile latency (ns)": 15749132, "99.00 percentile latency (ns)": 34133582, "99.90 percentile latency (ns)": 88889609, "Max latency (ns)": 110195481, "Mean latency (ns)": 11231304, "Min duration satisfied": "Yes", "Min latency (ns)": 9789935, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 88.74, "QPS w/o loadgen overhead": 89.04, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 11.10037, "characteristics.90th_percentile_latency_ns": 11100370.0, "characteristics.90th_percentile_latency_s": 0.01110037, "characteristics.90th_percentile_latency_us": 11100.37, "characteristics.accuracy": 64.486, "characteristics.good": 32243, "characteristics.power": 0.0807723859405565, "characteristics.power.normalized_per_core": 0.0006731032161713041, "characteristics.power.normalized_per_processor": 0.0807723859405565, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-small_224_1.0_uint8", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v3-small_224_1.0_uint8", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-small_224_1.0_uint8.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 83.3333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "66f9530854e1ebbb", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 131125188, "90.00 percentile latency (ns)": 148971978, "90th percentile latency (ns)": 148971978, "95.00 percentile latency (ns)": 151729123, "97.00 percentile latency (ns)": 153474424, "99.00 percentile latency (ns)": 163857698, "99.90 percentile latency (ns)": 275278770, "Max latency (ns)": 284203765, "Mean latency (ns)": 135080356, "Min duration satisfied": "Yes", "Min latency (ns)": 128946990, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 7.4, "QPS w/o loadgen overhead": 7.4, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 148.971978, "characteristics.90th_percentile_latency_ns": 148971978.0, "characteristics.90th_percentile_latency_s": 0.148971978, "characteristics.90th_percentile_latency_us": 148971.978, "characteristics.accuracy": 77.542, "characteristics.good": 38771, "characteristics.power": 0.9463935567606939, "characteristics.power.normalized_per_core": 0.007886612973005783, "characteristics.power.normalized_per_processor": 0.9463935567606939, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite2-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "efficientnet-lite2-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite2.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 7.35294, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "b459c161425b98ac", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 4100408, "90.00 percentile latency (ns)": 4920391, "90th percentile latency (ns)": 4920391, "95.00 percentile latency (ns)": 5080646, "97.00 percentile latency (ns)": 5351955, "99.00 percentile latency (ns)": 13587624, "99.90 percentile latency (ns)": 63240987, "Max latency (ns)": 78657841, "Mean latency (ns)": 4597181, "Min duration satisfied": "Yes", "Min latency (ns)": 3661400, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 215.83, "QPS w/o loadgen overhead": 217.52, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 4.920391, "characteristics.90th_percentile_latency_ns": 4920391.0, "characteristics.90th_percentile_latency_s": 0.004920391, "characteristics.90th_percentile_latency_us": 4920.391, "characteristics.accuracy": 56.75, "characteristics.good": 28375, "characteristics.power": 0.033206692211107586, "characteristics.power.normalized_per_core": 0.00027672243509256324, "characteristics.power.normalized_per_processor": 0.033206692211107586, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.5-128-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.5-128-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.5_128_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 200, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "02fa14e6a7bb8b6a", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 5291918, "90.00 percentile latency (ns)": 5870461, "90th percentile latency (ns)": 5870461, "95.00 percentile latency (ns)": 6176436, "97.00 percentile latency (ns)": 6885749, "99.00 percentile latency (ns)": 15932064, "99.90 percentile latency (ns)": 111159743, "Max latency (ns)": 133241757, "Mean latency (ns)": 5791754, "Min duration satisfied": "Yes", "Min latency (ns)": 4776109, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 171.31, "QPS w/o loadgen overhead": 172.66, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 5.870461, "characteristics.90th_percentile_latency_ns": 5870461.0, "characteristics.90th_percentile_latency_s": 0.005870461, "characteristics.90th_percentile_latency_us": 5870.461, "characteristics.accuracy": 57.002, "characteristics.good": 28501, "characteristics.power": 0.04134804350787073, "characteristics.power.normalized_per_core": 0.0003445670292322561, "characteristics.power.normalized_per_processor": 0.04134804350787073, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-96-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.75-96-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_96_75.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 166.667, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "c9784b9c44d3391c", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 90896977, "90.00 percentile latency (ns)": 107361194, "90th percentile latency (ns)": 107361194, "95.00 percentile latency (ns)": 112701786, "97.00 percentile latency (ns)": 118876780, "99.00 percentile latency (ns)": 201223641, "99.90 percentile latency (ns)": 229153486, "Max latency (ns)": 291484542, "Mean latency (ns)": 95689643, "Min duration satisfied": "Yes", "Min latency (ns)": 88728968, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 10.45, "QPS w/o loadgen overhead": 10.45, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 107.361194, "characteristics.90th_percentile_latency_ns": 107361194.0, "characteristics.90th_percentile_latency_s": 0.107361194, "characteristics.90th_percentile_latency_us": 107361.194, "characteristics.accuracy": 75.69, "characteristics.good": 37845, "characteristics.power": 0.6611264783672633, "characteristics.power.normalized_per_core": 0.0055093873197271945, "characteristics.power.normalized_per_processor": 0.6611264783672633, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.4-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-1.4-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_1.4_224.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 10.6383, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "a73624a284aeb8d5", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 7068324, "90.00 percentile latency (ns)": 7958645, "90th percentile latency (ns)": 7958645, "95.00 percentile latency (ns)": 8328647, "97.00 percentile latency (ns)": 10416010, "99.00 percentile latency (ns)": 21582938, "99.90 percentile latency (ns)": 114972759, "Max latency (ns)": 171394386, "Mean latency (ns)": 7700767, "Min duration satisfied": "Yes", "Min latency (ns)": 6339989, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 128.91, "QPS w/o loadgen overhead": 129.86, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 7.958645, "characteristics.90th_percentile_latency_ns": 7958645.0, "characteristics.90th_percentile_latency_s": 0.007958645, "characteristics.90th_percentile_latency_us": 7958.645, "characteristics.accuracy": 52.446, "characteristics.good": 26223, "characteristics.power": 0.05235701467219018, "characteristics.power.normalized_per_core": 0.00043630845560158483, "characteristics.power.normalized_per_processor": 0.05235701467219018, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-96-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.5-96-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.5_96.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 125, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "40204d638b539a9f", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 40118151, "90.00 percentile latency (ns)": 45209373, "90th percentile latency (ns)": 45209373, "95.00 percentile latency (ns)": 54823567, "97.00 percentile latency (ns)": 61175261, "99.00 percentile latency (ns)": 102917821, "99.90 percentile latency (ns)": 155126058, "Max latency (ns)": 171295609, "Mean latency (ns)": 42598893, "Min duration satisfied": "Yes", "Min latency (ns)": 39543146, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 23.46, "QPS w/o loadgen overhead": 23.47, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 45.209373, "characteristics.90th_percentile_latency_ns": 45209373.0, "characteristics.90th_percentile_latency_s": 0.045209373, "characteristics.90th_percentile_latency_us": 45209.373, "characteristics.accuracy": 73.724, "characteristics.good": 36862, "characteristics.power": 0.2877986440254158, "characteristics.power.normalized_per_core": 0.0023983220335451316, "characteristics.power.normalized_per_processor": 0.2877986440254158, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-large_224_0.75_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v3-large_224_0.75_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-large_224_0.75_float.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 22.7273, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "34c82992d3395509", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 30436141, "90.00 percentile latency (ns)": 34996891, "90th percentile latency (ns)": 34996891, "95.00 percentile latency (ns)": 43130179, "97.00 percentile latency (ns)": 50724949, "99.00 percentile latency (ns)": 91188134, "99.90 percentile latency (ns)": 113467761, "Max latency (ns)": 132999034, "Mean latency (ns)": 32546484, "Min duration satisfied": "Yes", "Min latency (ns)": 29064859, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 30.7, "QPS w/o loadgen overhead": 30.73, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 34.996891, "characteristics.90th_percentile_latency_ns": 34996891.0, "characteristics.90th_percentile_latency_s": 0.034996891, "characteristics.90th_percentile_latency_us": 34996.891, "characteristics.accuracy": 66.604, "characteristics.good": 33302, "characteristics.power": 0.22143114655477641, "characteristics.power.normalized_per_core": 0.0018452595546231368, "characteristics.power.normalized_per_processor": 0.22143114655477641, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-1.0-128-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-1.0-128-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_1.0_128.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 30.303, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "0264548cb94b0e5b", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 40736893, "90.00 percentile latency (ns)": 48067765, "90th percentile latency (ns)": 48067765, "95.00 percentile latency (ns)": 55459939, "97.00 percentile latency (ns)": 61748216, "99.00 percentile latency (ns)": 109298935, "99.90 percentile latency (ns)": 128867988, "Max latency (ns)": 140470186, "Mean latency (ns)": 43306714, "Min duration satisfied": "Yes", "Min latency (ns)": 39201922, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 23.08, "QPS w/o loadgen overhead": 23.09, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 48.067765, "characteristics.90th_percentile_latency_ns": 48067765.0, "characteristics.90th_percentile_latency_s": 0.048067765, "characteristics.90th_percentile_latency_us": 48067.765, "characteristics.accuracy": 69.106, "characteristics.good": 34553, "characteristics.power": 0.30223580934882877, "characteristics.power.normalized_per_core": 0.002518631744573573, "characteristics.power.normalized_per_processor": 0.30223580934882877, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-1.0-160-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-1.0-160-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_1.0_160.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 23.2558, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "564d7993f4dc6fb5", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 11169553, "90.00 percentile latency (ns)": 11913943, "90th percentile latency (ns)": 11913943, "95.00 percentile latency (ns)": 14217550, "97.00 percentile latency (ns)": 17421370, "99.00 percentile latency (ns)": 33687538, "99.90 percentile latency (ns)": 125136697, "Max latency (ns)": 149942103, "Mean latency (ns)": 12081537, "Min duration satisfied": "Yes", "Min latency (ns)": 10390203, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 82.3, "QPS w/o loadgen overhead": 82.77, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 11.913943, "characteristics.90th_percentile_latency_ns": 11913943.0, "characteristics.90th_percentile_latency_s": 0.011913943, "characteristics.90th_percentile_latency_us": 11913.943, "characteristics.accuracy": 59.822, "characteristics.good": 29911, "characteristics.power": 0.08241370120238738, "characteristics.power.normalized_per_core": 0.0006867808433532282, "characteristics.power.normalized_per_processor": 0.08241370120238738, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-96-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.75-96-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.75_96.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 83.3333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "89845bda43a5a081", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 20171082, "90.00 percentile latency (ns)": 20831399, "90th percentile latency (ns)": 20831399, "95.00 percentile latency (ns)": 24433557, "97.00 percentile latency (ns)": 28657972, "99.00 percentile latency (ns)": 46377639, "99.90 percentile latency (ns)": 101352084, "Max latency (ns)": 121799189, "Mean latency (ns)": 21339308, "Min duration satisfied": "Yes", "Min latency (ns)": 19541284, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 46.81, "QPS w/o loadgen overhead": 46.86, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 20.831399, "characteristics.90th_percentile_latency_ns": 20831399.0, "characteristics.90th_percentile_latency_s": 0.020831399, "characteristics.90th_percentile_latency_us": 20831.399, "characteristics.accuracy": 68.336, "characteristics.good": 34168, "characteristics.power": 0.1392817083462421, "characteristics.power.normalized_per_core": 0.0011606809028853508, "characteristics.power.normalized_per_processor": 0.1392817083462421, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-small_224_1.0_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v3-small_224_1.0_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-small_224_1.0_float.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 45.4545, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "2bd3c35a01e93e4c", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 33786442, "90.00 percentile latency (ns)": 37775239, "90th percentile latency (ns)": 37775239, "95.00 percentile latency (ns)": 45162005, "97.00 percentile latency (ns)": 52736727, "99.00 percentile latency (ns)": 69749075, "99.90 percentile latency (ns)": 158692413, "Max latency (ns)": 171164330, "Mean latency (ns)": 36034103, "Min duration satisfied": "Yes", "Min latency (ns)": 33193956, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 27.72, "QPS w/o loadgen overhead": 27.75, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 37.775239, "characteristics.90th_percentile_latency_ns": 37775239.0, "characteristics.90th_percentile_latency_s": 0.037775239, "characteristics.90th_percentile_latency_us": 37775.239, "characteristics.accuracy": 68.834, "characteristics.good": 34417, "characteristics.power": 0.2406401902988929, "characteristics.power.normalized_per_core": 0.002005334919157441, "characteristics.power.normalized_per_processor": 0.2406401902988929, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-192-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.75-192-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.75_192.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 27.7778, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "b790597248028393", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 31243755, "90.00 percentile latency (ns)": 32632430, "90th percentile latency (ns)": 32632430, "95.00 percentile latency (ns)": 42858433, "97.00 percentile latency (ns)": 49656051, "99.00 percentile latency (ns)": 55656361, "99.90 percentile latency (ns)": 80012654, "Max latency (ns)": 165114395, "Mean latency (ns)": 32597453, "Min duration satisfied": "Yes", "Min latency (ns)": 30387938, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 30.65, "QPS w/o loadgen overhead": 30.68, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 32.63243, "characteristics.90th_percentile_latency_ns": 32632430.0, "characteristics.90th_percentile_latency_s": 0.03263243, "characteristics.90th_percentile_latency_us": 32632.43, "characteristics.accuracy": 71.19, "characteristics.good": 35595, "characteristics.power": 0.24335515749388503, "characteristics.power.normalized_per_core": 0.0020279596457823752, "characteristics.power.normalized_per_processor": 0.24335515749388503, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite0-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "efficientnet-lite0-quantized", "input_data_types": "uint8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite0.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 29.4118, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "441caf9cb9335e77", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 194885032, "90.00 percentile latency (ns)": 214691187, "90th percentile latency (ns)": 214691187, "95.00 percentile latency (ns)": 217338350, "97.00 percentile latency (ns)": 222163811, "99.00 percentile latency (ns)": 233445307, "99.90 percentile latency (ns)": 357887332, "Max latency (ns)": 375802409, "Mean latency (ns)": 200907135, "Min duration satisfied": "Yes", "Min latency (ns)": 192244108, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 4.98, "QPS w/o loadgen overhead": 4.98, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 214.691187, "characteristics.90th_percentile_latency_ns": 214691187.0, "characteristics.90th_percentile_latency_s": 0.214691187, "characteristics.90th_percentile_latency_us": 214691.187, "characteristics.accuracy": 79.268, "characteristics.good": 39634, "characteristics.power": 1.420326604860631, "characteristics.power.normalized_per_core": 0.011836055040505257, "characteristics.power.normalized_per_processor": 1.420326604860631, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite3-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "efficientnet-lite3-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite3.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 4.92611, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "330413f9c241d9d6", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 17558859, "90.00 percentile latency (ns)": 18065896, "90th percentile latency (ns)": 18065896, "95.00 percentile latency (ns)": 20276276, "97.00 percentile latency (ns)": 23839880, "99.00 percentile latency (ns)": 42612084, "99.90 percentile latency (ns)": 97010787, "Max latency (ns)": 125975401, "Mean latency (ns)": 18565486, "Min duration satisfied": "Yes", "Min latency (ns)": 16938003, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 53.8, "QPS w/o loadgen overhead": 53.86, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 18.065896, "characteristics.90th_percentile_latency_ns": 18065896.0, "characteristics.90th_percentile_latency_s": 0.018065896, "characteristics.90th_percentile_latency_us": 18065.896, "characteristics.accuracy": 66.216, "characteristics.good": 33108, "characteristics.power": 0.12051548493393745, "characteristics.power.normalized_per_core": 0.001004295707782812, "characteristics.power.normalized_per_processor": 0.12051548493393745, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-small_224_0.75_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v3-small_224_0.75_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-small_224_0.75_float.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 52.6316, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "4f77af783500636b", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 95705644, "90.00 percentile latency (ns)": 114004448, "90th percentile latency (ns)": 114004448, "95.00 percentile latency (ns)": 117178218, "97.00 percentile latency (ns)": 118700427, "99.00 percentile latency (ns)": 126629390, "99.90 percentile latency (ns)": 223167413, "Max latency (ns)": 259321589, "Mean latency (ns)": 99061728, "Min duration satisfied": "Yes", "Min latency (ns)": 94019889, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 10.09, "QPS w/o loadgen overhead": 10.09, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 114.004448, "characteristics.90th_percentile_latency_ns": 114004448.0, "characteristics.90th_percentile_latency_s": 0.114004448, "characteristics.90th_percentile_latency_us": 114004.448, "characteristics.accuracy": 76.344, "characteristics.good": 38172, "characteristics.power": 0.7444546829690445, "characteristics.power.normalized_per_core": 0.006203789024742038, "characteristics.power.normalized_per_processor": 0.7444546829690445, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite3-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "efficientnet-lite3-quantized", "input_data_types": "uint8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite3.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 9.90099, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "a14b114f54334b4b", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 5428940, "90.00 percentile latency (ns)": 5673163, "90th percentile latency (ns)": 5673163, "95.00 percentile latency (ns)": 5837948, "97.00 percentile latency (ns)": 7142195, "99.00 percentile latency (ns)": 14816343, "99.90 percentile latency (ns)": 106243970, "Max latency (ns)": 149225353, "Mean latency (ns)": 5806551, "Min duration satisfied": "Yes", "Min latency (ns)": 4994689, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 171.59, "QPS w/o loadgen overhead": 172.22, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 5.673163, "characteristics.90th_percentile_latency_ns": 5673163.0, "characteristics.90th_percentile_latency_s": 0.005673163, "characteristics.90th_percentile_latency_us": 5673.163, "characteristics.accuracy": 54.568, "characteristics.good": 27284, "characteristics.power": 0.04122763052583324, "characteristics.power.normalized_per_core": 0.000343563587715277, "characteristics.power.normalized_per_processor": 0.04122763052583324, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-160-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.35-160-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_160_35.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 166.667, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "4bc29ca167fd9275", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 9581250, "90.00 percentile latency (ns)": 9899724, "90th percentile latency (ns)": 9899724, "95.00 percentile latency (ns)": 10245564, "97.00 percentile latency (ns)": 11880315, "99.00 percentile latency (ns)": 32773540, "99.90 percentile latency (ns)": 71669844, "Max latency (ns)": 111685506, "Mean latency (ns)": 10215090, "Min duration satisfied": "Yes", "Min latency (ns)": 9221951, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 97.72, "QPS w/o loadgen overhead": 97.89, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 9.899724, "characteristics.90th_percentile_latency_ns": 9899724.0, "characteristics.90th_percentile_latency_s": 0.009899724, "characteristics.90th_percentile_latency_us": 9899.724, "characteristics.accuracy": 49.478, "characteristics.good": 24739, "characteristics.power": 0.06569297250978672, "characteristics.power.normalized_per_core": 0.0005474414375815559, "characteristics.power.normalized_per_processor": 0.06569297250978672, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.25-192-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.25-192-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.25_192.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 90.9091, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "0f6cec8469391dd9", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 18186561, "90.00 percentile latency (ns)": 19170551, "90th percentile latency (ns)": 19170551, "95.00 percentile latency (ns)": 25110560, "97.00 percentile latency (ns)": 30868884, "99.00 percentile latency (ns)": 44720947, "99.90 percentile latency (ns)": 95442005, "Max latency (ns)": 112225732, "Mean latency (ns)": 19555222, "Min duration satisfied": "Yes", "Min latency (ns)": 17473130, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 51.02, "QPS w/o loadgen overhead": 51.14, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 19.170551, "characteristics.90th_percentile_latency_ns": 19170551.0, "characteristics.90th_percentile_latency_s": 0.019170551, "characteristics.90th_percentile_latency_us": 19170.551, "characteristics.accuracy": 68.126, "characteristics.good": 34063, "characteristics.power": 0.14375752515680706, "characteristics.power.normalized_per_core": 0.0011979793763067256, "characteristics.power.normalized_per_processor": 0.14375752515680706, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.75-224-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.75-224-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.75_224_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 50, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "7e418d874510843f", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 49941974, "90.00 percentile latency (ns)": 58012647, "90th percentile latency (ns)": 58012647, "95.00 percentile latency (ns)": 68523288, "97.00 percentile latency (ns)": 72332722, "99.00 percentile latency (ns)": 126320661, "99.90 percentile latency (ns)": 172375466, "Max latency (ns)": 186073332, "Mean latency (ns)": 52911400, "Min duration satisfied": "Yes", "Min latency (ns)": 48680427, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 18.89, "QPS w/o loadgen overhead": 18.9, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 58.012647, "characteristics.90th_percentile_latency_ns": 58012647.0, "characteristics.90th_percentile_latency_s": 0.058012647, "characteristics.90th_percentile_latency_us": 58012.647, "characteristics.accuracy": 75.76, "characteristics.good": 37880, "characteristics.power": 0.3607060372038703, "characteristics.power.normalized_per_core": 0.0030058836433655856, "characteristics.power.normalized_per_processor": 0.3607060372038703, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-large_224_1.0_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v3-large_224_1.0_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-large_224_1.0_float.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 18.8679, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "baf4b0d905612f29", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 28360728, "90.00 percentile latency (ns)": 30144317, "90th percentile latency (ns)": 30144317, "95.00 percentile latency (ns)": 37085774, "97.00 percentile latency (ns)": 44859676, "99.00 percentile latency (ns)": 57423473, "99.90 percentile latency (ns)": 148850934, "Max latency (ns)": 221463461, "Mean latency (ns)": 30187741, "Min duration satisfied": "Yes", "Min latency (ns)": 27848811, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 33.08, "QPS w/o loadgen overhead": 33.13, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 30.144317, "characteristics.90th_percentile_latency_ns": 30144317.0, "characteristics.90th_percentile_latency_s": 0.030144317, "characteristics.90th_percentile_latency_us": 30144.317, "characteristics.accuracy": 65.75, "characteristics.good": 32875, "characteristics.power": 0.19526815024393746, "characteristics.power.normalized_per_core": 0.0016272345853661455, "characteristics.power.normalized_per_processor": 0.19526815024393746, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.5-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.5_224.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 33.3333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "c4226b3fb23c5d8b", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 10520224, "90.00 percentile latency (ns)": 11300137, "90th percentile latency (ns)": 11300137, "95.00 percentile latency (ns)": 14050039, "97.00 percentile latency (ns)": 16852219, "99.00 percentile latency (ns)": 34060704, "99.90 percentile latency (ns)": 78536010, "Max latency (ns)": 119194809, "Mean latency (ns)": 11438954, "Min duration satisfied": "Yes", "Min latency (ns)": 9978527, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 87.16, "QPS w/o loadgen overhead": 87.42, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 11.300137, "characteristics.90th_percentile_latency_ns": 11300137.0, "characteristics.90th_percentile_latency_s": 0.011300137, "characteristics.90th_percentile_latency_us": 11300.137, "characteristics.accuracy": 64.768, "characteristics.good": 32384, "characteristics.power": 0.08324192761278885, "characteristics.power.normalized_per_core": 0.0006936827301065738, "characteristics.power.normalized_per_processor": 0.08324192761278885, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-1.0-128-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-1.0-128-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_1.0_128_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 83.3333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "c4497caafb23f805", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 45667385, "90.00 percentile latency (ns)": 51733868, "90th percentile latency (ns)": 51733868, "95.00 percentile latency (ns)": 61864988, "97.00 percentile latency (ns)": 66155137, "99.00 percentile latency (ns)": 131656764, "99.90 percentile latency (ns)": 169670518, "Max latency (ns)": 217990263, "Mean latency (ns)": 48405601, "Min duration satisfied": "Yes", "Min latency (ns)": 44853281, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 20.65, "QPS w/o loadgen overhead": 20.66, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 51.733868, "characteristics.90th_percentile_latency_ns": 51733868.0, "characteristics.90th_percentile_latency_s": 0.051733868, "characteristics.90th_percentile_latency_us": 51733.868, "characteristics.accuracy": 70.122, "characteristics.good": 35061, "characteristics.power": 0.3215425935430974, "characteristics.power.normalized_per_core": 0.0026795216128591448, "characteristics.power.normalized_per_processor": 0.3215425935430974, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.75-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.75_224.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 20.8333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "047098ef37da311a", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 10200883, "90.00 percentile latency (ns)": 10921819, "90th percentile latency (ns)": 10921819, "95.00 percentile latency (ns)": 13293539, "97.00 percentile latency (ns)": 16741277, "99.00 percentile latency (ns)": 34202905, "99.90 percentile latency (ns)": 78824574, "Max latency (ns)": 121137809, "Mean latency (ns)": 11094742, "Min duration satisfied": "Yes", "Min latency (ns)": 9619988, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 89.88, "QPS w/o loadgen overhead": 90.13, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 10.921819, "characteristics.90th_percentile_latency_ns": 10921819.0, "characteristics.90th_percentile_latency_s": 0.010921819, "characteristics.90th_percentile_latency_us": 10921.819, "characteristics.accuracy": 64.08, "characteristics.good": 32040, "characteristics.power": 0.08080478811323247, "characteristics.power.normalized_per_core": 0.0006733732342769373, "characteristics.power.normalized_per_processor": 0.08080478811323247, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.75-160-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.75-160-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.75_160_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 83.3333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "598b4ca6a1968436", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 21072097, "90.00 percentile latency (ns)": 22084574, "90th percentile latency (ns)": 22084574, "95.00 percentile latency (ns)": 25829400, "97.00 percentile latency (ns)": 31140119, "99.00 percentile latency (ns)": 47024383, "99.90 percentile latency (ns)": 139799599, "Max latency (ns)": 227827422, "Mean latency (ns)": 22479101, "Min duration satisfied": "Yes", "Min latency (ns)": 20658736, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 44.45, "QPS w/o loadgen overhead": 44.49, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 22.084574, "characteristics.90th_percentile_latency_ns": 22084574.0, "characteristics.90th_percentile_latency_s": 0.022084574, "characteristics.90th_percentile_latency_us": 22084.574, "characteristics.accuracy": 64.282, "characteristics.good": 32141, "characteristics.power": 0.1466295934695991, "characteristics.power.normalized_per_core": 0.0012219132789133258, "characteristics.power.normalized_per_processor": 0.1466295934695991, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-192-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.5-192-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.5_192.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 45.4545, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "4959a135bdc8fadf", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 41081995, "90.00 percentile latency (ns)": 46306662, "90th percentile latency (ns)": 46306662, "95.00 percentile latency (ns)": 56187405, "97.00 percentile latency (ns)": 62860688, "99.00 percentile latency (ns)": 97326510, "99.90 percentile latency (ns)": 157926923, "Max latency (ns)": 170274715, "Mean latency (ns)": 43605545, "Min duration satisfied": "Yes", "Min latency (ns)": 40288440, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 22.92, "QPS w/o loadgen overhead": 22.93, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 46.306662, "characteristics.90th_percentile_latency_ns": 46306662.0, "characteristics.90th_percentile_latency_s": 0.046306662, "characteristics.90th_percentile_latency_us": 46306.662, "characteristics.accuracy": 72.678, "characteristics.good": 36339, "characteristics.power": 0.2929355730075611, "characteristics.power.normalized_per_core": 0.002441129775063009, "characteristics.power.normalized_per_processor": 0.2929355730075611, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-large-minimalistic_224_1.0_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v3-large-minimalistic_224_1.0_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-large-minimalistic_224_1.0_float.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 22.2222, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "31c88665c745acaf", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 11350324, "90.00 percentile latency (ns)": 11610320, "90th percentile latency (ns)": 11610320, "95.00 percentile latency (ns)": 14604887, "97.00 percentile latency (ns)": 17457191, "99.00 percentile latency (ns)": 34835139, "99.90 percentile latency (ns)": 116251904, "Max latency (ns)": 204371131, "Mean latency (ns)": 12144457, "Min duration satisfied": "Yes", "Min latency (ns)": 10668918, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 82.22, "QPS w/o loadgen overhead": 82.34, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 11.61032, "characteristics.90th_percentile_latency_ns": 11610320.0, "characteristics.90th_percentile_latency_s": 0.01161032, "characteristics.90th_percentile_latency_us": 11610.32, "characteristics.accuracy": 64.972, "characteristics.good": 32486, "characteristics.power": 0.08743571469689901, "characteristics.power.normalized_per_core": 0.0007286309558074917, "characteristics.power.normalized_per_processor": 0.08743571469689901, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-160-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.75-160-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_160_75.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 83.3333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "42efa1e133db65dc", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 57094427, "90.00 percentile latency (ns)": 67587200, "90th percentile latency (ns)": 67587200, "95.00 percentile latency (ns)": 76605658, "97.00 percentile latency (ns)": 80820738, "99.00 percentile latency (ns)": 163746088, "99.90 percentile latency (ns)": 187468321, "Max latency (ns)": 200837163, "Mean latency (ns)": 60624808, "Min duration satisfied": "Yes", "Min latency (ns)": 55835571, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 16.49, "QPS w/o loadgen overhead": 16.49, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 67.5872, "characteristics.90th_percentile_latency_ns": 67587200.0, "characteristics.90th_percentile_latency_s": 0.0675872, "characteristics.90th_percentile_latency_us": 67587.2, "characteristics.accuracy": 71.77, "characteristics.good": 35885, "characteristics.power": 0.4081923302403613, "characteristics.power.normalized_per_core": 0.0034016027520030107, "characteristics.power.normalized_per_processor": 0.4081923302403613, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-1.0-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_1.0_224.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 16.9492, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "aa4368851b67d01f", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 24660909, "90.00 percentile latency (ns)": 26152278, "90th percentile latency (ns)": 26152278, "95.00 percentile latency (ns)": 32759809, "97.00 percentile latency (ns)": 37767319, "99.00 percentile latency (ns)": 51168529, "99.90 percentile latency (ns)": 143532155, "Max latency (ns)": 185307314, "Mean latency (ns)": 26226806, "Min duration satisfied": "Yes", "Min latency (ns)": 23824070, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 38.11, "QPS w/o loadgen overhead": 38.13, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 26.152278, "characteristics.90th_percentile_latency_ns": 26152278.0, "characteristics.90th_percentile_latency_s": 0.026152278, "characteristics.90th_percentile_latency_us": 26152.278, "characteristics.accuracy": 66.75, "characteristics.good": 33375, "characteristics.power": 0.1758796849098767, "characteristics.power.normalized_per_core": 0.0014656640409156394, "characteristics.power.normalized_per_processor": 0.1758796849098767, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-160-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.75-160-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.75_160.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 38.4615, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "259bf824c4a629b9", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 5677428, "90.00 percentile latency (ns)": 6278508, "90th percentile latency (ns)": 6278508, "95.00 percentile latency (ns)": 6644666, "97.00 percentile latency (ns)": 7868139, "99.00 percentile latency (ns)": 17144968, "99.90 percentile latency (ns)": 97800628, "Max latency (ns)": 117593777, "Mean latency (ns)": 6176324, "Min duration satisfied": "Yes", "Min latency (ns)": 5162681, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 160.38, "QPS w/o loadgen overhead": 161.91, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 6.278508, "characteristics.90th_percentile_latency_ns": 6278508.0, "characteristics.90th_percentile_latency_s": 0.006278508, "characteristics.90th_percentile_latency_us": 6278.508, "characteristics.accuracy": 47.14, "characteristics.good": 23570, "characteristics.power": 0.04183891705169679, "characteristics.power.normalized_per_core": 0.0003486576420974732, "characteristics.power.normalized_per_processor": 0.04183891705169679, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-96-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.35-96-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.35_96.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 166.667, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "380dc944b1b75ebc", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 11985406, "90.00 percentile latency (ns)": 12619115, "90th percentile latency (ns)": 12619115, "95.00 percentile latency (ns)": 14531642, "97.00 percentile latency (ns)": 16826811, "99.00 percentile latency (ns)": 32102162, "99.90 percentile latency (ns)": 125998623, "Max latency (ns)": 177156942, "Mean latency (ns)": 12863058, "Min duration satisfied": "Yes", "Min latency (ns)": 11667723, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 77.65, "QPS w/o loadgen overhead": 77.74, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 12.619115, "characteristics.90th_percentile_latency_ns": 12619115.0, "characteristics.90th_percentile_latency_s": 0.012619115, "characteristics.90th_percentile_latency_us": 12619.115, "characteristics.accuracy": 56.988, "characteristics.good": 28494, "characteristics.power": 0.08366109788891272, "characteristics.power.normalized_per_core": 0.0006971758157409394, "characteristics.power.normalized_per_processor": 0.08366109788891272, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-160-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.35-160-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.35_160.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 76.9231, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "d1bda118c428397e", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 18806541, "90.00 percentile latency (ns)": 20017454, "90th percentile latency (ns)": 20017454, "95.00 percentile latency (ns)": 26017838, "97.00 percentile latency (ns)": 32689003, "99.00 percentile latency (ns)": 48446341, "99.90 percentile latency (ns)": 92389931, "Max latency (ns)": 105565960, "Mean latency (ns)": 20231230, "Min duration satisfied": "Yes", "Min latency (ns)": 17962506, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 49.29, "QPS w/o loadgen overhead": 49.43, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 20.017454, "characteristics.90th_percentile_latency_ns": 20017454.0, "characteristics.90th_percentile_latency_s": 0.020017454, "characteristics.90th_percentile_latency_us": 20017.454, "characteristics.accuracy": 63.716, "characteristics.good": 31858, "characteristics.power": 0.13787665141632122, "characteristics.power.normalized_per_core": 0.0011489720951360102, "characteristics.power.normalized_per_processor": 0.13787665141632122, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.75-128-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.75-128-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.75_128.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 47.619, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "7cfa741d39b836a7", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 5031137, "90.00 percentile latency (ns)": 5700043, "90th percentile latency (ns)": 5700043, "95.00 percentile latency (ns)": 6002672, "97.00 percentile latency (ns)": 6615469, "99.00 percentile latency (ns)": 14562004, "99.90 percentile latency (ns)": 104705529, "Max latency (ns)": 150546800, "Mean latency (ns)": 5511537, "Min duration satisfied": "Yes", "Min latency (ns)": 4500721, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 179.45, "QPS w/o loadgen overhead": 181.44, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 5.700043, "characteristics.90th_percentile_latency_ns": 5700043.0, "characteristics.90th_percentile_latency_s": 0.005700043, "characteristics.90th_percentile_latency_us": 5700.043, "characteristics.accuracy": 55.54, "characteristics.good": 27770, "characteristics.power": 0.039286052615448104, "characteristics.power.normalized_per_core": 0.00032738377179540086, "characteristics.power.normalized_per_processor": 0.039286052615448104, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-128-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.5-128-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_128_50.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 166.667, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "81373d3bb846549b", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 16936760, "90.00 percentile latency (ns)": 17751669, "90th percentile latency (ns)": 17751669, "95.00 percentile latency (ns)": 19628879, "97.00 percentile latency (ns)": 22673302, "99.00 percentile latency (ns)": 41517817, "99.90 percentile latency (ns)": 131144415, "Max latency (ns)": 156997688, "Mean latency (ns)": 17962880, "Min duration satisfied": "Yes", "Min latency (ns)": 16243423, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 55.57, "QPS w/o loadgen overhead": 55.67, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 17.751669, "characteristics.90th_percentile_latency_ns": 17751669.0, "characteristics.90th_percentile_latency_s": 0.017751669, "characteristics.90th_percentile_latency_us": 17751.669, "characteristics.accuracy": 59.322, "characteristics.good": 29661, "characteristics.power": 0.11544556569640772, "characteristics.power.normalized_per_core": 0.0009620463808033976, "characteristics.power.normalized_per_processor": 0.11544556569640772, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-192-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.35-192-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.35_192.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 58.8235, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "20a4522b30a00431", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 30763201, "90.00 percentile latency (ns)": 114446581, "90th percentile latency (ns)": 114446581, "95.00 percentile latency (ns)": 123667394, "97.00 percentile latency (ns)": 127334940, "99.00 percentile latency (ns)": 133064528, "99.90 percentile latency (ns)": 142796268, "Max latency (ns)": 149314034, "Mean latency (ns)": 48152423, "Min duration satisfied": "Yes", "Min latency (ns)": 29080283, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 20.74, "QPS w/o loadgen overhead": 20.77, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 114.446581, "characteristics.90th_percentile_latency_ns": 114446581.0, "characteristics.90th_percentile_latency_s": 0.114446581, "characteristics.90th_percentile_latency_us": 114446.581, "characteristics.accuracy": 68.242, "characteristics.good": 34121, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.75-192-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.75-192-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.75_192.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 18.5185, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "dfbefcbaeb8954a4", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 42127216, "90.00 percentile latency (ns)": 173981023, "90th percentile latency (ns)": 173981023, "95.00 percentile latency (ns)": 199796761, "97.00 percentile latency (ns)": 206145968, "99.00 percentile latency (ns)": 213969411, "99.90 percentile latency (ns)": 226714874, "Max latency (ns)": 238719068, "Mean latency (ns)": 67924614, "Min duration satisfied": "Yes", "Min latency (ns)": 37262506, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 14.71, "QPS w/o loadgen overhead": 14.72, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 173.981023, "characteristics.90th_percentile_latency_ns": 173981023.0, "characteristics.90th_percentile_latency_s": 0.173981023, "characteristics.90th_percentile_latency_us": 173981.023, "characteristics.accuracy": 70.738, "characteristics.good": 35369, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-192-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-1.0-192-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_1.0_192.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 14.2857, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "6eae8433c88efd6d", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 346502558, "90.00 percentile latency (ns)": 424471172, "90th percentile latency (ns)": 424471172, "95.00 percentile latency (ns)": 436307405, "97.00 percentile latency (ns)": 442650029, "99.00 percentile latency (ns)": 457533679, "99.90 percentile latency (ns)": 491218165, "Max latency (ns)": 509277804, "Mean latency (ns)": 321671767, "Min duration satisfied": "Yes", "Min latency (ns)": 177371225, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 3.11, "QPS w/o loadgen overhead": 3.11, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 424.471172, "characteristics.90th_percentile_latency_ns": 424471172.0, "characteristics.90th_percentile_latency_s": 0.424471172, "characteristics.90th_percentile_latency_us": 424471.172, "characteristics.accuracy": 78.514, "characteristics.good": 39257, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite4-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "efficientnet-lite4-quantized", "input_data_types": "uint8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite4.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 3.3557, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "3e60dff2d47c5839", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 13487226, "90.00 percentile latency (ns)": 22662759, "90th percentile latency (ns)": 22662759, "95.00 percentile latency (ns)": 45350185, "97.00 percentile latency (ns)": 94955439, "99.00 percentile latency (ns)": 167991168, "99.90 percentile latency (ns)": 190578391, "Max latency (ns)": 209101540, "Mean latency (ns)": 19805001, "Min duration satisfied": "Yes", "Min latency (ns)": 12924315, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 50.35, "QPS w/o loadgen overhead": 50.49, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 22.662759, "characteristics.90th_percentile_latency_ns": 22662759.0, "characteristics.90th_percentile_latency_s": 0.022662759, "characteristics.90th_percentile_latency_us": 22662.759, "characteristics.accuracy": 63.542, "characteristics.good": 31771, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-224-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.5-224-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_224_50.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 38.4615, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "ce64b6bc6d42a399", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 10245367, "90.00 percentile latency (ns)": 109642952, "90th percentile latency (ns)": 109642952, "95.00 percentile latency (ns)": 155122254, "97.00 percentile latency (ns)": 165128160, "99.00 percentile latency (ns)": 175027872, "99.90 percentile latency (ns)": 189830877, "Max latency (ns)": 207258244, "Mean latency (ns)": 30800342, "Min duration satisfied": "Yes", "Min latency (ns)": 8441996, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 32.42, "QPS w/o loadgen overhead": 32.47, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 109.642952, "characteristics.90th_percentile_latency_ns": 109642952.0, "characteristics.90th_percentile_latency_s": 0.109642952, "characteristics.90th_percentile_latency_us": 109642.952, "characteristics.accuracy": 52.172, "characteristics.good": 26086, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-128-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.35-128-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.35_128.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 38.4615, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "8a43329be594c7cd", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 18168184, "90.00 percentile latency (ns)": 165790062, "90th percentile latency (ns)": 165790062, "95.00 percentile latency (ns)": 175324384, "97.00 percentile latency (ns)": 179661044, "99.00 percentile latency (ns)": 187219857, "99.90 percentile latency (ns)": 200246211, "Max latency (ns)": 214645620, "Mean latency (ns)": 55267573, "Min duration satisfied": "Yes", "Min latency (ns)": 10581360, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 18.08, "QPS w/o loadgen overhead": 18.09, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 165.790062, "characteristics.90th_percentile_latency_ns": 165790062.0, "characteristics.90th_percentile_latency_s": 0.165790062, "characteristics.90th_percentile_latency_us": 165790.062, "characteristics.accuracy": 58.402, "characteristics.good": 29201, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-128-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.5-128-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.5_128.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 16.3934, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "890fd4bc9b5f3ee3", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 20934920, "90.00 percentile latency (ns)": 160555092, "90th percentile latency (ns)": 160555092, "95.00 percentile latency (ns)": 183010100, "97.00 percentile latency (ns)": 187815509, "99.00 percentile latency (ns)": 194947194, "99.90 percentile latency (ns)": 207713795, "Max latency (ns)": 217032535, "Mean latency (ns)": 48626198, "Min duration satisfied": "Yes", "Min latency (ns)": 19731778, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 20.55, "QPS w/o loadgen overhead": 20.57, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 160.555092, "characteristics.90th_percentile_latency_ns": 160555092.0, "characteristics.90th_percentile_latency_s": 0.160555092, "characteristics.90th_percentile_latency_us": 160555.092, "characteristics.accuracy": 60.976, "characteristics.good": 30488, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.35-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.35_224.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 15.873, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "282b6f52935fa2a9", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 4978728, "90.00 percentile latency (ns)": 5449470, "90th percentile latency (ns)": 5449470, "95.00 percentile latency (ns)": 6504422, "97.00 percentile latency (ns)": 9158598, "99.00 percentile latency (ns)": 62129678, "99.90 percentile latency (ns)": 98663527, "Max latency (ns)": 117833657, "Mean latency (ns)": 6111088, "Min duration satisfied": "Yes", "Min latency (ns)": 3911819, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 162.89, "QPS w/o loadgen overhead": 163.64, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 5.44947, "characteristics.90th_percentile_latency_ns": 5449470.0, "characteristics.90th_percentile_latency_s": 0.00544947, "characteristics.90th_percentile_latency_us": 5449.47, "characteristics.accuracy": 48.162, "characteristics.good": 24081, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.25-192-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.25-192-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.25_192_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 200, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "08398b21ff4d1dbb", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 75170822, "90.00 percentile latency (ns)": 173412730, "90th percentile latency (ns)": 173412730, "95.00 percentile latency (ns)": 201737889, "97.00 percentile latency (ns)": 208395711, "99.00 percentile latency (ns)": 216914774, "99.90 percentile latency (ns)": 232927248, "Max latency (ns)": 246852848, "Mean latency (ns)": 91646769, "Min duration satisfied": "Yes", "Min latency (ns)": 63542968, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 10.91, "QPS w/o loadgen overhead": 10.91, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 173.41273, "characteristics.90th_percentile_latency_ns": 173412730.0, "characteristics.90th_percentile_latency_s": 0.17341273, "characteristics.90th_percentile_latency_us": 173412.73, "characteristics.accuracy": 75.068, "characteristics.good": 37534, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite0-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "efficientnet-lite0-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite0.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 10.8696, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "e4ba3ec44917ff23", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 5547229, "90.00 percentile latency (ns)": 7076455, "90th percentile latency (ns)": 7076455, "95.00 percentile latency (ns)": 15760811, "97.00 percentile latency (ns)": 42230634, "99.00 percentile latency (ns)": 90812168, "99.90 percentile latency (ns)": 102818350, "Max latency (ns)": 122846429, "Mean latency (ns)": 8415294, "Min duration satisfied": "Yes", "Min latency (ns)": 5039733, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 118.12, "QPS w/o loadgen overhead": 118.83, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 7.076455, "characteristics.90th_percentile_latency_ns": 7076455.0, "characteristics.90th_percentile_latency_s": 0.007076455, "characteristics.90th_percentile_latency_us": 7076.455, "characteristics.accuracy": 50.242, "characteristics.good": 25121, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.25-224-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.25-224-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.25_224_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 142.857, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "6bd79408490aada2", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 21354090, "90.00 percentile latency (ns)": 104244588, "90th percentile latency (ns)": 104244588, "95.00 percentile latency (ns)": 107854282, "97.00 percentile latency (ns)": 109845490, "99.00 percentile latency (ns)": 113643298, "99.90 percentile latency (ns)": 121020413, "Max latency (ns)": 127683805, "Mean latency (ns)": 46115094, "Min duration satisfied": "Yes", "Min latency (ns)": 12918506, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 21.65, "QPS w/o loadgen overhead": 21.68, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 104.244588, "characteristics.90th_percentile_latency_ns": 104244588.0, "characteristics.90th_percentile_latency_s": 0.104244588, "characteristics.90th_percentile_latency_us": 104244.588, "characteristics.accuracy": 60.842, "characteristics.good": 30421, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.5-160-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.5-160-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.5_160.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 18.8679, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "92a655f4c5e4eee9", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 29894471, "90.00 percentile latency (ns)": 152025071, "90th percentile latency (ns)": 152025071, "95.00 percentile latency (ns)": 189338427, "97.00 percentile latency (ns)": 196632043, "99.00 percentile latency (ns)": 205507546, "99.90 percentile latency (ns)": 217165299, "Max latency (ns)": 230662255, "Mean latency (ns)": 54557913, "Min duration satisfied": "Yes", "Min latency (ns)": 28489104, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 18.31, "QPS w/o loadgen overhead": 18.33, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 152.025071, "characteristics.90th_percentile_latency_ns": 152025071.0, "characteristics.90th_percentile_latency_s": 0.152025071, "characteristics.90th_percentile_latency_us": 152025.071, "characteristics.accuracy": 69.016, "characteristics.good": 34508, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-160-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-1.0-160-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_1.0_160.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 20.4082, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "74a29a871f0a4cef", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 58578702, "90.00 percentile latency (ns)": 137455856, "90th percentile latency (ns)": 137455856, "95.00 percentile latency (ns)": 204457149, "97.00 percentile latency (ns)": 231053265, "99.00 percentile latency (ns)": 252404368, "99.90 percentile latency (ns)": 268565715, "Max latency (ns)": 281055103, "Mean latency (ns)": 76987388, "Min duration satisfied": "Yes", "Min latency (ns)": 53485611, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 12.99, "QPS w/o loadgen overhead": 12.99, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 137.455856, "characteristics.90th_percentile_latency_ns": 137455856.0, "characteristics.90th_percentile_latency_s": 0.137455856, "characteristics.90th_percentile_latency_us": 137455.856, "characteristics.accuracy": 74.098, "characteristics.good": 37049, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite1-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "efficientnet-lite1-quantized", "input_data_types": "uint8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite1.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 12.987, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "39fe245532491c9d", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 11471829, "90.00 percentile latency (ns)": 14024784, "90th percentile latency (ns)": 14024784, "95.00 percentile latency (ns)": 25236449, "97.00 percentile latency (ns)": 40427025, "99.00 percentile latency (ns)": 137162308, "99.90 percentile latency (ns)": 186633923, "Max latency (ns)": 206164996, "Mean latency (ns)": 14801132, "Min duration satisfied": "Yes", "Min latency (ns)": 10044996, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 67.37, "QPS w/o loadgen overhead": 67.56, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 14.024784, "characteristics.90th_percentile_latency_ns": 14024784.0, "characteristics.90th_percentile_latency_s": 0.014024784, "characteristics.90th_percentile_latency_us": 14024.784, "characteristics.accuracy": 61.924, "characteristics.good": 30962, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-192-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.5-192-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_192_50.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 66.6667, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "840ee8b5ac245b15", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 11032608, "90.00 percentile latency (ns)": 19939450, "90th percentile latency (ns)": 19939450, "95.00 percentile latency (ns)": 59852761, "97.00 percentile latency (ns)": 91688576, "99.00 percentile latency (ns)": 106028339, "99.90 percentile latency (ns)": 116041422, "Max latency (ns)": 125118776, "Mean latency (ns)": 16536215, "Min duration satisfied": "Yes", "Min latency (ns)": 10332614, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 60.26, "QPS w/o loadgen overhead": 60.47, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 19.93945, "characteristics.90th_percentile_latency_ns": 19939450.0, "characteristics.90th_percentile_latency_s": 0.01993945, "characteristics.90th_percentile_latency_us": 19939.45, "characteristics.accuracy": 62.298, "characteristics.good": 31149, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.5-224-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.5-224-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.5_224_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 62.5, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "9a848fc1aa6d0a04", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 5232501, "90.00 percentile latency (ns)": 5762459, "90th percentile latency (ns)": 5762459, "95.00 percentile latency (ns)": 7194251, "97.00 percentile latency (ns)": 8306668, "99.00 percentile latency (ns)": 37949630, "99.90 percentile latency (ns)": 163418483, "Max latency (ns)": 198244697, "Mean latency (ns)": 6411965, "Min duration satisfied": "Yes", "Min latency (ns)": 4496626, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 155.12, "QPS w/o loadgen overhead": 155.96, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 5.762459, "characteristics.90th_percentile_latency_ns": 5762459.0, "characteristics.90th_percentile_latency_s": 0.005762459, "characteristics.90th_percentile_latency_us": 5762.459, "characteristics.accuracy": 49.12, "characteristics.good": 24560, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-128-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.35-128-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_128_35.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 142.857, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "79e79739caf588f9", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 41458361, "90.00 percentile latency (ns)": 79052623, "90th percentile latency (ns)": 79052623, "95.00 percentile latency (ns)": 159048522, "97.00 percentile latency (ns)": 189535308, "99.00 percentile latency (ns)": 218413011, "99.90 percentile latency (ns)": 238339032, "Max latency (ns)": 247931861, "Mean latency (ns)": 55819472, "Min duration satisfied": "Yes", "Min latency (ns)": 39703533, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 17.9, "QPS w/o loadgen overhead": 17.91, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 79.052623, "characteristics.90th_percentile_latency_ns": 79052623.0, "characteristics.90th_percentile_latency_s": 0.079052623, "characteristics.90th_percentile_latency_us": 79052.623, "characteristics.accuracy": 73.584, "characteristics.good": 36792, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.4-224-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-1.4-224-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_224_140.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 18.1818, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "6e961d54884f6182", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 29576340, "90.00 percentile latency (ns)": 60099600, "90th percentile latency (ns)": 60099600, "95.00 percentile latency (ns)": 107319235, "97.00 percentile latency (ns)": 120360805, "99.00 percentile latency (ns)": 129164664, "99.90 percentile latency (ns)": 138505799, "Max latency (ns)": 147766787, "Mean latency (ns)": 38860040, "Min duration satisfied": "Yes", "Min latency (ns)": 28503990, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 25.69, "QPS w/o loadgen overhead": 25.73, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 60.0996, "characteristics.90th_percentile_latency_ns": 60099600.0, "characteristics.90th_percentile_latency_s": 0.0600996, "characteristics.90th_percentile_latency_us": 60099.6, "characteristics.accuracy": 70.772, "characteristics.good": 35386, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-1.0-224-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-1.0-224-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_1.0_224_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 24.3902, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "9a7b460a194b60a4", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 10146803, "90.00 percentile latency (ns)": 84282123, "90th percentile latency (ns)": 84282123, "95.00 percentile latency (ns)": 90882367, "97.00 percentile latency (ns)": 94233491, "99.00 percentile latency (ns)": 99388810, "99.90 percentile latency (ns)": 108333830, "Max latency (ns)": 118658591, "Mean latency (ns)": 27389143, "Min duration satisfied": "Yes", "Min latency (ns)": 6490766, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 36.42, "QPS w/o loadgen overhead": 36.51, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 84.282123, "characteristics.90th_percentile_latency_ns": 84282123.0, "characteristics.90th_percentile_latency_s": 0.084282123, "characteristics.90th_percentile_latency_us": 84282.123, "characteristics.accuracy": 47.808, "characteristics.good": 23904, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.25-160-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.25-160-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.25_160.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 37.037, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "8a6e92c04092494d", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 28018971, "90.00 percentile latency (ns)": 174878028, "90th percentile latency (ns)": 174878028, "95.00 percentile latency (ns)": 183326114, "97.00 percentile latency (ns)": 187289041, "99.00 percentile latency (ns)": 193774779, "99.90 percentile latency (ns)": 202575822, "Max latency (ns)": 211701953, "Mean latency (ns)": 64713813, "Min duration satisfied": "Yes", "Min latency (ns)": 16156007, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 15.45, "QPS w/o loadgen overhead": 15.45, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 174.878028, "characteristics.90th_percentile_latency_ns": 174878028.0, "characteristics.90th_percentile_latency_s": 0.174878028, "characteristics.90th_percentile_latency_us": 174878.028, "characteristics.accuracy": 64.038, "characteristics.good": 32019, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-128-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.75-128-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.75_128.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 12.5, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "0df0f594697a9e3c", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 13911616, "90.00 percentile latency (ns)": 92078234, "90th percentile latency (ns)": 92078234, "95.00 percentile latency (ns)": 97996148, "97.00 percentile latency (ns)": 100854522, "99.00 percentile latency (ns)": 106075310, "99.90 percentile latency (ns)": 115182054, "Max latency (ns)": 138363415, "Mean latency (ns)": 32087241, "Min duration satisfied": "Yes", "Min latency (ns)": 11596077, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 31.12, "QPS w/o loadgen overhead": 31.17, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 92.078234, "characteristics.90th_percentile_latency_ns": 92078234.0, "characteristics.90th_percentile_latency_s": 0.092078234, "characteristics.90th_percentile_latency_us": 92078.234, "characteristics.accuracy": 51.848, "characteristics.good": 25924, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.25-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.25-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.25_224.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 21.2766, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "5fc044ee962906db", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 8726757, "90.00 percentile latency (ns)": 10012693, "90th percentile latency (ns)": 10012693, "95.00 percentile latency (ns)": 12783850, "97.00 percentile latency (ns)": 24543995, "99.00 percentile latency (ns)": 92362757, "99.90 percentile latency (ns)": 175647980, "Max latency (ns)": 198068790, "Mean latency (ns)": 10834358, "Min duration satisfied": "Yes", "Min latency (ns)": 7548407, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 91.98, "QPS w/o loadgen overhead": 92.3, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 10.012693, "characteristics.90th_percentile_latency_ns": 10012693.0, "characteristics.90th_percentile_latency_s": 0.010012693, "characteristics.90th_percentile_latency_us": 10012.693, "characteristics.accuracy": 59.226, "characteristics.good": 29613, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-160-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.5-160-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_160_50.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 100, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "c8629ade48eba845", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 16724480, "90.00 percentile latency (ns)": 21916435, "90th percentile latency (ns)": 21916435, "95.00 percentile latency (ns)": 40067168, "97.00 percentile latency (ns)": 64680357, "99.00 percentile latency (ns)": 106111078, "99.90 percentile latency (ns)": 120064113, "Max latency (ns)": 129921283, "Mean latency (ns)": 20477601, "Min duration satisfied": "Yes", "Min latency (ns)": 15601850, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 48.73, "QPS w/o loadgen overhead": 48.83, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 21.916435, "characteristics.90th_percentile_latency_ns": 21916435.0, "characteristics.90th_percentile_latency_s": 0.021916435, "characteristics.90th_percentile_latency_us": 21916.435, "characteristics.accuracy": 68.248, "characteristics.good": 34124, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-1.0-160-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-1.0-160-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_1.0_160_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 47.619, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "8e8126053da005ca", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 7609864, "90.00 percentile latency (ns)": 8780318, "90th percentile latency (ns)": 8780318, "95.00 percentile latency (ns)": 10817319, "97.00 percentile latency (ns)": 20330877, "99.00 percentile latency (ns)": 59454596, "99.90 percentile latency (ns)": 173430501, "Max latency (ns)": 203213816, "Mean latency (ns)": 9482643, "Min duration satisfied": "Yes", "Min latency (ns)": 6854443, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 105.02, "QPS w/o loadgen overhead": 105.46, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 8.780318, "characteristics.90th_percentile_latency_ns": 8780318.0, "characteristics.90th_percentile_latency_s": 0.008780318, "characteristics.90th_percentile_latency_us": 8780.318, "characteristics.accuracy": 59.12, "characteristics.good": 29560, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-96-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-1.0-96-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_96_100.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 100, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "2d7167c211430388", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 7953172, "90.00 percentile latency (ns)": 9543919, "90th percentile latency (ns)": 9543919, "95.00 percentile latency (ns)": 12537004, "97.00 percentile latency (ns)": 25609537, "99.00 percentile latency (ns)": 79335043, "99.90 percentile latency (ns)": 105626994, "Max latency (ns)": 127819786, "Mean latency (ns)": 9946099, "Min duration satisfied": "Yes", "Min latency (ns)": 7124544, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 100.13, "QPS w/o loadgen overhead": 100.54, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 9.543919, "characteristics.90th_percentile_latency_ns": 9543919.0, "characteristics.90th_percentile_latency_s": 0.009543919, "characteristics.90th_percentile_latency_us": 9543.919, "characteristics.accuracy": 58.46, "characteristics.good": 29230, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.75-128-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.75-128-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.75_128_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 90.9091, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "dd36a384e4c9469e", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 28878146, "90.00 percentile latency (ns)": 43218781, "90th percentile latency (ns)": 43218781, "95.00 percentile latency (ns)": 56789712, "97.00 percentile latency (ns)": 83915530, "99.00 percentile latency (ns)": 174956463, "99.90 percentile latency (ns)": 202318243, "Max latency (ns)": 160739966122, "Mean latency (ns)": 46022134, "Min duration satisfied": "Yes", "Min latency (ns)": 27275443, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 21.72, "QPS w/o loadgen overhead": 21.73, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 43.218781, "characteristics.90th_percentile_latency_ns": 43218781.0, "characteristics.90th_percentile_latency_s": 0.043218781, "characteristics.90th_percentile_latency_us": 43218.781, "characteristics.accuracy": 72.91, "characteristics.good": 36455, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-large_224_1.0_uint8", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v3-large_224_1.0_uint8", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-large_224_1.0_uint8.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 27.027, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "59d35521f55a2c55", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 26462839, "90.00 percentile latency (ns)": 49678656, "90th percentile latency (ns)": 49678656, "95.00 percentile latency (ns)": 101690992, "97.00 percentile latency (ns)": 152968485, "99.00 percentile latency (ns)": 191794394, "99.90 percentile latency (ns)": 211942288, "Max latency (ns)": 228234846, "Mean latency (ns)": 36858679, "Min duration satisfied": "Yes", "Min latency (ns)": 25704804, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 27.09, "QPS w/o loadgen overhead": 27.13, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 49.678656, "characteristics.90th_percentile_latency_ns": 49678656.0, "characteristics.90th_percentile_latency_s": 0.049678656, "characteristics.90th_percentile_latency_us": 49678.656, "characteristics.accuracy": 70.542, "characteristics.good": 35271, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-224-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-1.0-224-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_224_100.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 25.641, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "224e6ab14d11fe2b", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 9191907, "90.00 percentile latency (ns)": 10390383, "90th percentile latency (ns)": 10390383, "95.00 percentile latency (ns)": 13079545, "97.00 percentile latency (ns)": 25384041, "99.00 percentile latency (ns)": 84731691, "99.90 percentile latency (ns)": 175553391, "Max latency (ns)": 204941029, "Mean latency (ns)": 11095756, "Min duration satisfied": "Yes", "Min latency (ns)": 7801815, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 89.86, "QPS w/o loadgen overhead": 90.12, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 10.390383, "characteristics.90th_percentile_latency_ns": 10390383.0, "characteristics.90th_percentile_latency_s": 0.010390383, "characteristics.90th_percentile_latency_us": 10390.383, "characteristics.accuracy": 56.594, "characteristics.good": 28297, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-192-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.35-192-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_192_35.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 83.3333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "94c53ba43018d9f2", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 16361052, "90.00 percentile latency (ns)": 21001183, "90th percentile latency (ns)": 21001183, "95.00 percentile latency (ns)": 38405818, "97.00 percentile latency (ns)": 62696870, "99.00 percentile latency (ns)": 155922213, "99.90 percentile latency (ns)": 196033192, "Max latency (ns)": 214988713, "Mean latency (ns)": 20832189, "Min duration satisfied": "Yes", "Min latency (ns)": 14747262, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 47.91, "QPS w/o loadgen overhead": 48.0, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 21.001183, "characteristics.90th_percentile_latency_ns": 21001183.0, "characteristics.90th_percentile_latency_s": 0.021001183, "characteristics.90th_percentile_latency_us": 21001.183, "characteristics.accuracy": 67.82, "characteristics.good": 33910, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-160-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-1.0-160-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_160_100.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 50, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "fb189f2ce4d91892", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 4947828, "90.00 percentile latency (ns)": 30516176, "90th percentile latency (ns)": 30516176, "95.00 percentile latency (ns)": 64529432, "97.00 percentile latency (ns)": 76901918, "99.00 percentile latency (ns)": 87061617, "99.90 percentile latency (ns)": 99310563, "Max latency (ns)": 117784155, "Mean latency (ns)": 12001121, "Min duration satisfied": "Yes", "Min latency (ns)": 4612120, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 82.99, "QPS w/o loadgen overhead": 83.33, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 30.516176, "characteristics.90th_percentile_latency_ns": 30516176.0, "characteristics.90th_percentile_latency_s": 0.030516176, "characteristics.90th_percentile_latency_us": 30516.176, "characteristics.accuracy": 44.116, "characteristics.good": 22058, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.25-128-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.25-128-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.25_128.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 66.6667, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "a900028a6ca4ee51", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 4009547, "90.00 percentile latency (ns)": 4341171, "90th percentile latency (ns)": 4341171, "95.00 percentile latency (ns)": 5397591, "97.00 percentile latency (ns)": 6144258, "99.00 percentile latency (ns)": 30616861, "99.90 percentile latency (ns)": 87587599, "Max latency (ns)": 106809644, "Mean latency (ns)": 4692802, "Min duration satisfied": "Yes", "Min latency (ns)": 3190546, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 211.72, "QPS w/o loadgen overhead": 213.09, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 4.341171, "characteristics.90th_percentile_latency_ns": 4341171.0, "characteristics.90th_percentile_latency_s": 0.004341171, "characteristics.90th_percentile_latency_us": 4341.171, "characteristics.accuracy": 45.494, "characteristics.good": 22747, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.25-160-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.25-160-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.25_160_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 200, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "b1515331b4264e1e", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 49632304, "90.00 percentile latency (ns)": 118952929, "90th percentile latency (ns)": 118952929, "95.00 percentile latency (ns)": 135847991, "97.00 percentile latency (ns)": 140272624, "99.00 percentile latency (ns)": 147364494, "99.90 percentile latency (ns)": 156995272, "Max latency (ns)": 183180558, "Mean latency (ns)": 62881535, "Min duration satisfied": "Yes", "Min latency (ns)": 44683289, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 15.89, "QPS w/o loadgen overhead": 15.9, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 118.952929, "characteristics.90th_percentile_latency_ns": 118952929.0, "characteristics.90th_percentile_latency_s": 0.118952929, "characteristics.90th_percentile_latency_us": 118952.929, "characteristics.accuracy": 70.626, "characteristics.good": 35313, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-1.0-192-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-1.0-192-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_1.0_192.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 15.625, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "46a58184009bc241", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 11156545, "90.00 percentile latency (ns)": 13505046, "90th percentile latency (ns)": 13505046, "95.00 percentile latency (ns)": 23485296, "97.00 percentile latency (ns)": 34850675, "99.00 percentile latency (ns)": 116066748, "99.90 percentile latency (ns)": 181382611, "Max latency (ns)": 208874787, "Mean latency (ns)": 14082801, "Min duration satisfied": "Yes", "Min latency (ns)": 10117629, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 70.81, "QPS w/o loadgen overhead": 71.01, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 13.505046, "characteristics.90th_percentile_latency_ns": 13505046.0, "characteristics.90th_percentile_latency_s": 0.013505046, "characteristics.90th_percentile_latency_us": 13505.046, "characteristics.accuracy": 63.454, "characteristics.good": 31727, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-128-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-1.0-128-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_128_100.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 66.6667, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "48484f2360ea1656", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 22752264, "90.00 percentile latency (ns)": 33643121, "90th percentile latency (ns)": 33643121, "95.00 percentile latency (ns)": 53766398, "97.00 percentile latency (ns)": 85254137, "99.00 percentile latency (ns)": 114690295, "99.90 percentile latency (ns)": 126756253, "Max latency (ns)": 136000570, "Mean latency (ns)": 27371532, "Min duration satisfied": "Yes", "Min latency (ns)": 21312368, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 36.48, "QPS w/o loadgen overhead": 36.53, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 33.643121, "characteristics.90th_percentile_latency_ns": 33643121.0, "characteristics.90th_percentile_latency_s": 0.033643121, "characteristics.90th_percentile_latency_us": 33643.121, "characteristics.accuracy": 70.04, "characteristics.good": 35020, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-1.0-192-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-1.0-192-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_1.0_192_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 37.037, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "e47e0a86d9603424", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 90416167, "90.00 percentile latency (ns)": 231711674, "90th percentile latency (ns)": 231711674, "95.00 percentile latency (ns)": 250833741, "97.00 percentile latency (ns)": 259360061, "99.00 percentile latency (ns)": 271404709, "99.90 percentile latency (ns)": 291127981, "Max latency (ns)": 300736761, "Mean latency (ns)": 126881152, "Min duration satisfied": "Yes", "Min latency (ns)": 71903148, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 7.88, "QPS w/o loadgen overhead": 7.88, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 231.711674, "characteristics.90th_percentile_latency_ns": 231711674.0, "characteristics.90th_percentile_latency_s": 0.231711674, "characteristics.90th_percentile_latency_us": 231711.674, "characteristics.accuracy": 74.124, "characteristics.good": 37062, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite2-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "efficientnet-lite2-quantized", "input_data_types": "uint8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite2.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 9.25926, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "3416ebe84bb9ffe8", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 6970839, "90.00 percentile latency (ns)": 8088215, "90th percentile latency (ns)": 8088215, "95.00 percentile latency (ns)": 9513299, "97.00 percentile latency (ns)": 20565140, "99.00 percentile latency (ns)": 74125394, "99.90 percentile latency (ns)": 102002326, "Max latency (ns)": 119584002, "Mean latency (ns)": 8611250, "Min duration satisfied": "Yes", "Min latency (ns)": 6090588, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 115.67, "QPS w/o loadgen overhead": 116.13, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 8.088215, "characteristics.90th_percentile_latency_ns": 8088215.0, "characteristics.90th_percentile_latency_s": 0.008088215, "characteristics.90th_percentile_latency_us": 8088.215, "characteristics.accuracy": 59.444, "characteristics.good": 29722, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.5-160-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.5-160-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.5_160_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 71.4286, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "ed420fad9377087c", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 8955641, "90.00 percentile latency (ns)": 10188527, "90th percentile latency (ns)": 10188527, "95.00 percentile latency (ns)": 14617782, "97.00 percentile latency (ns)": 29265301, "99.00 percentile latency (ns)": 86032251, "99.90 percentile latency (ns)": 107130499, "Max latency (ns)": 126045026, "Mean latency (ns)": 10929574, "Min duration satisfied": "Yes", "Min latency (ns)": 7845267, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 91.19, "QPS w/o loadgen overhead": 91.49, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 10.188527, "characteristics.90th_percentile_latency_ns": 10188527.0, "characteristics.90th_percentile_latency_s": 0.010188527, "characteristics.90th_percentile_latency_us": 10188.527, "characteristics.accuracy": 61.456, "characteristics.good": 30728, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.5-192-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.5-192-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.5_192_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 83.3333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "c4582af196ed7e04", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 10471997, "90.00 percentile latency (ns)": 14271455, "90th percentile latency (ns)": 14271455, "95.00 percentile latency (ns)": 26987981, "97.00 percentile latency (ns)": 47446276, "99.00 percentile latency (ns)": 151249767, "99.90 percentile latency (ns)": 185743703, "Max latency (ns)": 213258051, "Mean latency (ns)": 14820536, "Min duration satisfied": "Yes", "Min latency (ns)": 9934163, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 67.22, "QPS w/o loadgen overhead": 67.47, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 14.271455, "characteristics.90th_percentile_latency_ns": 14271455.0, "characteristics.90th_percentile_latency_s": 0.014271455, "characteristics.90th_percentile_latency_us": 14271.455, "characteristics.accuracy": 58.528, "characteristics.good": 29264, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-224-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.35-224-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_224_35.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 62.5, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "04a04624a751fd60", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 28615043, "90.00 percentile latency (ns)": 179620350, "90th percentile latency (ns)": 179620350, "95.00 percentile latency (ns)": 189009398, "97.00 percentile latency (ns)": 193102292, "99.00 percentile latency (ns)": 200601050, "99.90 percentile latency (ns)": 213657843, "Max latency (ns)": 221220459, "Mean latency (ns)": 65094858, "Min duration satisfied": "Yes", "Min latency (ns)": 19996934, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 15.35, "QPS w/o loadgen overhead": 15.36, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 179.62035, "characteristics.90th_percentile_latency_ns": 179620350.0, "characteristics.90th_percentile_latency_s": 0.17962035, "characteristics.90th_percentile_latency_us": 179620.35, "characteristics.accuracy": 66.036, "characteristics.good": 33018, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-128-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-1.0-128-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_1.0_128.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 15.1515, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "7438997afd73f68f", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 106589932, "90.00 percentile latency (ns)": 203312804, "90th percentile latency (ns)": 203312804, "95.00 percentile latency (ns)": 251745383, "97.00 percentile latency (ns)": 268920041, "99.00 percentile latency (ns)": 284618617, "99.90 percentile latency (ns)": 305475888, "Max latency (ns)": 324681961, "Mean latency (ns)": 124006273, "Min duration satisfied": "Yes", "Min latency (ns)": 92041550, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 8.06, "QPS w/o loadgen overhead": 8.06, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 203.312804, "characteristics.90th_percentile_latency_ns": 203312804.0, "characteristics.90th_percentile_latency_s": 0.203312804, "characteristics.90th_percentile_latency_us": 203312.804, "characteristics.accuracy": 76.642, "characteristics.good": 38321, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite1-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "efficientnet-lite1-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite1.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 7.69231, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "a08aa0ae2a74610b", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 21818130, "90.00 percentile latency (ns)": 33610496, "90th percentile latency (ns)": 33610496, "95.00 percentile latency (ns)": 58053034, "97.00 percentile latency (ns)": 108601529, "99.00 percentile latency (ns)": 178887184, "99.90 percentile latency (ns)": 203555712, "Max latency (ns)": 231779097, "Mean latency (ns)": 27950052, "Min duration satisfied": "Yes", "Min latency (ns)": 19566752, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 35.73, "QPS w/o loadgen overhead": 35.78, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 33.610496, "characteristics.90th_percentile_latency_ns": 33610496.0, "characteristics.90th_percentile_latency_s": 0.033610496, "characteristics.90th_percentile_latency_us": 33610.496, "characteristics.accuracy": 69.604, "characteristics.good": 34802, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-192-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-1.0-192-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_192_100.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 35.7143, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "5eca40c8bebb2e58", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 45189077, "90.00 percentile latency (ns)": 122187904, "90th percentile latency (ns)": 122187904, "95.00 percentile latency (ns)": 130905815, "97.00 percentile latency (ns)": 134444035, "99.00 percentile latency (ns)": 140527160, "99.90 percentile latency (ns)": 150289542, "Max latency (ns)": 160310028, "Mean latency (ns)": 60152709, "Min duration satisfied": "Yes", "Min latency (ns)": 39931789, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 16.61, "QPS w/o loadgen overhead": 16.62, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 122.187904, "characteristics.90th_percentile_latency_ns": 122187904.0, "characteristics.90th_percentile_latency_s": 0.122187904, "characteristics.90th_percentile_latency_us": 122187.904, "characteristics.accuracy": 69.262, "characteristics.good": 34631, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.75-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.75-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.75_224.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 16.129, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "df4162b4020398f5", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 21614571, "90.00 percentile latency (ns)": 40648506, "90th percentile latency (ns)": 40648506, "95.00 percentile latency (ns)": 84663372, "97.00 percentile latency (ns)": 137631588, "99.00 percentile latency (ns)": 184040921, "99.90 percentile latency (ns)": 202353444, "Max latency (ns)": 225901545, "Mean latency (ns)": 30785840, "Min duration satisfied": "Yes", "Min latency (ns)": 20811895, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 32.43, "QPS w/o loadgen overhead": 32.48, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 40.648506, "characteristics.90th_percentile_latency_ns": 40648506.0, "characteristics.90th_percentile_latency_s": 0.040648506, "characteristics.90th_percentile_latency_us": 40648.506, "characteristics.accuracy": 68.734, "characteristics.good": 34367, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-224-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.75-224-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_224_75.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 27.7778, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "2b945828572d2c90", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 43281321, "90.00 percentile latency (ns)": 127912213, "90th percentile latency (ns)": 127912213, "95.00 percentile latency (ns)": 131969344, "97.00 percentile latency (ns)": 134249616, "99.00 percentile latency (ns)": 139825670, "99.90 percentile latency (ns)": 150726574, "Max latency (ns)": 157960418, "Mean latency (ns)": 62163370, "Min duration satisfied": "Yes", "Min latency (ns)": 15469162, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 16.08, "QPS w/o loadgen overhead": 16.09, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 127.912213, "characteristics.90th_percentile_latency_ns": 127912213.0, "characteristics.90th_percentile_latency_s": 0.127912213, "characteristics.90th_percentile_latency_us": 127912.213, "characteristics.accuracy": 63.33, "characteristics.good": 31665, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-small-minimalistic_224_1.0_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v3-small-minimalistic_224_1.0_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-small-minimalistic_224_1.0_float.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 15.1515, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "55ed4ec39bc29110", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 10282142, "90.00 percentile latency (ns)": 90233335, "90th percentile latency (ns)": 90233335, "95.00 percentile latency (ns)": 97159009, "97.00 percentile latency (ns)": 99925154, "99.00 percentile latency (ns)": 104573156, "99.90 percentile latency (ns)": 111926093, "Max latency (ns)": 122452358, "Mean latency (ns)": 27068846, "Min duration satisfied": "Yes", "Min latency (ns)": 8785888, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 36.84, "QPS w/o loadgen overhead": 36.94, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 90.233335, "characteristics.90th_percentile_latency_ns": 90233335.0, "characteristics.90th_percentile_latency_s": 0.090233335, "characteristics.90th_percentile_latency_us": 90233.335, "characteristics.accuracy": 57.918, "characteristics.good": 28959, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.5-128-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.5-128-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.5_128.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 40, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "9ff42e2a1c60f808", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 67743731, "90.00 percentile latency (ns)": 122530897, "90th percentile latency (ns)": 122530897, "95.00 percentile latency (ns)": 143257613, "97.00 percentile latency (ns)": 148491169, "99.00 percentile latency (ns)": 156266209, "99.90 percentile latency (ns)": 168553925, "Max latency (ns)": 176712140, "Mean latency (ns)": 76491142, "Min duration satisfied": "Yes", "Min latency (ns)": 58807686, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 13.07, "QPS w/o loadgen overhead": 13.07, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 122.530897, "characteristics.90th_percentile_latency_ns": 122530897.0, "characteristics.90th_percentile_latency_s": 0.122530897, "characteristics.90th_percentile_latency_us": 122530.897, "characteristics.accuracy": 71.676, "characteristics.good": 35838, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-1.0-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-1.0-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_1.0_224.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 12.987, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "f87f9148429d1c65", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 3745872, "90.00 percentile latency (ns)": 4090914, "90th percentile latency (ns)": 4090914, "95.00 percentile latency (ns)": 4971455, "97.00 percentile latency (ns)": 5926953, "99.00 percentile latency (ns)": 23751563, "99.90 percentile latency (ns)": 120678713, "Max latency (ns)": 178539681, "Mean latency (ns)": 4456605, "Min duration satisfied": "Yes", "Min latency (ns)": 3191414, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 222.63, "QPS w/o loadgen overhead": 224.39, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 4.090914, "characteristics.90th_percentile_latency_ns": 4090914.0, "characteristics.90th_percentile_latency_s": 0.004090914, "characteristics.90th_percentile_latency_us": 4090.914, "characteristics.accuracy": 43.468, "characteristics.good": 21734, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-96-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.35-96-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_96_35.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 166.667, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "4f451bb856fc2808", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 503220677, "90.00 percentile latency (ns)": 554081097, "90th percentile latency (ns)": 554081097, "95.00 percentile latency (ns)": 564939845, "97.00 percentile latency (ns)": 570244085, "99.00 percentile latency (ns)": 581902871, "99.90 percentile latency (ns)": 593908142, "Max latency (ns)": 600536536, "Mean latency (ns)": 497972933, "Min duration satisfied": "Yes", "Min latency (ns)": 318925265, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 2.01, "QPS w/o loadgen overhead": 2.01, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 554.081097, "characteristics.90th_percentile_latency_ns": 554081097.0, "characteristics.90th_percentile_latency_s": 0.554081097, "characteristics.90th_percentile_latency_us": 554081.097, "characteristics.accuracy": 80.676, "characteristics.good": 40338, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite4-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "efficientnet-lite4-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite4.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 2.04082, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "02880a45438743e0", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 20270503, "90.00 percentile latency (ns)": 42403287, "90th percentile latency (ns)": 42403287, "95.00 percentile latency (ns)": 107251446, "97.00 percentile latency (ns)": 151866323, "99.00 percentile latency (ns)": 177106781, "99.90 percentile latency (ns)": 190038715, "Max latency (ns)": 202797795, "Mean latency (ns)": 30389721, "Min duration satisfied": "Yes", "Min latency (ns)": 19264839, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 32.85, "QPS w/o loadgen overhead": 32.91, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 42.403287, "characteristics.90th_percentile_latency_ns": 42403287.0, "characteristics.90th_percentile_latency_s": 0.042403287, "characteristics.90th_percentile_latency_us": 42403.287, "characteristics.accuracy": 70.43, "characteristics.good": 35215, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-large-minimalistic_224_1.0_uint8", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v3-large-minimalistic_224_1.0_uint8", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-large-minimalistic_224_1.0_uint8.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 31.25, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "8c46074e05abed5c", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 17485440, "90.00 percentile latency (ns)": 23685421, "90th percentile latency (ns)": 23685421, "95.00 percentile latency (ns)": 42668252, "97.00 percentile latency (ns)": 74788779, "99.00 percentile latency (ns)": 166965010, "99.90 percentile latency (ns)": 198888353, "Max latency (ns)": 226422449, "Mean latency (ns)": 22438926, "Min duration satisfied": "Yes", "Min latency (ns)": 15654939, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 44.48, "QPS w/o loadgen overhead": 44.57, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 23.685421, "characteristics.90th_percentile_latency_ns": 23685421.0, "characteristics.90th_percentile_latency_s": 0.023685421, "characteristics.90th_percentile_latency_us": 23685.421, "characteristics.accuracy": 67.474, "characteristics.good": 33737, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-192-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.75-192-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_192_75.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 40, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "092443a9592500cb", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 14686292, "90.00 percentile latency (ns)": 19512204, "90th percentile latency (ns)": 19512204, "95.00 percentile latency (ns)": 39265919, "97.00 percentile latency (ns)": 72863289, "99.00 percentile latency (ns)": 106072431, "99.90 percentile latency (ns)": 120435576, "Max latency (ns)": 136243646, "Mean latency (ns)": 18624130, "Min duration satisfied": "Yes", "Min latency (ns)": 13508544, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 53.57, "QPS w/o loadgen overhead": 53.69, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 19.512204, "characteristics.90th_percentile_latency_ns": 19512204.0, "characteristics.90th_percentile_latency_s": 0.019512204, "characteristics.90th_percentile_latency_us": 19512.204, "characteristics.accuracy": 67.24, "characteristics.good": 33620, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.75-192-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.75-192-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.75_192_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 55.5556, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "f4544906e7907b2a", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 35300165, "90.00 percentile latency (ns)": 115702354, "90th percentile latency (ns)": 115702354, "95.00 percentile latency (ns)": 119589031, "97.00 percentile latency (ns)": 122172321, "99.00 percentile latency (ns)": 126745348, "99.90 percentile latency (ns)": 134645929, "Max latency (ns)": 141075289, "Mean latency (ns)": 56934882, "Min duration satisfied": "Yes", "Min latency (ns)": 23172888, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 17.54, "QPS w/o loadgen overhead": 17.56, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 115.702354, "characteristics.90th_percentile_latency_ns": 115702354.0, "characteristics.90th_percentile_latency_s": 0.115702354, "characteristics.90th_percentile_latency_us": 115702.354, "characteristics.accuracy": 64.348, "characteristics.good": 32174, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.5-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.5-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.5_224.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 12.6582, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "12ff9bd41ec93719", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 36138644, "90.00 percentile latency (ns)": 110737599, "90th percentile latency (ns)": 110737599, "95.00 percentile latency (ns)": 114342512, "97.00 percentile latency (ns)": 116566262, "99.00 percentile latency (ns)": 121046175, "99.90 percentile latency (ns)": 126537171, "Max latency (ns)": 132045668, "Mean latency (ns)": 55469790, "Min duration satisfied": "Yes", "Min latency (ns)": 17048489, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 18.0, "QPS w/o loadgen overhead": 18.03, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 110.737599, "characteristics.90th_percentile_latency_ns": 110737599.0, "characteristics.90th_percentile_latency_s": 0.110737599, "characteristics.90th_percentile_latency_us": 110737.599, "characteristics.accuracy": 63.246, "characteristics.good": 31623, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.5-192-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.5-192-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.5_192.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 16.9492, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "dbf4fe0ae43a3cf2", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 20549698, "90.00 percentile latency (ns)": 169187225, "90th percentile latency (ns)": 169187225, "95.00 percentile latency (ns)": 179325087, "97.00 percentile latency (ns)": 184369585, "99.00 percentile latency (ns)": 191780568, "99.90 percentile latency (ns)": 205226531, "Max latency (ns)": 220824785, "Mean latency (ns)": 57280459, "Min duration satisfied": "Yes", "Min latency (ns)": 14240071, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 17.44, "QPS w/o loadgen overhead": 17.46, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 169.187225, "characteristics.90th_percentile_latency_ns": 169187225.0, "characteristics.90th_percentile_latency_s": 0.169187225, "characteristics.90th_percentile_latency_us": 169187.225, "characteristics.accuracy": 61.668, "characteristics.good": 30834, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-160-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.5-160-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.5_160.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 14.9254, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "6272d435293cdc6e", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 27665774, "90.00 percentile latency (ns)": 113300778, "90th percentile latency (ns)": 113300778, "95.00 percentile latency (ns)": 117596512, "97.00 percentile latency (ns)": 120170384, "99.00 percentile latency (ns)": 124628798, "99.90 percentile latency (ns)": 132271001, "Max latency (ns)": 139730455, "Mean latency (ns)": 49407957, "Min duration satisfied": "Yes", "Min latency (ns)": 22991778, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 20.21, "QPS w/o loadgen overhead": 20.24, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 113.300778, "characteristics.90th_percentile_latency_ns": 113300778.0, "characteristics.90th_percentile_latency_s": 0.113300778, "characteristics.90th_percentile_latency_us": 113300.778, "characteristics.accuracy": 66.384, "characteristics.good": 33192, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.75-160-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.75-160-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.75_160.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 21.2766, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "7b5c749479aaf4c9", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 4635157, "90.00 percentile latency (ns)": 5126905, "90th percentile latency (ns)": 5126905, "95.00 percentile latency (ns)": 6362987, "97.00 percentile latency (ns)": 7819274, "99.00 percentile latency (ns)": 32775392, "99.90 percentile latency (ns)": 148147406, "Max latency (ns)": 181068610, "Mean latency (ns)": 5721086, "Min duration satisfied": "Yes", "Min latency (ns)": 4075741, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 173.72, "QPS w/o loadgen overhead": 174.79, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 5.126905, "characteristics.90th_percentile_latency_ns": 5126905.0, "characteristics.90th_percentile_latency_s": 0.005126905, "characteristics.90th_percentile_latency_us": 5126.905, "characteristics.accuracy": 49.11, "characteristics.good": 24555, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-96-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.5-96-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_96_50.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 166.667, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "43fb8754568fdbfd", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 9379979, "90.00 percentile latency (ns)": 10810885, "90th percentile latency (ns)": 10810885, "95.00 percentile latency (ns)": 16302379, "97.00 percentile latency (ns)": 29543437, "99.00 percentile latency (ns)": 105018102, "99.90 percentile latency (ns)": 179386278, "Max latency (ns)": 213687008, "Mean latency (ns)": 11901342, "Min duration satisfied": "Yes", "Min latency (ns)": 8385109, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 83.74, "QPS w/o loadgen overhead": 84.02, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 10.810885, "characteristics.90th_percentile_latency_ns": 10810885.0, "characteristics.90th_percentile_latency_s": 0.010810885, "characteristics.90th_percentile_latency_us": 10810.885, "characteristics.accuracy": 62.07, "characteristics.good": 31035, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-128-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.75-128-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_128_75.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 83.3333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "0702459e930a1e8f", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 22627786, "90.00 percentile latency (ns)": 168853453, "90th percentile latency (ns)": 168853453, "95.00 percentile latency (ns)": 178868239, "97.00 percentile latency (ns)": 182668829, "99.00 percentile latency (ns)": 188494870, "99.90 percentile latency (ns)": 197519533, "Max latency (ns)": 203509281, "Mean latency (ns)": 56647477, "Min duration satisfied": "Yes", "Min latency (ns)": 14391705, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 17.64, "QPS w/o loadgen overhead": 17.65, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 168.853453, "characteristics.90th_percentile_latency_ns": 168853453.0, "characteristics.90th_percentile_latency_s": 0.168853453, "characteristics.90th_percentile_latency_us": 168853.453, "characteristics.accuracy": 61.224, "characteristics.good": 30612, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-96-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-1.0-96-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_1.0_96.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 14.0845, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "6ac59c6a8674a6ba", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 2749544, "90.00 percentile latency (ns)": 3015543, "90th percentile latency (ns)": 3015543, "95.00 percentile latency (ns)": 3563294, "97.00 percentile latency (ns)": 4429836, "99.00 percentile latency (ns)": 16291178, "99.90 percentile latency (ns)": 83361023, "Max latency (ns)": 106095271, "Mean latency (ns)": 3233656, "Min duration satisfied": "Yes", "Min latency (ns)": 2188960, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 306.51, "QPS w/o loadgen overhead": 309.25, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 3.015543, "characteristics.90th_percentile_latency_ns": 3015543.0, "characteristics.90th_percentile_latency_s": 0.003015543, "characteristics.90th_percentile_latency_us": 3015.543, "characteristics.accuracy": 42.384, "characteristics.good": 21192, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.25-128-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.25-128-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.25_128_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 250, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "5049fd3f20744764", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 96113123, "90.00 percentile latency (ns)": 228931011, "90th percentile latency (ns)": 228931011, "95.00 percentile latency (ns)": 239924777, "97.00 percentile latency (ns)": 245077423, "99.00 percentile latency (ns)": 253878340, "99.90 percentile latency (ns)": 271382449, "Max latency (ns)": 284135526, "Mean latency (ns)": 125464985, "Min duration satisfied": "Yes", "Min latency (ns)": 75414155, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 7.97, "QPS w/o loadgen overhead": 7.97, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 228.931011, "characteristics.90th_percentile_latency_ns": 228931011.0, "characteristics.90th_percentile_latency_s": 0.228931011, "characteristics.90th_percentile_latency_us": 228931.011, "characteristics.accuracy": 75.012, "characteristics.good": 37506, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.3-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-1.3-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_1.3_224.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 7.46269, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "6490e46c1e2b2db2", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 12036802, "90.00 percentile latency (ns)": 21483019, "90th percentile latency (ns)": 21483019, "95.00 percentile latency (ns)": 44875567, "97.00 percentile latency (ns)": 92256143, "99.00 percentile latency (ns)": 122513130, "99.90 percentile latency (ns)": 136257003, "Max latency (ns)": 144366340, "Mean latency (ns)": 17455047, "Min duration satisfied": "Yes", "Min latency (ns)": 11346125, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 57.24, "QPS w/o loadgen overhead": 57.29, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 21.483019, "characteristics.90th_percentile_latency_ns": 21483019.0, "characteristics.90th_percentile_latency_s": 0.021483019, "characteristics.90th_percentile_latency_us": 21483.019, "characteristics.accuracy": 64.486, "characteristics.good": 32243, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-small_224_1.0_uint8", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v3-small_224_1.0_uint8", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-small_224_1.0_uint8.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 41.6667, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "fc6c704b40977efc", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 243848970, "90.00 percentile latency (ns)": 298329335, "90th percentile latency (ns)": 298329335, "95.00 percentile latency (ns)": 307291037, "97.00 percentile latency (ns)": 312102970, "99.00 percentile latency (ns)": 321092681, "99.90 percentile latency (ns)": 332047095, "Max latency (ns)": 338177891, "Mean latency (ns)": 231050807, "Min duration satisfied": "Yes", "Min latency (ns)": 122919508, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 4.33, "QPS w/o loadgen overhead": 4.33, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 298.329335, "characteristics.90th_percentile_latency_ns": 298329335.0, "characteristics.90th_percentile_latency_s": 0.298329335, "characteristics.90th_percentile_latency_us": 298329.335, "characteristics.accuracy": 77.542, "characteristics.good": 38771, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite2-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "efficientnet-lite2-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite2.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 4.1841, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "c4147916a5908fc5", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 4827073, "90.00 percentile latency (ns)": 5459405, "90th percentile latency (ns)": 5459405, "95.00 percentile latency (ns)": 6798152, "97.00 percentile latency (ns)": 8920026, "99.00 percentile latency (ns)": 53805415, "99.90 percentile latency (ns)": 97786919, "Max latency (ns)": 117296512, "Mean latency (ns)": 6009059, "Min duration satisfied": "Yes", "Min latency (ns)": 4177826, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 165.42, "QPS w/o loadgen overhead": 166.42, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 5.459405, "characteristics.90th_percentile_latency_ns": 5459405.0, "characteristics.90th_percentile_latency_s": 0.005459405, "characteristics.90th_percentile_latency_us": 5459.405, "characteristics.accuracy": 56.75, "characteristics.good": 28375, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.5-128-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.5-128-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.5_128_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 142.857, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "df10c4f5b957bc0c", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 6483459, "90.00 percentile latency (ns)": 7583042, "90th percentile latency (ns)": 7583042, "95.00 percentile latency (ns)": 9293376, "97.00 percentile latency (ns)": 17840335, "99.00 percentile latency (ns)": 63090131, "99.90 percentile latency (ns)": 165986641, "Max latency (ns)": 192259104, "Mean latency (ns)": 8328760, "Min duration satisfied": "Yes", "Min latency (ns)": 5775876, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 119.54, "QPS w/o loadgen overhead": 120.07, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 7.583042, "characteristics.90th_percentile_latency_ns": 7583042.0, "characteristics.90th_percentile_latency_s": 0.007583042, "characteristics.90th_percentile_latency_us": 7583.042, "characteristics.accuracy": 57.002, "characteristics.good": 28501, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-96-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.75-96-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_96_75.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 125, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "bc5b7e3aa297ae00", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 99125647, "90.00 percentile latency (ns)": 232380799, "90th percentile latency (ns)": 232380799, "95.00 percentile latency (ns)": 244867161, "97.00 percentile latency (ns)": 249835240, "99.00 percentile latency (ns)": 259635698, "99.90 percentile latency (ns)": 279420711, "Max latency (ns)": 289281524, "Mean latency (ns)": 127163377, "Min duration satisfied": "Yes", "Min latency (ns)": 80729326, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 7.86, "QPS w/o loadgen overhead": 7.86, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 232.380799, "characteristics.90th_percentile_latency_ns": 232380799.0, "characteristics.90th_percentile_latency_s": 0.232380799, "characteristics.90th_percentile_latency_us": 232380.799, "characteristics.accuracy": 75.69, "characteristics.good": 37845, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.4-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-1.4-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_1.4_224.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 7.8125, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "01a847a4bdc23882", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 11721238, "90.00 percentile latency (ns)": 111787400, "90th percentile latency (ns)": 111787400, "95.00 percentile latency (ns)": 147639398, "97.00 percentile latency (ns)": 157290146, "99.00 percentile latency (ns)": 167054418, "99.90 percentile latency (ns)": 182406889, "Max latency (ns)": 192920314, "Mean latency (ns)": 37716950, "Min duration satisfied": "Yes", "Min latency (ns)": 7497604, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 26.48, "QPS w/o loadgen overhead": 26.51, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 111.7874, "characteristics.90th_percentile_latency_ns": 111787400.0, "characteristics.90th_percentile_latency_s": 0.1117874, "characteristics.90th_percentile_latency_us": 111787.4, "characteristics.accuracy": 52.446, "characteristics.good": 26223, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-96-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.5-96-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.5_96.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 23.2558, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "9c73b5ba7368413f", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 43988211, "90.00 percentile latency (ns)": 178022175, "90th percentile latency (ns)": 178022175, "95.00 percentile latency (ns)": 188232770, "97.00 percentile latency (ns)": 192904211, "99.00 percentile latency (ns)": 199172376, "99.90 percentile latency (ns)": 210536332, "Max latency (ns)": 230974525, "Mean latency (ns)": 72854307, "Min duration satisfied": "Yes", "Min latency (ns)": 36749680, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 13.72, "QPS w/o loadgen overhead": 13.73, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 178.022175, "characteristics.90th_percentile_latency_ns": 178022175.0, "characteristics.90th_percentile_latency_s": 0.178022175, "characteristics.90th_percentile_latency_us": 178022.175, "characteristics.accuracy": 73.724, "characteristics.good": 36862, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-large_224_0.75_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v3-large_224_0.75_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-large_224_0.75_float.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 12.0482, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "c8a5464fe19037ff", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 33457731, "90.00 percentile latency (ns)": 115689280, "90th percentile latency (ns)": 115689280, "95.00 percentile latency (ns)": 120235867, "97.00 percentile latency (ns)": 122501329, "99.00 percentile latency (ns)": 126515372, "99.90 percentile latency (ns)": 133160611, "Max latency (ns)": 150520983, "Mean latency (ns)": 55294256, "Min duration satisfied": "Yes", "Min latency (ns)": 24161973, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 18.06, "QPS w/o loadgen overhead": 18.09, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 115.68928, "characteristics.90th_percentile_latency_ns": 115689280.0, "characteristics.90th_percentile_latency_s": 0.11568928, "characteristics.90th_percentile_latency_us": 115689.28, "characteristics.accuracy": 66.604, "characteristics.good": 33302, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-1.0-128-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-1.0-128-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_1.0_128.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 15.873, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "74c14bcb09fb8703", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 38755458, "90.00 percentile latency (ns)": 121937577, "90th percentile latency (ns)": 121937577, "95.00 percentile latency (ns)": 128653195, "97.00 percentile latency (ns)": 132230979, "99.00 percentile latency (ns)": 137968642, "99.90 percentile latency (ns)": 146885468, "Max latency (ns)": 152673921, "Mean latency (ns)": 58018478, "Min duration satisfied": "Yes", "Min latency (ns)": 34360921, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 17.22, "QPS w/o loadgen overhead": 17.24, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 121.937577, "characteristics.90th_percentile_latency_ns": 121937577.0, "characteristics.90th_percentile_latency_s": 0.121937577, "characteristics.90th_percentile_latency_us": 121937.577, "characteristics.accuracy": 69.106, "characteristics.good": 34553, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-1.0-160-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-1.0-160-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_1.0_160.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 16.9492, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "4718a60db9bf8e43", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 19350035, "90.00 percentile latency (ns)": 160373772, "90th percentile latency (ns)": 160373772, "95.00 percentile latency (ns)": 172283924, "97.00 percentile latency (ns)": 177124693, "99.00 percentile latency (ns)": 185596817, "99.90 percentile latency (ns)": 197655133, "Max latency (ns)": 206874427, "Mean latency (ns)": 51139182, "Min duration satisfied": "Yes", "Min latency (ns)": 11498079, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 19.53, "QPS w/o loadgen overhead": 19.55, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 160.373772, "characteristics.90th_percentile_latency_ns": 160373772.0, "characteristics.90th_percentile_latency_s": 0.160373772, "characteristics.90th_percentile_latency_us": 160373.772, "characteristics.accuracy": 59.822, "characteristics.good": 29911, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-96-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.75-96-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.75_96.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 14.7059, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "5402e45f998d10ac", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 20383798, "90.00 percentile latency (ns)": 123877189, "90th percentile latency (ns)": 123877189, "95.00 percentile latency (ns)": 133162654, "97.00 percentile latency (ns)": 136264384, "99.00 percentile latency (ns)": 141942488, "99.90 percentile latency (ns)": 150222066, "Max latency (ns)": 173610610, "Mean latency (ns)": 40443163, "Min duration satisfied": "Yes", "Min latency (ns)": 19249502, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 24.72, "QPS w/o loadgen overhead": 24.73, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 123.877189, "characteristics.90th_percentile_latency_ns": 123877189.0, "characteristics.90th_percentile_latency_s": 0.123877189, "characteristics.90th_percentile_latency_us": 123877.189, "characteristics.accuracy": 68.336, "characteristics.good": 34168, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-small_224_1.0_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v3-small_224_1.0_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-small_224_1.0_float.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 19.6078, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "00e4d9890b38eeb9", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 32196498, "90.00 percentile latency (ns)": 160903694, "90th percentile latency (ns)": 160903694, "95.00 percentile latency (ns)": 188515520, "97.00 percentile latency (ns)": 194370447, "99.00 percentile latency (ns)": 202270529, "99.90 percentile latency (ns)": 216298568, "Max latency (ns)": 237935194, "Mean latency (ns)": 58375633, "Min duration satisfied": "Yes", "Min latency (ns)": 29733663, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 17.12, "QPS w/o loadgen overhead": 17.13, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 160.903694, "characteristics.90th_percentile_latency_ns": 160903694.0, "characteristics.90th_percentile_latency_s": 0.160903694, "characteristics.90th_percentile_latency_us": 160903.694, "characteristics.accuracy": 68.834, "characteristics.good": 34417, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-192-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.75-192-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.75_192.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 13.8889, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "aca81543f4e549e4", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 37749101, "90.00 percentile latency (ns)": 87996361, "90th percentile latency (ns)": 87996361, "95.00 percentile latency (ns)": 151407989, "97.00 percentile latency (ns)": 175164273, "99.00 percentile latency (ns)": 192469186, "99.90 percentile latency (ns)": 202696471, "Max latency (ns)": 210160995, "Mean latency (ns)": 51705064, "Min duration satisfied": "Yes", "Min latency (ns)": 34763554, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 19.32, "QPS w/o loadgen overhead": 19.34, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 87.996361, "characteristics.90th_percentile_latency_ns": 87996361.0, "characteristics.90th_percentile_latency_s": 0.087996361, "characteristics.90th_percentile_latency_us": 87996.361, "characteristics.accuracy": 71.19, "characteristics.good": 35595, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite0-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "efficientnet-lite0-quantized", "input_data_types": "uint8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite0.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 18.5185, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "79c2eb0a44534aea", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 338680809, "90.00 percentile latency (ns)": 384612403, "90th percentile latency (ns)": 384612403, "95.00 percentile latency (ns)": 394515685, "97.00 percentile latency (ns)": 399255809, "99.00 percentile latency (ns)": 408530941, "99.90 percentile latency (ns)": 430439075, "Max latency (ns)": 435983293, "Mean latency (ns)": 330610900, "Min duration satisfied": "Yes", "Min latency (ns)": 183702418, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 3.02, "QPS w/o loadgen overhead": 3.02, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 384.612403, "characteristics.90th_percentile_latency_ns": 384612403.0, "characteristics.90th_percentile_latency_s": 0.384612403, "characteristics.90th_percentile_latency_us": 384612.403, "characteristics.accuracy": 79.268, "characteristics.good": 39634, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite3-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "efficientnet-lite3-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite3.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 3.0581, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "2d1201ddd5242e2a", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 24694538, "90.00 percentile latency (ns)": 129951774, "90th percentile latency (ns)": 129951774, "95.00 percentile latency (ns)": 134376796, "97.00 percentile latency (ns)": 136962849, "99.00 percentile latency (ns)": 142270004, "99.90 percentile latency (ns)": 151067955, "Max latency (ns)": 163389164, "Mean latency (ns)": 55418062, "Min duration satisfied": "Yes", "Min latency (ns)": 16776661, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 18.04, "QPS w/o loadgen overhead": 18.04, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 129.951774, "characteristics.90th_percentile_latency_ns": 129951774.0, "characteristics.90th_percentile_latency_s": 0.129951774, "characteristics.90th_percentile_latency_us": 129951.774, "characteristics.accuracy": 66.216, "characteristics.good": 33108, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-small_224_0.75_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v3-small_224_0.75_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-small_224_0.75_float.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 15.3846, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "084cd6bf9b29003e", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 127614923, "90.00 percentile latency (ns)": 295375440, "90th percentile latency (ns)": 295375440, "95.00 percentile latency (ns)": 312290088, "97.00 percentile latency (ns)": 320011379, "99.00 percentile latency (ns)": 331350400, "99.90 percentile latency (ns)": 355252532, "Max latency (ns)": 374912734, "Mean latency (ns)": 171502423, "Min duration satisfied": "Yes", "Min latency (ns)": 104126544, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 5.83, "QPS w/o loadgen overhead": 5.83, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 295.37544, "characteristics.90th_percentile_latency_ns": 295375440.0, "characteristics.90th_percentile_latency_s": 0.29537544, "characteristics.90th_percentile_latency_us": 295375.44, "characteristics.accuracy": 76.344, "characteristics.good": 38172, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "efficientnet-lite3-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "efficientnet-lite3-quantized", "input_data_types": "uint8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/lite/efficientnet-lite3.tar.gz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 6.09756, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "435abd5ddb58f5c6", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 7052199, "90.00 percentile latency (ns)": 8092319, "90th percentile latency (ns)": 8092319, "95.00 percentile latency (ns)": 9371529, "97.00 percentile latency (ns)": 14645439, "99.00 percentile latency (ns)": 54385800, "99.90 percentile latency (ns)": 166369944, "Max latency (ns)": 200222067, "Mean latency (ns)": 8549616, "Min duration satisfied": "Yes", "Min latency (ns)": 6038076, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 116.51, "QPS w/o loadgen overhead": 116.96, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 8.092319, "characteristics.90th_percentile_latency_ns": 8092319.0, "characteristics.90th_percentile_latency_s": 0.008092319, "characteristics.90th_percentile_latency_us": 8092.319, "characteristics.accuracy": 54.568, "characteristics.good": 27284, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-160-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.35-160-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_160_35.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 125, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "165e83836949da99", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 9389939, "90.00 percentile latency (ns)": 27312014, "90th percentile latency (ns)": 27312014, "95.00 percentile latency (ns)": 66791822, "97.00 percentile latency (ns)": 84217551, "99.00 percentile latency (ns)": 95790576, "99.90 percentile latency (ns)": 107371284, "Max latency (ns)": 122592144, "Mean latency (ns)": 15805190, "Min duration satisfied": "Yes", "Min latency (ns)": 8632484, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 63.05, "QPS w/o loadgen overhead": 63.27, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 27.312014, "characteristics.90th_percentile_latency_ns": 27312014.0, "characteristics.90th_percentile_latency_s": 0.027312014, "characteristics.90th_percentile_latency_us": 27312.014, "characteristics.accuracy": 49.478, "characteristics.good": 24739, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.25-192-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.25-192-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.25_192.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 71.4286, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "90a357582f5a2241", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 19217346, "90.00 percentile latency (ns)": 56041496, "90th percentile latency (ns)": 56041496, "95.00 percentile latency (ns)": 101080360, "97.00 percentile latency (ns)": 109438950, "99.00 percentile latency (ns)": 116642578, "99.90 percentile latency (ns)": 126036876, "Max latency (ns)": 136443214, "Mean latency (ns)": 28739025, "Min duration satisfied": "Yes", "Min latency (ns)": 18543304, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 34.71, "QPS w/o loadgen overhead": 34.8, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 56.041496, "characteristics.90th_percentile_latency_ns": 56041496.0, "characteristics.90th_percentile_latency_s": 0.056041496, "characteristics.90th_percentile_latency_us": 56041.496, "characteristics.accuracy": 68.126, "characteristics.good": 34063, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.75-224-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.75-224-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.75_224_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 43.4783, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "f823e461ec34334a", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 51468921, "90.00 percentile latency (ns)": 185910559, "90th percentile latency (ns)": 185910559, "95.00 percentile latency (ns)": 200095258, "97.00 percentile latency (ns)": 204715220, "99.00 percentile latency (ns)": 213693040, "99.90 percentile latency (ns)": 223655815, "Max latency (ns)": 236151031, "Mean latency (ns)": 83477230, "Min duration satisfied": "Yes", "Min latency (ns)": 46050639, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 11.98, "QPS w/o loadgen overhead": 11.98, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 185.910559, "characteristics.90th_percentile_latency_ns": 185910559.0, "characteristics.90th_percentile_latency_s": 0.185910559, "characteristics.90th_percentile_latency_us": 185910.559, "characteristics.accuracy": 75.76, "characteristics.good": 37880, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-large_224_1.0_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v3-large_224_1.0_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-large_224_1.0_float.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 13.3333, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "3181a73c7497abf8", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 42534055, "90.00 percentile latency (ns)": 186664897, "90th percentile latency (ns)": 186664897, "95.00 percentile latency (ns)": 193130920, "97.00 percentile latency (ns)": 197007772, "99.00 percentile latency (ns)": 203216855, "99.90 percentile latency (ns)": 214667317, "Max latency (ns)": 226096280, "Mean latency (ns)": 78798543, "Min duration satisfied": "Yes", "Min latency (ns)": 25397175, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 12.68, "QPS w/o loadgen overhead": 12.69, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 186.664897, "characteristics.90th_percentile_latency_ns": 186664897.0, "characteristics.90th_percentile_latency_s": 0.186664897, "characteristics.90th_percentile_latency_us": 186664.897, "characteristics.accuracy": 65.75, "characteristics.good": 32875, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.5-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.5_224.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 14.2857, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "93aa78bc751a361e", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 11468668, "90.00 percentile latency (ns)": 14440978, "90th percentile latency (ns)": 14440978, "95.00 percentile latency (ns)": 24735630, "97.00 percentile latency (ns)": 41381753, "99.00 percentile latency (ns)": 93226260, "99.90 percentile latency (ns)": 111032272, "Max latency (ns)": 121044296, "Mean latency (ns)": 14277895, "Min duration satisfied": "Yes", "Min latency (ns)": 10718798, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 69.84, "QPS w/o loadgen overhead": 70.04, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 14.440978, "characteristics.90th_percentile_latency_ns": 14440978.0, "characteristics.90th_percentile_latency_s": 0.014440978, "characteristics.90th_percentile_latency_us": 14440.978, "characteristics.accuracy": 64.768, "characteristics.good": 32384, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-1.0-128-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-1.0-128-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_1.0_128_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 66.6667, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "30355c9484ebbda8", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 46440958, "90.00 percentile latency (ns)": 169783095, "90th percentile latency (ns)": 169783095, "95.00 percentile latency (ns)": 198553376, "97.00 percentile latency (ns)": 205144817, "99.00 percentile latency (ns)": 212489210, "99.90 percentile latency (ns)": 225700565, "Max latency (ns)": 238968028, "Mean latency (ns)": 69951840, "Min duration satisfied": "Yes", "Min latency (ns)": 40195358, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 14.29, "QPS w/o loadgen overhead": 14.3, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 169.783095, "characteristics.90th_percentile_latency_ns": 169783095.0, "characteristics.90th_percentile_latency_s": 0.169783095, "characteristics.90th_percentile_latency_us": 169783.095, "characteristics.accuracy": 70.122, "characteristics.good": 35061, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.75-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.75_224.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 14.7059, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "47b89d3f7f7b547c", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 11225102, "90.00 percentile latency (ns)": 13882770, "90th percentile latency (ns)": 13882770, "95.00 percentile latency (ns)": 23419365, "97.00 percentile latency (ns)": 37345636, "99.00 percentile latency (ns)": 90020162, "99.90 percentile latency (ns)": 110272613, "Max latency (ns)": 129847445, "Mean latency (ns)": 13763619, "Min duration satisfied": "Yes", "Min latency (ns)": 10297306, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 72.46, "QPS w/o loadgen overhead": 72.66, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 13.88277, "characteristics.90th_percentile_latency_ns": 13882770.0, "characteristics.90th_percentile_latency_s": 0.01388277, "characteristics.90th_percentile_latency_us": 13882.77, "characteristics.accuracy": 64.08, "characteristics.good": 32040, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.75-160-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.75-160-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.75_160_quant.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 66.6667, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "5f48cd2a35e2de47", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 20367954, "90.00 percentile latency (ns)": 148922073, "90th percentile latency (ns)": 148922073, "95.00 percentile latency (ns)": 179249210, "97.00 percentile latency (ns)": 185605834, "99.00 percentile latency (ns)": 194590426, "99.90 percentile latency (ns)": 207254988, "Max latency (ns)": 221414826, "Mean latency (ns)": 46216769, "Min duration satisfied": "Yes", "Min latency (ns)": 18826787, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 21.62, "QPS w/o loadgen overhead": 21.64, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 148.922073, "characteristics.90th_percentile_latency_ns": 148922073.0, "characteristics.90th_percentile_latency_s": 0.148922073, "characteristics.90th_percentile_latency_us": 148922.073, "characteristics.accuracy": 64.282, "characteristics.good": 32141, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-192-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.5-192-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.5_192.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 25.641, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "64a5ba4b7d9be08a", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 45663323, "90.00 percentile latency (ns)": 179931655, "90th percentile latency (ns)": 179931655, "95.00 percentile latency (ns)": 190818048, "97.00 percentile latency (ns)": 195054529, "99.00 percentile latency (ns)": 201582608, "99.90 percentile latency (ns)": 215828415, "Max latency (ns)": 228741940, "Mean latency (ns)": 74988155, "Min duration satisfied": "Yes", "Min latency (ns)": 37700791, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 13.33, "QPS w/o loadgen overhead": 13.34, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 179.931655, "characteristics.90th_percentile_latency_ns": 179931655.0, "characteristics.90th_percentile_latency_s": 0.179931655, "characteristics.90th_percentile_latency_us": 179931.655, "characteristics.accuracy": 72.678, "characteristics.good": 36339, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v3-large-minimalistic_224_1.0_float", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v3-large-minimalistic_224_1.0_float", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v3/checkpoints/v3-large-minimalistic_224_1.0_float.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 13.5135, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "77ee8654fb792332", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 13472327, "90.00 percentile latency (ns)": 16677745, "90th percentile latency (ns)": 16677745, "95.00 percentile latency (ns)": 31798268, "97.00 percentile latency (ns)": 50458982, "99.00 percentile latency (ns)": 150205507, "99.90 percentile latency (ns)": 193721578, "Max latency (ns)": 214138863, "Mean latency (ns)": 17412362, "Min duration satisfied": "Yes", "Min latency (ns)": 12094214, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 57.29, "QPS w/o loadgen overhead": 57.43, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 16.677745, "characteristics.90th_percentile_latency_ns": 16677745.0, "characteristics.90th_percentile_latency_s": 0.016677745, "characteristics.90th_percentile_latency_us": 16677.745, "characteristics.accuracy": 64.972, "characteristics.good": 32486, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-160-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.75-160-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_160_75.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 41.6667, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "4ef59e7b55056aea", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 59963586, "90.00 percentile latency (ns)": 182029805, "90th percentile latency (ns)": 182029805, "95.00 percentile latency (ns)": 211403045, "97.00 percentile latency (ns)": 217823881, "99.00 percentile latency (ns)": 227027353, "99.90 percentile latency (ns)": 242318174, "Max latency (ns)": 253149982, "Mean latency (ns)": 81394957, "Min duration satisfied": "Yes", "Min latency (ns)": 50252138, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 12.28, "QPS w/o loadgen overhead": 12.29, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 182.029805, "characteristics.90th_percentile_latency_ns": 182029805.0, "characteristics.90th_percentile_latency_s": 0.182029805, "characteristics.90th_percentile_latency_us": 182029.805, "characteristics.accuracy": 71.77, "characteristics.good": 35885, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-1.0-224-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-1.0-224-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_1.0_224.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 11.4943, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "425486837bf52fe9", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 30073037, "90.00 percentile latency (ns)": 182199877, "90th percentile latency (ns)": 182199877, "95.00 percentile latency (ns)": 191283729, "97.00 percentile latency (ns)": 194947517, "99.00 percentile latency (ns)": 202214967, "99.90 percentile latency (ns)": 218102169, "Max latency (ns)": 230073624, "Mean latency (ns)": 66258422, "Min duration satisfied": "Yes", "Min latency (ns)": 22349261, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 15.08, "QPS w/o loadgen overhead": 15.09, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 182.199877, "characteristics.90th_percentile_latency_ns": 182199877.0, "characteristics.90th_percentile_latency_s": 0.182199877, "characteristics.90th_percentile_latency_us": 182199.877, "characteristics.accuracy": 66.75, "characteristics.good": 33375, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.75-160-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.75-160-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.75_160.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 21.2766, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "c02a44f2fafddd80", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 10105665, "90.00 percentile latency (ns)": 91087770, "90th percentile latency (ns)": 91087770, "95.00 percentile latency (ns)": 121333015, "97.00 percentile latency (ns)": 134812678, "99.00 percentile latency (ns)": 150460298, "99.90 percentile latency (ns)": 169069212, "Max latency (ns)": 179874001, "Mean latency (ns)": 30959111, "Min duration satisfied": "Yes", "Min latency (ns)": 6209874, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 32.25, "QPS w/o loadgen overhead": 32.3, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 91.08777, "characteristics.90th_percentile_latency_ns": 91087770.0, "characteristics.90th_percentile_latency_s": 0.09108777, "characteristics.90th_percentile_latency_us": 91087.77, "characteristics.accuracy": 47.14, "characteristics.good": 23570, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-96-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.35-96-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.35_96.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 71.4286, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "a2a6e173cb1e8b4e", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 17559204, "90.00 percentile latency (ns)": 156599541, "90th percentile latency (ns)": 156599541, "95.00 percentile latency (ns)": 169983837, "97.00 percentile latency (ns)": 175483555, "99.00 percentile latency (ns)": 182867926, "99.90 percentile latency (ns)": 195320377, "Max latency (ns)": 210273243, "Mean latency (ns)": 49918524, "Min duration satisfied": "Yes", "Min latency (ns)": 11373830, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 20.01, "QPS w/o loadgen overhead": 20.03, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 156.599541, "characteristics.90th_percentile_latency_ns": 156599541.0, "characteristics.90th_percentile_latency_s": 0.156599541, "characteristics.90th_percentile_latency_us": 156599.541, "characteristics.accuracy": 56.988, "characteristics.good": 28494, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-160-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.35-160-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.35_160.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 18.5185, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "296f77383b81a05c", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 36975938, "90.00 percentile latency (ns)": 108743825, "90th percentile latency (ns)": 108743825, "95.00 percentile latency (ns)": 112301012, "97.00 percentile latency (ns)": 114381960, "99.00 percentile latency (ns)": 118896112, "99.90 percentile latency (ns)": 127578834, "Max latency (ns)": 133596411, "Mean latency (ns)": 54781546, "Min duration satisfied": "Yes", "Min latency (ns)": 15670050, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 18.23, "QPS w/o loadgen overhead": 18.25, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 108.743825, "characteristics.90th_percentile_latency_ns": 108743825.0, "characteristics.90th_percentile_latency_s": 0.108743825, "characteristics.90th_percentile_latency_us": 108743.825, "characteristics.accuracy": 63.716, "characteristics.good": 31858, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v1-0.75-128-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v1-0.75-128-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2269307/files/mobilenet_v1_0.75_128.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 17.2414, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "58f531bae10a2bc5", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 6556617, "90.00 percentile latency (ns)": 7594362, "90th percentile latency (ns)": 7594362, "95.00 percentile latency (ns)": 8855246, "97.00 percentile latency (ns)": 13378108, "99.00 percentile latency (ns)": 49683963, "99.90 percentile latency (ns)": 169919574, "Max latency (ns)": 194789498, "Mean latency (ns)": 8104579, "Min duration satisfied": "Yes", "Min latency (ns)": 5472514, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 122.88, "QPS w/o loadgen overhead": 123.39, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 7.594362, "characteristics.90th_percentile_latency_ns": 7594362.0, "characteristics.90th_percentile_latency_s": 0.007594362, "characteristics.90th_percentile_latency_us": 7594.362, "characteristics.accuracy": 55.54, "characteristics.good": 27770, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.5-128-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.5-128-quantized", "input_data_types": "int8", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://storage.googleapis.com/mobilenet_v2/checkpoints/quantized_v2_128_50.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 125, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "1702154fc788f9dd", "use_accelerator": false, "weight_data_types": "int8", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 20976984, "90.00 percentile latency (ns)": 165854126, "90th percentile latency (ns)": 165854126, "95.00 percentile latency (ns)": 177221954, "97.00 percentile latency (ns)": 182063616, "99.00 percentile latency (ns)": 190492528, "99.90 percentile latency (ns)": 204728632, "Max latency (ns)": 221266486, "Mean latency (ns)": 55258917, "Min duration satisfied": "Yes", "Min latency (ns)": 14844023, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 18.08, "QPS w/o loadgen overhead": 18.1, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 165.854126, "characteristics.90th_percentile_latency_ns": 165854126.0, "characteristics.90th_percentile_latency_s": 0.165854126, "characteristics.90th_percentile_latency_us": 165854.126, "characteristics.accuracy": 59.322, "characteristics.good": 29661, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "open", "formal_model": "mobilenet-v2-0.35-192-non-quantized", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 120, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "mobilenet-v2-0.35-192-non-quantized", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/open/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://zenodo.org/record/2266646/files/mobilenet_v2_0.35_192.tgz", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 15.625, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "6d812c8c7b4af8bd", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TFLite" }, { "50.00 percentile latency (ns)": 413086676, "90.00 percentile latency (ns)": 414838695, "90th percentile latency (ns)": 414838695, "95.00 percentile latency (ns)": 415286343, "97.00 percentile latency (ns)": 415812713, "99.00 percentile latency (ns)": 416908249, "99.90 percentile latency (ns)": 425225132, "Max latency (ns)": 426155625, "Mean latency (ns)": 412730167, "Min duration satisfied": "Yes", "Min latency (ns)": 403893708, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 2.42, "QPS w/o loadgen overhead": 2.42, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 414.838695, "characteristics.90th_percentile_latency_ns": 414838695.0, "characteristics.90th_percentile_latency_s": 0.414838695, "characteristics.90th_percentile_latency_us": 414838.695, "characteristics.accuracy": 76.442, "characteristics.good": 38221, "characteristics.total": 50000, "ck_system": "firefly-armnn-v21.02-neon", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "closed", "formal_model": "resnet50-v1.5", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "resnet50", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/closed/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/closed/Krai/results/firefly-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://www.dropbox.com/s/vhuqo0wc39lky0a/resnet50_v1.no-argmax.tflite", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-armnn-v21.02-neon", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 2.5, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "9d5cb474ab0b6658", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TF -> TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 589167631, "90.00 percentile latency (ns)": 603680875, "90th percentile latency (ns)": 603680875, "95.00 percentile latency (ns)": 607960147, "97.00 percentile latency (ns)": 611826996, "99.00 percentile latency (ns)": 661061671, "99.90 percentile latency (ns)": 714376068, "Max latency (ns)": 722865773, "Mean latency (ns)": 590196558, "Min duration satisfied": "Yes", "Min latency (ns)": 569764409, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 1.69, "QPS w/o loadgen overhead": 1.69, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 603.680875, "characteristics.90th_percentile_latency_ns": 603680875.0, "characteristics.90th_percentile_latency_s": 0.603680875, "characteristics.90th_percentile_latency_us": 603680.875, "characteristics.accuracy": 76.442, "characteristics.good": 38221, "characteristics.power": 3.4435481215633357, "characteristics.power.normalized_per_core": 0.028696234346361132, "characteristics.power.normalized_per_processor": 3.4435481215633357, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.off-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan off", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "closed", "formal_model": "resnet50-v1.5", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 120, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "AMD EPYC 7V13 64-Core Processor", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "resnet50", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 120, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/closed/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/closed/Krai/results/rpi4coral-fan.off-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5 LTS (Linux-5.4.0-1055-azure-x86_64-with-Ubuntu-18.04-bionic)", "other_software_stack": "GCC 7.5.0; Python 3.7.10", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://www.dropbox.com/s/vhuqo0wc39lky0a/resnet50_v1.no-argmax.tflite", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by CK v2.5.8 (https://github.com/ctuning/ck)", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.off-tflite-v2.4.1-ruy", "system_name": "Microsoft Corporation 7.0 (Virtual Machine)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 1.81818, "task": "image classification", "task2": "image classification", "total_cores": 120, "uid": "e2b0b4de3fc43359", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TF -> TFLite" }, { "50.00 percentile latency (ns)": 554806855, "90.00 percentile latency (ns)": 555966181, "90th percentile latency (ns)": 555966181, "95.00 percentile latency (ns)": 556913577, "97.00 percentile latency (ns)": 558372138, "99.00 percentile latency (ns)": 563261714, "99.90 percentile latency (ns)": 578372854, "Max latency (ns)": 581154408, "Mean latency (ns)": 555006161, "Min duration satisfied": "Yes", "Min latency (ns)": 543793798, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 1.8, "QPS w/o loadgen overhead": 1.8, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "800 MHz", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "4 GiB (shared with host)", "accelerator_memory_configuration": "-", "accelerator_model_name": "Arm Mali-T860 MP4", "accelerator_on-chip_memories": "-", "accelerators_per_node": 1, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 555.966181, "characteristics.90th_percentile_latency_ns": 555966181.0, "characteristics.90th_percentile_latency_s": 0.555966181, "characteristics.90th_percentile_latency_us": 555966.181, "characteristics.accuracy": 76.442, "characteristics.good": 38221, "characteristics.total": 50000, "ck_system": "firefly-armnn-v21.02-opencl", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "closed", "formal_model": "resnet50-v1.5", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (OpenCL)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "resnet50", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 1, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/closed/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/closed/Krai/results/firefly-armnn-v21.02-opencl", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://www.dropbox.com/s/vhuqo0wc39lky0a/resnet50_v1.no-argmax.tflite", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-armnn-v21.02-opencl", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 2.5, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "fd9c9009485cb7b3", "use_accelerator": true, "weight_data_types": "fp32", "weight_transformations": "TF -> TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 49760932, "90.00 percentile latency (ns)": 68502340, "90th percentile latency (ns)": 68502340, "95.00 percentile latency (ns)": 78511161, "97.00 percentile latency (ns)": 86730642, "99.00 percentile latency (ns)": 96095375, "99.90 percentile latency (ns)": 108083443, "Max latency (ns)": 120593298, "Mean latency (ns)": 55518487, "Min duration satisfied": "Yes", "Min latency (ns)": 47022883, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 18.01, "QPS w/o loadgen overhead": 18.01, "Result is": "VALID", "SUT name": "ArmNN_TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 68.50234, "characteristics.90th_percentile_latency_ns": 68502340.0, "characteristics.90th_percentile_latency_s": 0.06850234, "characteristics.90th_percentile_latency_us": 68502.34, "characteristics.accuracy": 76.442, "characteristics.good": 38221, "characteristics.power": 1.2861309018079106, "characteristics.power.normalized_per_core": 0.16076636272598882, "characteristics.power.normalized_per_processor": 1.2861309018079106, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-armnn-v21.02-neon", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "closed", "formal_model": "resnet50-v1.5", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "ArmNN v21.02 (Neon)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "resnet50", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/closed/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/closed/Krai/results/xavier-power.0-fan.cool-armnn-v21.02-neon", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://www.dropbox.com/s/vhuqo0wc39lky0a/resnet50_v1.no-argmax.tflite", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.2", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-armnn-v21.02-neon", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 20, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "7740da597bae46f0", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TF -> TFLite -> ArmNN" }, { "50.00 percentile latency (ns)": 75739770, "90.00 percentile latency (ns)": 77975401, "90th percentile latency (ns)": 77975401, "95.00 percentile latency (ns)": 88838337, "97.00 percentile latency (ns)": 90892308, "99.00 percentile latency (ns)": 100776825, "99.90 percentile latency (ns)": 142315902, "Max latency (ns)": 162143685, "Mean latency (ns)": 77278132, "Min duration satisfied": "Yes", "Min latency (ns)": 73726788, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 12.94, "QPS w/o loadgen overhead": 12.94, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "", "accelerator_interconnect": "", "accelerator_interconnect_topology": "", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 77.975401, "characteristics.90th_percentile_latency_ns": 77975401.0, "characteristics.90th_percentile_latency_s": 0.077975401, "characteristics.90th_percentile_latency_us": 77975.401, "characteristics.accuracy": 76.442, "characteristics.good": 38221, "characteristics.power": 2.1778079688568277, "characteristics.power.normalized_per_core": 0.27222599610710346, "characteristics.power.normalized_per_processor": 2.1778079688568277, "characteristics.total": 50000, "ck_system": "xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "Fan mode: cool", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "closed", "formal_model": "resnet50-v1.5", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "32 GB", "host_memory_configuration": "", "host_networking": "", "host_networking_topology": "", "host_processor_caches": "8MB L2 (2MB per dual cluster)/4 MB L3 (shared)", "host_processor_core_count": 8, "host_processor_frequency": "2265.6 MHz", "host_processor_interconnect": "", "host_processor_model_name": "NVIDIA Carmel (ARMv8.2)", "host_processors_per_node": 1, "host_storage_capacity": "400 GB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "Power mode: MAXN", "informal_model": "resnet50", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 8, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/closed/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/closed/Krai/results/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 18.04.5", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://www.dropbox.com/s/vhuqo0wc39lky0a/resnet50_v1.no-argmax.tflite", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.2", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/xavier-power.0-fan.cool-tflite-v2.4.1-ruy", "system_name": "NVIDIA Jetson AGX Xavier", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 11.3636, "task": "image classification", "task2": "image classification", "total_cores": 8, "uid": "949404ebba6b9f9a", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TF -> TFLite" }, { "50.00 percentile latency (ns)": 591282177, "90.00 percentile latency (ns)": 606294547, "90th percentile latency (ns)": 606294547, "95.00 percentile latency (ns)": 611230567, "97.00 percentile latency (ns)": 613858717, "99.00 percentile latency (ns)": 646968602, "99.90 percentile latency (ns)": 727313337, "Max latency (ns)": 729805258, "Mean latency (ns)": 592611844, "Min duration satisfied": "Yes", "Min latency (ns)": 570831810, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 1.69, "QPS w/o loadgen overhead": 1.69, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 606.294547, "characteristics.90th_percentile_latency_ns": 606294547.0, "characteristics.90th_percentile_latency_s": 0.606294547, "characteristics.90th_percentile_latency_us": 606294.547, "characteristics.accuracy": 76.442, "characteristics.good": 38221, "characteristics.power": 3.970307008260607, "characteristics.power.normalized_per_core": 0.9925767520651517, "characteristics.power.normalized_per_processor": 3.970307008260607, "characteristics.total": 50000, "ck_system": "rpi4coral-fan.on-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "http://www.raspberrypiwiki.com/index.php/Armor_Case_B: fan on", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "closed", "formal_model": "resnet50-v1.5", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 128=4x32 KiB, L1D$ 128=4x32 KiB, L2$ 1 MiB", "host_processor_core_count": 4, "host_processor_frequency": "1500 MHz", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP4", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme Pro microSD", "hw_notes": "", "informal_model": "resnet50", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 4, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/closed/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/closed/Krai/results/rpi4coral-fan.on-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 20.04.2; kernel 5.4.0-1032-raspi #35-Ubuntu SMP PREEMPT (Fri Mar 19 20:52:40 UTC 2021)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://www.dropbox.com/s/vhuqo0wc39lky0a/resnet50_v1.no-argmax.tflite", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge 1.55.2", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/rpi4coral-fan.on-tflite-v2.4.1-ruy", "system_name": "Raspberry Pi 4", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 1.81818, "task": "image classification", "task2": "image classification", "total_cores": 4, "uid": "ff4a688a2f1882b1", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TF -> TFLite" }, { "50.00 percentile latency (ns)": 450754388, "90.00 percentile latency (ns)": 509104821, "90th percentile latency (ns)": 509104821, "95.00 percentile latency (ns)": 550684956, "97.00 percentile latency (ns)": 583679140, "99.00 percentile latency (ns)": 603389125, "99.90 percentile latency (ns)": 649859307, "Max latency (ns)": 676381492, "Mean latency (ns)": 461404812, "Min duration satisfied": "Yes", "Min latency (ns)": 409320513, "Min queries satisfied": "Yes", "Mode": "PerformanceOnly", "QPS w/ loadgen overhead": 2.17, "QPS w/o loadgen overhead": 2.17, "Result is": "VALID", "SUT name": "TFLite_SUT", "Scenario": "singlestream", "accelerator_frequency": "-", "accelerator_host_interconnect": "-", "accelerator_interconnect": "-", "accelerator_interconnect_topology": "-", "accelerator_memory_capacity": "-", "accelerator_memory_configuration": "-", "accelerator_model_name": "-", "accelerator_on-chip_memories": "-", "accelerators_per_node": 0, "accuracy_log_probability": 0, "accuracy_log_rng_seed": 0, "accuracy_log_sampling_target": 0, "characteristics.90th_percentile_latency_ms": 509.104821, "characteristics.90th_percentile_latency_ns": 509104821.0, "characteristics.90th_percentile_latency_s": 0.509104821, "characteristics.90th_percentile_latency_us": 509104.821, "characteristics.accuracy": 76.442, "characteristics.good": 38221, "characteristics.total": 50000, "ck_system": "firefly-tflite-v2.4.1-ruy", "ck_used": true, "cooling": "on-board fan", "dataset": "ImageNet 2012", "dataset_link": "https://github.com/ctuning/ck/blob/master/docs/mlperf-automation/datasets/imagenet2012.md", "dim_x_default": "characteristics.90th_percentile_latency_ms", "dim_y_default": "characteristics.accuracy", "dim_y_maximize": true, "division": "closed", "formal_model": "resnet50-v1.5", "formal_model_accuracy": 99.0, "formal_model_link": "https://github.com/mlcommons/ck-mlops/tree/main/package", "framework": "TFLite v2.4.1 (ruy)", "host_memory_capacity": "4 GiB", "host_memory_configuration": "-", "host_networking": "-", "host_networking_topology": "-", "host_processor_caches": "L1I$ 48 KiB, L1D$ 32 KiB, L2$ 1 MiB (big); L1I$ 32 KiB, L1D$ 32 KiB, L2$ 512 KiB (LITTLE)", "host_processor_core_count": 6, "host_processor_frequency": "1800 MHz (big), 1400 MHz (LITTLE)", "host_processor_interconnect": "-", "host_processor_model_name": "Arm Cortex-A72 MP2 (big); Arm Cortex-A53 MP4 (LITTLE)", "host_processors_per_node": 1, "host_storage_capacity": "128 GiB", "host_storage_type": "SanDisk Extreme microSD", "hw_notes": "", "informal_model": "resnet50", "input_data_types": "fp32", "key.accuracy": "characteristics.accuracy", "max_async_queries": 1, "max_duration (ms)": 0, "max_query_count": 0, "min_duration (ms)": 600000, "min_query_count": 1024, "mlperf_version": 1.0, "normalize_cores": 6, "normalize_processors": 1, "note_code": "https://github.com/mlcommons/inference_results_v1.0/tree/master/closed/Krai/code", "note_details": "https://github.com/mlcommons/inference_results_v1.0/tree/master/closed/Krai/results/firefly-tflite-v2.4.1-ruy", "number_of_nodes": 1, "operating_system": "Ubuntu 16.04.7 LTS; kernel 4.4.77 #554 (Thu Nov 30 11:30:11 HKT 2017)", "other_software_stack": "", "performance_issue_same": 0, "performance_issue_same_index": 0, "performance_issue_unique": 0, "performance_sample_count": 1024, "print_timestamps": 0, "problem": false, "qsl_rng_seed": 7322528924094909334, "retraining": "no", "sample_index_rng_seed": 1570999273408051088, "samples_per_query": 1, "schedule_rng_seed": 3507442325620259414, "starting_weights_filename": "https://www.dropbox.com/s/vhuqo0wc39lky0a/resnet50_v1.no-argmax.tflite", "status": "available", "submitter": "Krai", "submitter_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.submitter/Krai", "sw_notes": "Powered by Collective Knowledge v1.17.0", "system_link": "https://github.com/ctuning/ck-mlperf-inference/tree/main/bench.mlperf.system/firefly-tflite-v2.4.1-ruy", "system_name": "Firefly-RK3399 (firefly)", "system_type": "edge", "target_latency (ns)": 0, "target_qps": 1.83486, "task": "image classification", "task2": "image classification", "total_cores": 6, "uid": "0da6b3c5836bcdcf", "use_accelerator": false, "weight_data_types": "fp32", "weight_transformations": "TF -> TFLite" } ]