AM69A: edgeai-benchmark benchmarking on target with modelzoo model artifacts

Part Number: AM69A
Other Parts Discussed in Thread: AM68A

Tool/software:

Hi all,

I am running into problems when benchmarking on the AM69A target with edgeai-benchmark to determine inference time in ms. There are error messages in the log shown below.

Target side benchmarking log:

root@am69-sk:/mnt/edgeai-benchmark# ./run_benchmarks_evm.sh 
TARGET_SOC:     AM69A
TARGET_MACHINE: evm
DEBUG MODE:     false @ am69-sk:5678
TIDL_TOOLS_PATH=/mnt/edgeai-benchmark/tools/AM69A/tidl_tools
LD_LIBRARY_PATH=/mnt/edgeai-benchmark/tools/AM69A/tidl_tools
PYTHONPATH=:/usr/lib/python3.12/site-packages/
===================================================================
argv: ['./scripts/generate_models_list.py', 'settings_infer_on_evm.yaml', '--target_device', 'AM69A', '--models_list_file', './work_dirs/mod
elartifacts/benchmarks_models_list.txt', '--dataset_loading', 'False']
settings: {'include_files': None, 'pipeline_type': 'accuracy', 'num_frames': 100, 'calibration_frames': 25, 'calibration_iterations': 25, 'c
onfigs_path': './configs', 'models_path': '../edgeai-modelzoo/models', 'modelartifacts_path': '../edgeai-modelzoo/modelartifacts/AM69A', 'mo
delpackage_path': './work_dirs/modelpackage/AM69A', 'datasets_path': './dependencies/datasets', 'target_device': 'AM69A', 'target_machine': 
'evm', 'run_suffix': None, 'parallel_devices': None, 'parallel_processes': None, 'tensor_bits': 8, 'runtime_options': {'advanced_options:qua
ntization_scale_type': 4}, 'run_import': False, 'run_inference': True, 'run_missing': True, 'detection_threshold': 0.3, 'detection_top_k': 2
00, 'detection_nms_threshold': None, 'detection_keep_top_k': None, 'save_output': False, 'num_output_frames': 50, 'model_selection': 'od-822
0', 'model_shortlist': None, 'model_exclusion': None, 'task_selection': None, 'runtime_selection': None, 'session_type_dict': {'onnx': 'onnx
rt', 'tflite': 'tflitert', 'mxnet': 'tvmdlr'}, 'dataset_type_dict': None, 'dataset_selection': 'coco', 'dataset_loading': ['False'], 'config
_range': None, 'enable_logging': True, 'verbose': False, 'capture_log': False, 'experimental_models': False, 'rewrite_results': False, 'with
_udp': True, 'flip_test': False, 'model_transformation_dict': None, 'report_perfsim': False, 'tidl_offload': True, 'input_optimization': Non
e, 'run_dir_tree_depth': None, 'target_device_preset': True, 'fast_calibration_factor': 0.5, 'param_template_file': None, 'settings_file': '
settings_infer_on_evm.yaml', 'models_list_file': './work_dirs/modelartifacts/benchmarks_models_list.txt', 'basic_keys': ['include_files', 'p
ipeline_type', 'num_frames', 'calibration_frames', 'calibration_iterations', 'configs_path', 'models_path', 'modelartifacts_path', 'modelpac
kage_path', 'datasets_path', 'target_device', 'target_machine', 'run_suffix', 'parallel_devices', 'parallel_processes', 'tensor_bits', 'runt
ime_options', 'run_import', 'run_inference', 'run_missing', 'detection_threshold', 'detection_top_k', 'detection_nms_threshold', 'detection_
keep_top_k', 'save_output', 'num_output_frames', 'model_selection', 'model_shortlist', 'model_exclusion', 'task_selection', 'runtime_selecti
on', 'session_type_dict', 'dataset_type_dict', 'dataset_selection', 'dataset_loading', 'config_range', 'enable_logging', 'verbose', 'capture
_log', 'experimental_models', 'rewrite_results', 'with_udp', 'flip_test', 'model_transformation_dict', 'report_perfsim', 'tidl_offload', 'in
put_optimization', 'run_dir_tree_depth', 'target_device_preset', 'fast_calibration_factor', 'param_template_file', 'settings_file', 'models_
list_file'], 'dataset_cache': None}
work_dir: ../edgeai-modelzoo/modelartifacts/AM69A/8bits
Using model configs from Python module: ./configs
1
-------------------------------------------------------------------
running MODEL_ID:od-8220
argv: ['./scripts/benchmark_modelzoo.py', 'settings_infer_on_evm.yaml', '--target_device', 'AM69A', '--model_selection', 'od-8220']
settings: {'include_files': None, 'pipeline_type': 'accuracy', 'num_frames': 100, 'calibration_frames': 25, 'calibration_iterations': 25, 'c
onfigs_path': './configs', 'models_path': '../edgeai-modelzoo/models', 'modelartifacts_path': '../edgeai-modelzoo/modelartifacts/AM69A', 'mo
delpackage_path': './work_dirs/modelpackage/AM69A', 'datasets_path': './dependencies/datasets', 'target_device': 'AM69A', 'target_machine': 
'evm', 'run_suffix': None, 'parallel_devices': None, 'parallel_processes': None, 'tensor_bits': 8, 'runtime_options': {'advanced_options:qua
ntization_scale_type': 4}, 'run_import': False, 'run_inference': True, 'run_missing': True, 'detection_threshold': 0.3, 'detection_top_k': 2
00, 'detection_nms_threshold': None, 'detection_keep_top_k': None, 'save_output': False, 'num_output_frames': 50, 'model_selection': ['od-82
20'], 'model_shortlist': None, 'model_exclusion': None, 'task_selection': None, 'runtime_selection': None, 'session_type_dict': {'onnx': 'on
nxrt', 'tflite': 'tflitert', 'mxnet': 'tvmdlr'}, 'dataset_type_dict': None, 'dataset_selection': 'coco', 'dataset_loading': True, 'config_ra
nge': None, 'enable_logging': True, 'verbose': False, 'capture_log': False, 'experimental_models': False, 'rewrite_results': False, 'with_ud
p': True, 'flip_test': False, 'model_transformation_dict': None, 'report_perfsim': False, 'tidl_offload': True, 'input_optimization': None, 
'run_dir_tree_depth': None, 'target_device_preset': True, 'fast_calibration_factor': 0.5, 'param_template_file': None, 'settings_file': 'set
tings_infer_on_evm.yaml', 'basic_keys': ['include_files', 'pipeline_type', 'num_frames', 'calibration_frames', 'calibration_iterations', 'co
nfigs_path', 'models_path', 'modelartifacts_path', 'modelpackage_path', 'datasets_path', 'target_device', 'target_machine', 'run_suffix', 'p
arallel_devices', 'parallel_processes', 'tensor_bits', 'runtime_options', 'run_import', 'run_inference', 'run_missing', 'detection_threshold
', 'detection_top_k', 'detection_nms_threshold', 'detection_keep_top_k', 'save_output', 'num_output_frames', 'model_selection', 'model_short
list', 'model_exclusion', 'task_selection', 'runtime_selection', 'session_type_dict', 'dataset_type_dict', 'dataset_selection', 'dataset_loa
ding', 'config_range', 'enable_logging', 'verbose', 'capture_log', 'experimental_models', 'rewrite_results', 'with_udp', 'flip_test', 'model
_transformation_dict', 'report_perfsim', 'tidl_offload', 'input_optimization', 'run_dir_tree_depth', 'target_device_preset', 'fast_calibrati
on_factor', 'param_template_file', 'settings_file'], 'dataset_cache': None}
work_dir: ../edgeai-modelzoo/modelartifacts/AM69A/8bits
Using model configs from Python module: ./configs

INFO:20241004-172226: loading dataset - category:coco variant:coco
loading annotations into memory...
Done (t=1.67s)
creating index...
index created!
loading annotations into memory...
Done (t=1.38s)
creating index...
index created!
configs to run: ['od-8220_onnxrt_coco_edgeai-mmdet_yolox_s_lite_640x640_20220221_model_onnx']
number of configs: 1

INFO:20241004-172233: starting - od-8220_onnxrt_coco_edgeai-mmdet_yolox_s_lite_640x640_20220221_model_onnx
INFO:20241004-172233: model_path - /mnt/edgeai-modelzoo/models/vision/detection/coco/edgeai-mmdet/yolox_s_lite_640x640_20220221_model.onnx
INFO:20241004-172233: model_file - /mnt/edgeai-modelzoo/modelartifacts/AM69A/8bits/od-8220_onnxrt_coco_edgeai-mmdet_yolox_s_lite_640x640_202
20221_model_onnx/model/yolox_s_lite_640x640_20220221_model.onnx
INFO:20241004-172233: quant_file - /mnt/edgeai-modelzoo/modelartifacts/AM69A/8bits/od-8220_onnxrt_coco_edgeai-mmdet_yolox_s_lite_640x640_202
20221_model_onnx/model/yolox_s_lite_640x640_20220221_model_qparams.prototxt

INFO:20241004-172233: running - od-8220_onnxrt_coco_edgeai-mmdet_yolox_s_lite_640x640_20220221_model_onnx
INFO:20241004-172233: pipeline_config - {'task_type': 'detection', 'dataset_category': 'coco', 'calibration_dataset': <edgeai_benchmark.data
sets.coco_det.COCODetection object at 0xffff9df94d40>, 'input_dataset': <edgeai_benchmark.datasets.coco_det.COCODetection object at 0xffff7b
8afa40>, 'preprocess': <edgeai_benchmark.preprocess.PreProcessTransforms object at 0xffff6371fe60>, 'session': <edgeai_benchmark.sessions.on
nxrt_session.ONNXRTSession object at 0xffff6371fec0>, 'postprocess': <edgeai_benchmark.postprocess.PostProcessTransforms object at 0xffff637
34050>, 'metric': {'label_offset_pred': {0: 1, 1: 2, 2: 3, 3: 4, 4: 5, 5: 6, 6: 7, 7: 8, 8: 9, 9: 10, 10: 11, 11: 13, 12: 14, 13: 15, 14: 16
, 15: 17, 16: 18, 17: 19, 18: 20, 19: 21, 20: 22, 21: 23, 22: 24, 23: 25, 24: 27, 25: 28, 26: 31, 27: 32, 28: 33, 29: 34, 30: 35, 31: 36, 32
: 37, 33: 38, 34: 39, 35: 40, 36: 41, 37: 42, 38: 43, 39: 44, 40: 46, 41: 47, 42: 48, 43: 49, 44: 50, 45: 51, 46: 52, 47: 53, 48: 54, 49: 55
, 50: 56, 51: 57, 52: 58, 53: 59, 54: 60, 55: 61, 56: 62, 57: 63, 58: 64, 59: 65, 60: 67, 61: 70, 62: 72, 63: 73, 64: 74, 65: 75, 66: 76, 67
: 77, 68: 78, 69: 79, 70: 80, 71: 81, 72: 82, 73: 84, 74: 85, 75: 86, 76: 87, 77: 88, 78: 89, 79: 90, 80: 91}}, 'model_info': {'metric_refer
ence': {'accuracy_ap[.5:.95]%': 38.3}, 'model_shortlist': 10}}
INFO:20241004-172235: infer  - od-8220_onnxrt_coco_edgeai-mmdet_yolox_s_lite_640x640_20220221_model_onnx - this may take some time...libtidl
_onnxrt_EP loaded 0x289d1640 
Final number of subgraphs created are : 1, - Offloaded Nodes - 283, Total Nodes - 283 
APP: Init ... !!!
   569.481422 s: MEM: Init ... !!!
   569.481467 s: MEM: Initialized DMA HEAP (fd=6) !!!
   569.481605 s: MEM: Init ... Done !!!
   569.481627 s: IPC: Init ... !!!
   569.515808 s: IPC: Init ... Done !!!
REMOTE_SERVICE: Init ... !!!
REMOTE_SERVICE: Init ... Done !!!
   569.528198 s: GTC Frequency = 200 MHz
APP: Init ... Done !!!
   569.532463 s:  VX_ZONE_INIT:Enabled
   569.532475 s:  VX_ZONE_ERROR:Enabled
   569.532482 s:  VX_ZONE_WARNING:Enabled
   569.535955 s:  VX_ZONE_INIT:[tivxPlatformCreateTargetId:124] Added target MPU-0 
   569.536055 s:  VX_ZONE_INIT:[tivxPlatformCreateTargetId:124] Added target MPU-1 
   569.536145 s:  VX_ZONE_INIT:[tivxPlatformCreateTargetId:124] Added target MPU-2 
   569.536222 s:  VX_ZONE_INIT:[tivxPlatformCreateTargetId:124] Added target MPU-3 
   569.536234 s:  VX_ZONE_INIT:[tivxInitLocal:136] Initialization Done !!!
   569.545360 s:  VX_ZONE_INIT:[tivxHostInitLocal:106] Initialization Done for HOST !!!
TIDL_RT_OVX: ERROR: Config file size (375832 bytes) does not match size of sTIDL_IOBufDesc_t (378392 bytes)
   569.556562 s:  VX_ZONE_ERROR:[tivxAddKernelTIDL:269] invalid values for num_input_tensors or num_output_tensors 
   569.569444 s:  VX_ZONE_ERROR:[vxQueryKernel:159] Invalid kernel reference
   569.569484 s:  VX_ZONE_ERROR:[vxMapUserDataObject:389] Invalid user data object reference
   569.569496 s:  VX_ZONE_ERROR:[vxUnmapUserDataObject:474] Invalid user data object reference
   569.569533 s:  VX_ZONE_ERROR:[vxCreateNodeByStructure:91] failed to retrieve kernel enum 0
   569.569548 s:  VX_ZONE_ERROR:[vxSetReferenceName:970] Invalid reference
   569.569557 s:  VX_ZONE_ERROR:[vxSetReferenceName:970] Invalid reference
   569.569564 s:  VX_ZONE_ERROR:[vxSetReferenceName:970] Invalid reference
infer : od-8220_onnxrt_coco_edgeai-mmdet_yolox_s_lite_640x64|          |     0% 0/100| [< ]2024-10-04 17:22:38.080039566 [E:onnxruntime:, se
quential_executor.cc:494 ExecuteKernel] Non-zero status code returned while running TIDL_0 node. Name:'TIDLExecutionProvider_TIDL_0_0' Statu
s Message: cannot create std::vector larger than max_size()
infer : od-8220_onnxrt_coco_edgeai-mmdet_yolox_s_lite_640x64|   0%|          || 0/100 [00:00<?, ?it/s]
Traceback (most recent call last):
  File "/mnt/edgeai-benchmark/edgeai_benchmark/pipelines/pipeline_runner.py", line 203, in _run_pipeline
    result = cls._run_pipeline_impl(basic_settings, pipeline_config, description)
             ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "/mnt/edgeai-benchmark/edgeai_benchmark/pipelines/pipeline_runner.py", line 176, in _run_pipeline_impl
    accuracy_result = accuracy_pipeline(description)
                      ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "/mnt/edgeai-benchmark/edgeai_benchmark/pipelines/accuracy_pipeline.py", line 87, in __call__
    param_result = self._run(description=description)
                   ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "/mnt/edgeai-benchmark/edgeai_benchmark/pipelines/accuracy_pipeline.py", line 138, in _run
    output_list = self._infer_frames(description)
                  ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "/mnt/edgeai-benchmark/edgeai_benchmark/pipelines/accuracy_pipeline.py", line 207, in _infer_frames
    output, info_dict = self._run_with_log(session.infer_frame, data, info_dict)
                        ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "/mnt/edgeai-benchmark/edgeai_benchmark/pipelines/accuracy_pipeline.py", line 282, in _run_with_log
    return func(*args, **kwargs)
           ^^^^^^^^^^^^^^^^^^^^^
  File "/mnt/edgeai-benchmark/edgeai_benchmark/sessions/onnxrt_session.py", line 112, in infer_frame
    outputs = self.interpreter.run(output_keys, input_dict)
              ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "/usr/lib/python3.12/site-packages/onnxruntime/capi/onnxruntime_inference_collection.py", line 200, in run
    return self._sess.run(output_names, input_feed, run_options)
           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
onnxruntime.capi.onnxruntime_pybind11_state.RuntimeException: [ONNXRuntimeError] : 6 : RUNTIME_EXCEPTION : Non-zero status code returned whi
le running TIDL_0 node. Name:'TIDLExecutionProvider_TIDL_0_0' Status Message: cannot create std::vector larger than max_size()
[ONNXRuntimeError] : 6 : RUNTIME_EXCEPTION : Non-zero status code returned while running TIDL_0 node. Name:'TIDLExecutionProvider_TIDL_0_0' 
Status Message: cannot create std::vector larger than max_size()
   570.534894 s:  VX_ZONE_ERROR:[ownReleaseReferenceInt:594] Invalid reference
   570.534986 s:  VX_ZONE_ERROR:[vxRemoveKernel:306] Invalid kernel reference
   570.535079 s:  VX_ZONE_ERROR:[ownReleaseReferenceInt:594] Invalid reference
   570.537207 s:  VX_ZONE_INIT:[tivxHostDeInitLocal:120] De-Initialization Done for HOST !!!
   570.541838 s:  VX_ZONE_INIT:[tivxDeInitLocal:206] De-Initialization Done !!!
APP: Deinit ... !!!
REMOTE_SERVICE: Deinit ... !!!
REMOTE_SERVICE: Deinit ... Done !!!
   570.542765 s: IPC: Deinit ... !!!
   570.543725 s: IPC: DeInit ... Done !!!
   570.543755 s: MEM: Deinit ... !!!
   570.543767 s: DDR_SHARED_MEM: Alloc's: 4 alloc's of 11170964 bytes 
   570.543775 s: DDR_SHARED_MEM: Free's : 4 free's  of 11170964 bytes 
   570.543782 s: DDR_SHARED_MEM: Open's : 0 allocs  of 0 bytes 
   570.543794 s: MEM: Deinit ... Done !!!
APP: Deinit ... Done !!!
-------------------------------------------------------------------
settings: {'include_files': None, 'pipeline_type': 'accuracy', 'num_frames': 100, 'calibration_frames': 25, 'calibration_iterations': 25, 'c
onfigs_path': './configs', 'models_path': '../edgeai-modelzoo/models', 'modelartifacts_path': '../edgeai-modelzoo/modelartifacts/', 'modelpa
ckage_path': './work_dirs/modelpackage/', 'datasets_path': './dependencies/datasets', 'target_device': None, 'target_machine': 'evm', 'run_s
uffix': None, 'parallel_devices': None, 'parallel_processes': None, 'tensor_bits': 8, 'runtime_options': None, 'run_import': False, 'run_inf
erence': True, 'run_missing': True, 'detection_threshold': 0.3, 'detection_top_k': 200, 'detection_nms_threshold': None, 'detection_keep_top
_k': None, 'save_output': False, 'num_output_frames': 50, 'model_selection': 'od-8220', 'model_shortlist': None, 'model_exclusion': None, 't
ask_selection': None, 'runtime_selection': None, 'session_type_dict': {'onnx': 'onnxrt', 'tflite': 'tflitert', 'mxnet': 'tvmdlr'}, 'dataset_
type_dict': None, 'dataset_selection': 'coco', 'dataset_loading': True, 'config_range': None, 'enable_logging': True, 'verbose': False, 'cap
ture_log': False, 'experimental_models': False, 'rewrite_results': False, 'with_udp': True, 'flip_test': False, 'model_transformation_dict':
 None, 'report_perfsim': False, 'tidl_offload': True, 'input_optimization': None, 'run_dir_tree_depth': None, 'target_device_preset': True, 
'fast_calibration_factor': None, 'param_template_file': None, 'skip_pattern': '_package', 'settings_file': 'settings_infer_on_evm.yaml', 'ba
sic_keys': ['include_files', 'pipeline_type', 'num_frames', 'calibration_frames', 'calibration_iterations', 'configs_path', 'models_path', '
modelartifacts_path', 'modelpackage_path', 'datasets_path', 'target_device', 'target_machine', 'run_suffix', 'parallel_devices', 'parallel_p
rocesses', 'tensor_bits', 'runtime_options', 'run_import', 'run_inference', 'run_missing', 'detection_threshold', 'detection_top_k', 'detect
ion_nms_threshold', 'detection_keep_top_k', 'save_output', 'num_output_frames', 'model_selection', 'model_shortlist', 'model_exclusion', 'ta
sk_selection', 'runtime_selection', 'session_type_dict', 'dataset_type_dict', 'dataset_selection', 'dataset_loading', 'config_range', 'enabl
e_logging', 'verbose', 'capture_log', 'experimental_models', 'rewrite_results', 'with_udp', 'flip_test', 'model_transformation_dict', 'repor
t_perfsim', 'tidl_offload', 'input_optimization', 'run_dir_tree_depth', 'target_device_preset', 'fast_calibration_factor', 'param_template_f
ile', 'skip_pattern', 'settings_file'], 'dataset_cache': None}
results found for 1 models
Report generated at ../edgeai-modelzoo/modelartifacts/
-------------------------------------------------------------------

Setup:

[] edgeai-tensorlab on branch r9.2

[] Target set up with edgeai linux sdk 10.0 and python environment per instructions; I will insert the pip3 list below

[] Model used is the od-8220_onnxrt_coco_edgeai-mmdet_yolox_s_lite_640x640_20220221_model_onnx; the artifacts were downloaded to the modelzoo and then extracted.

[] confirmed that there is no result.yaml file in artifacts

[] modified settings_base.yaml to point artifacts to modelzoo

[] nfs mounted edgeai-benchmark and edgeai-modelzoo to the AM69A target

pip3 list

root@am69-sk:/mnt/edgeai-benchmark# pip3 list
Package           Version
----------------- ---------------
aiofiles          23.2.1
anyio             4.3.0
cffi              1.16.0
click             8.1.7
colorama          0.4.6
contourpy         1.3.0
cycler            0.12.1
Cython            3.0.11
debugpy           1.8.6
dlr               1.13.0
fonttools         4.54.1
gpiod             2.1.3
h11               0.14.0
h5py              3.12.1
idna              3.6
iniconfig         2.0.0
joblib            1.4.2
json-tricks       3.17.3
kiwisolver        1.4.7
Mako              1.3.2
MarkupSafe        2.1.5
matplotlib        3.9.2
meson             1.3.1
munkres           1.1.4
numpy             1.26.4
onnx              1.17.0
onnxruntime-tidl  1.14.0+10000005
packaging         23.2
pillow            10.3.0
pip               24.0
pluggy            1.5.0
ply               3.11
plyfile           1.1
protobuf          5.28.2
psutil            5.9.8
pybind11          2.11.1
pycairo           1.26.0
pycocotools       2.0.8
pycparser         2.21
pydantic          1.10.16
Pygments          2.17.2
PyGObject         3.46.0
pyparsing         3.1.4
pytest            8.3.3
python-dateutil   2.9.0.post0
python-multipart  0.0.5
PyYAML            6.0.1
scikit-learn      1.5.2
scipy             1.14.1
setuptools        69.1.1
six               1.16.0
sniffio           1.3.0
starlette         0.37.2
tflite-runtime    2.12.0
threadpoolctl     3.5.0
TI.GPIO           2.0.0
tqdm              4.66.5
typing_extensions 4.10.0
uvicorn           0.30.1
websocket-client  1.7.0
websockets        12.0
wheel             0.42.0
wurlitzer         3.1.1
yamlloader        1.4.1

settings_base.yaml changes

(ti-edgeai-benchmark) gunter@Linux-005:~/ti-edgeai/edgeai-tensorlab/edgeai-benchmark$ diff -Nurp settings_base.yaml.orig settings_base.yaml
--- settings_base.yaml.orig	2024-09-24 16:22:29.435917600 -0700
+++ settings_base.yaml	2024-10-04 10:11:40.570659833 -0700
@@ -13,7 +13,7 @@ target_device : null
 tensor_bits : 8
 
 # number of frames for inference
-num_frames : 1000 #10000 #50000
+num_frames : 100 #1000 #10000 #50000
 
 # number of frames to be used for post training quantization / calibration
 calibration_frames : 25 #50
@@ -38,7 +38,8 @@ models_path : '../edgeai-modelzoo/models
 datasets_path : './dependencies/datasets'
 
 # path where precompiled modelartifacts are placed
-modelartifacts_path : './work_dirs/modelartifacts/{target_device}'
+#modelartifacts_path : './work_dirs/modelartifacts/{target_device}'
+modelartifacts_path : '../edgeai-modelzoo/modelartifacts/{target_device}'
 
 # path where the packaged precompiled modelartifacts are placed
 modelpackage_path : './work_dirs/modelpackage/{target_device}'
@@ -52,7 +53,7 @@ session_type_dict : {'onnx':'onnxrt', 't
 #   examples: ['resnet18.onnx', 'resnet50_v1.tflite'] ['classification'] ['imagenet1k'] ['torchvision'] ['coco']
 #   examples: [cl-0000, od-2020, ss-2580, cl-3090, od-5120, ss-5710, cl-6360, od-8020, od-8200, od-8220, od-8420, ss-8610, kd-7060, 3dod-7100, 6dpose-7200, ss-7618]
 #   examples: [cl-0000, od-2020, cl-6360, od-8200, od-8270, od-8410, ss-8610, ss-8630, ss-8710, ss-8720]
-model_selection : null
+model_selection : od-8220
 
 # model_shortlist can be a number, which indicates a predefined shortlist, and a fraction of the models will be selected
 # model_shortlist and model_selection are complimentary - they can be used together.
@@ -78,7 +79,7 @@ runtime_selection : null
 # set this to null to run all the models
 # example: ['coco']
 # example: ['imagenet', 'coco', 'cocoseg21', 'ade20k', 'cocokpts', 'kitti_lidar_det', 'ti-robokit_semseg_zed1hd', 'ycbv']
-dataset_selection : null
+dataset_selection : coco
 
 # use TIDL offload to speedup inference
 tidl_offload : True
 

What could be missing in this setup? I purposely chose a straightforward model directly from the modelzoo, just to isolate any issues with the target-side benchmarking.

Thanks!

--Gunter

  • Hi all,

    I have another run, after using a fresh edgeai sdk v10.0 sdcard and a fresh install of the python dependencies.

    root@am69-sk:/mnt/edgeai-benchmark# ./run_benchmarks_evm.sh AM69A
    TARGET_SOC:     AM69A
    TARGET_MACHINE: evm
    DEBUG MODE:     false @ am69-sk:5678
    TIDL_TOOLS_PATH=/mnt/edgeai-benchmark/tools/AM69A/tidl_tools
    LD_LIBRARY_PATH=/mnt/edgeai-benchmark/tools/AM69A/tidl_tools
    PYTHONPATH=:/usr/lib/python3.12/site-packages/
    ===================================================================
    argv: ['./scripts/generate_models_list.py', 'settings_infer_on_evm.yaml', '--target_device', 'AM69A', '--models_list_file', './work_dirs/mod
    elartifacts/benchmarks_models_list.txt', '--dataset_loading', 'False']
    settings: {'include_files': None, 'pipeline_type': 'accuracy', 'num_frames': 100, 'calibration_frames': 25, 'calibration_iterations': 25, 'c
    onfigs_path': './configs', 'models_path': '../edgeai-modelzoo/models', 'modelartifacts_path': '../edgeai-modelzoo/modelartifacts/AM69A', 'mo
    delpackage_path': './work_dirs/modelpackage/AM69A', 'datasets_path': './dependencies/datasets', 'target_device': 'AM69A', 'target_machine': 
    'evm', 'run_suffix': None, 'parallel_devices': None, 'parallel_processes': None, 'tensor_bits': 8, 'runtime_options': {'advanced_options:qua
    ntization_scale_type': 4}, 'run_import': False, 'run_inference': True, 'run_missing': True, 'detection_threshold': 0.3, 'detection_top_k': 2
    00, 'detection_nms_threshold': None, 'detection_keep_top_k': None, 'save_output': False, 'num_output_frames': 50, 'model_selection': 'od-822
    0', 'model_shortlist': None, 'model_exclusion': None, 'task_selection': None, 'runtime_selection': None, 'session_type_dict': {'onnx': 'onnx
    rt', 'tflite': 'tflitert', 'mxnet': 'tvmdlr'}, 'dataset_type_dict': {'imagenet': 'imagenetv2c'}, 'dataset_selection': 'coco', 'dataset_loadi
    ng': False, 'config_range': None, 'enable_logging': True, 'verbose': False, 'capture_log': False, 'additional_models': False, 'experimental_
    models': False, 'rewrite_results': False, 'with_udp': True, 'flip_test': False, 'model_transformation_dict': None, 'report_perfsim': False, 
    'tidl_offload': True, 'input_optimization': None, 'run_dir_tree_depth': None, 'target_device_preset': True, 'fast_calibration_factor': 0.5, 
    'param_template_file': None, 'settings_file': 'settings_infer_on_evm.yaml', 'models_list_file': './work_dirs/modelartifacts/benchmarks_model
    s_list.txt', 'basic_keys': ['include_files', 'pipeline_type', 'num_frames', 'calibration_frames', 'calibration_iterations', 'configs_path', 
    'models_path', 'modelartifacts_path', 'modelpackage_path', 'datasets_path', 'target_device', 'target_machine', 'run_suffix', 'parallel_devic
    es', 'parallel_processes', 'tensor_bits', 'runtime_options', 'run_import', 'run_inference', 'run_missing', 'detection_threshold', 'detection
    _top_k', 'detection_nms_threshold', 'detection_keep_top_k', 'save_output', 'num_output_frames', 'model_selection', 'model_shortlist', 'model
    _exclusion', 'task_selection', 'runtime_selection', 'session_type_dict', 'dataset_type_dict', 'dataset_selection', 'dataset_loading', 'confi
    g_range', 'enable_logging', 'verbose', 'capture_log', 'additional_models', 'experimental_models', 'rewrite_results', 'with_udp', 'flip_test'
    , 'model_transformation_dict', 'report_perfsim', 'tidl_offload', 'input_optimization', 'run_dir_tree_depth', 'target_device_preset', 'fast_c
    alibration_factor', 'param_template_file', 'settings_file', 'models_list_file'], 'dataset_cache': None}
    work_dir: ../edgeai-modelzoo/modelartifacts/AM69A/8bits
    Using model configs from Python module: ./configs
    1
    -------------------------------------------------------------------
    running MODEL_ID:od-8220
    argv: ['./scripts/benchmark_modelzoo.py', 'settings_infer_on_evm.yaml', '--target_device', 'AM69A', '--run_import', 'False', '--model_select
    ion', 'od-8220']
    settings: {'include_files': None, 'pipeline_type': 'accuracy', 'num_frames': 100, 'calibration_frames': 25, 'calibration_iterations': 25, 'c
    onfigs_path': './configs', 'models_path': '../edgeai-modelzoo/models', 'modelartifacts_path': '../edgeai-modelzoo/modelartifacts/AM69A', 'mo
    delpackage_path': './work_dirs/modelpackage/AM69A', 'datasets_path': './dependencies/datasets', 'target_device': 'AM69A', 'target_machine': 
    'evm', 'run_suffix': None, 'parallel_devices': None, 'parallel_processes': None, 'tensor_bits': 8, 'runtime_options': {'advanced_options:qua
    ntization_scale_type': 4}, 'run_import': False, 'run_inference': True, 'run_missing': True, 'detection_threshold': 0.3, 'detection_top_k': 2
    00, 'detection_nms_threshold': None, 'detection_keep_top_k': None, 'save_output': False, 'num_output_frames': 50, 'model_selection': ['od-82
    20'], 'model_shortlist': None, 'model_exclusion': None, 'task_selection': None, 'runtime_selection': None, 'session_type_dict': {'onnx': 'on
    nxrt', 'tflite': 'tflitert', 'mxnet': 'tvmdlr'}, 'dataset_type_dict': {'imagenet': 'imagenetv2c'}, 'dataset_selection': 'coco', 'dataset_loa
    ding': True, 'config_range': None, 'enable_logging': True, 'verbose': False, 'capture_log': False, 'additional_models': False, 'experimental
    _models': False, 'rewrite_results': False, 'with_udp': True, 'flip_test': False, 'model_transformation_dict': None, 'report_perfsim': False,
     'tidl_offload': True, 'input_optimization': None, 'run_dir_tree_depth': None, 'target_device_preset': True, 'fast_calibration_factor': 0.5,
     'param_template_file': None, 'settings_file': 'settings_infer_on_evm.yaml', 'basic_keys': ['include_files', 'pipeline_type', 'num_frames', 
    'calibration_frames', 'calibration_iterations', 'configs_path', 'models_path', 'modelartifacts_path', 'modelpackage_path', 'datasets_path', 
    'target_device', 'target_machine', 'run_suffix', 'parallel_devices', 'parallel_processes', 'tensor_bits', 'runtime_options', 'run_import', '
    run_inference', 'run_missing', 'detection_threshold', 'detection_top_k', 'detection_nms_threshold', 'detection_keep_top_k', 'save_output', '
    num_output_frames', 'model_selection', 'model_shortlist', 'model_exclusion', 'task_selection', 'runtime_selection', 'session_type_dict', 'da
    taset_type_dict', 'dataset_selection', 'dataset_loading', 'config_range', 'enable_logging', 'verbose', 'capture_log', 'additional_models', '
    experimental_models', 'rewrite_results', 'with_udp', 'flip_test', 'model_transformation_dict', 'report_perfsim', 'tidl_offload', 'input_opti
    mization', 'run_dir_tree_depth', 'target_device_preset', 'fast_calibration_factor', 'param_template_file', 'settings_file'], 'dataset_cache'
    : None}
    work_dir: ../edgeai-modelzoo/modelartifacts/AM69A/8bits
    Using model configs from Python module: ./configs
    
    INFO:20241009-154731: loading dataset - category:coco variant:coco
    
    INFO:20241009-154731: dataset exists - will reuse - ./dependencies/datasets/coco
    loading annotations into memory...
    Done (t=1.81s)
    creating index...
    index created!
    loading annotations into memory...
    Done (t=1.42s)
    creating index...
    index created!
    configs to run: ['od-8220_onnxrt_coco_edgeai-mmdet_yolox_s_lite_640x640_20220221_model_onnx']
    number of configs: 1
    
    INFO:20241009-154808: starting - od-8220_onnxrt_coco_edgeai-mmdet_yolox_s_lite_640x640_20220221_model_onnx
    INFO:20241009-154808: model_path - /mnt/edgeai-modelzoo/models/vision/detection/coco/edgeai-mmdet/yolox_s_lite_640x640_20220221_model.onnx
    INFO:20241009-154808: model_file - /mnt/edgeai-modelzoo/modelartifacts/AM69A/8bits/od-8220_onnxrt_coco_edgeai-mmdet_yolox_s_lite_640x640_202
    20221_model_onnx/model/yolox_s_lite_640x640_20220221_model.onnx
    INFO:20241009-154808: quant_file - /mnt/edgeai-modelzoo/modelartifacts/AM69A/8bits/od-8220_onnxrt_coco_edgeai-mmdet_yolox_s_lite_640x640_202
    20221_model_onnx/model/yolox_s_lite_640x640_20220221_model_qparams.prototxt
    
    INFO:20241009-154808: running - od-8220_onnxrt_coco_edgeai-mmdet_yolox_s_lite_640x640_20220221_model_onnx
    INFO:20241009-154808: pipeline_config - {'task_type': 'detection', 'dataset_category': 'coco', 'calibration_dataset': <edgeai_benchmark.data
    sets.coco_det.COCODetection object at 0xffff6c2b4320>, 'input_dataset': <edgeai_benchmark.datasets.coco_det.COCODetection object at 0xffff6a
    99a630>, 'preprocess': <edgeai_benchmark.preprocess.PreProcessTransforms object at 0xffff6a9eb920>, 'session': <edgeai_benchmark.sessions.on
    nxrt_session.ONNXRTSession object at 0xffff6a9eb980>, 'postprocess': <edgeai_benchmark.postprocess.PostProcessTransforms object at 0xffff6a9
    ebad0>, 'metric': {'label_offset_pred': {0: 1, 1: 2, 2: 3, 3: 4, 4: 5, 5: 6, 6: 7, 7: 8, 8: 9, 9: 10, 10: 11, 11: 13, 12: 14, 13: 15, 14: 16
    , 15: 17, 16: 18, 17: 19, 18: 20, 19: 21, 20: 22, 21: 23, 22: 24, 23: 25, 24: 27, 25: 28, 26: 31, 27: 32, 28: 33, 29: 34, 30: 35, 31: 36, 32
    : 37, 33: 38, 34: 39, 35: 40, 36: 41, 37: 42, 38: 43, 39: 44, 40: 46, 41: 47, 42: 48, 43: 49, 44: 50, 45: 51, 46: 52, 47: 53, 48: 54, 49: 55
    , 50: 56, 51: 57, 52: 58, 53: 59, 54: 60, 55: 61, 56: 62, 57: 63, 58: 64, 59: 65, 60: 67, 61: 70, 62: 72, 63: 73, 64: 74, 65: 75, 66: 76, 67
    : 77, 68: 78, 69: 79, 70: 80, 71: 81, 72: 82, 73: 84, 74: 85, 75: 86, 76: 87, 77: 88, 78: 89, 79: 90, 80: 91}}, 'model_info': {'metric_refer
    ence': {'accuracy_ap[.5:.95]%': 38.3}, 'model_shortlist': 10, 'compact_name': 'yolox-s-lite-mmdet-coco-640x640', 'shortlisted': True, 'recom
    mended': True}}
    INFO:20241009-154809: infer  - od-8220_onnxrt_coco_edgeai-mmdet_yolox_s_lite_640x640_20220221_model_onnx - this may take some time...libtidl
    _onnxrt_EP loaded 0xbba1450 
    Final number of subgraphs created are : 1, - Offloaded Nodes - 283, Total Nodes - 283 
    APP: Init ... !!!
       314.627590 s: MEM: Init ... !!!
       314.627641 s: MEM: Initialized DMA HEAP (fd=6) !!!
       314.627783 s: MEM: Init ... Done !!!
       314.627803 s: IPC: Init ... !!!
       314.662636 s: IPC: Init ... Done !!!
    REMOTE_SERVICE: Init ... !!!
    REMOTE_SERVICE: Init ... Done !!!
       314.672399 s: GTC Frequency = 200 MHz
    APP: Init ... Done !!!
       314.674057 s:  VX_ZONE_INIT:Enabled
       314.674069 s:  VX_ZONE_ERROR:Enabled
       314.674076 s:  VX_ZONE_WARNING:Enabled
       314.676068 s:  VX_ZONE_INIT:[tivxPlatformCreateTargetId:124] Added target MPU-0 
       314.676188 s:  VX_ZONE_INIT:[tivxPlatformCreateTargetId:124] Added target MPU-1 
       314.676265 s:  VX_ZONE_INIT:[tivxPlatformCreateTargetId:124] Added target MPU-2 
       314.676360 s:  VX_ZONE_INIT:[tivxPlatformCreateTargetId:124] Added target MPU-3 
       314.676371 s:  VX_ZONE_INIT:[tivxInitLocal:136] Initialization Done !!!
       314.679040 s:  VX_ZONE_INIT:[tivxHostInitLocal:106] Initialization Done for HOST !!!
    TIDL_RT_OVX: ERROR: Config file size (375832 bytes) does not match size of sTIDL_IOBufDesc_t (378392 bytes)
       314.683529 s:  VX_ZONE_ERROR:[tivxAddKernelTIDL:269] invalid values[  305.537804] kauditd_printk_skb: 5 callbacks suppressed
     for num_input_tensors or num_output_tensors 
       314.695996 s: [  305.537812] audit: type=1701 audit(1728488890.831:28): auid=4294967295 uid=0 gid=0 ses=4294967295 pid=1523 comm="python3
    " exe="/usr/bin/python3.12" sig=11 res=1
     VX_ZONE_ERROR:[vxQueryKernel:159] Invalid kernel reference
       314.696034 s:  VX_ZONE_ERROR:[vxMapUserDataObject:389] Invalid user data object reference
       314.696046 s:  VX_ZONE_ERROR:[vxUn[  305.583923] audit: type=1334 audit(1728488890.879:29): prog-id=23 op=LOAD
    mapUserDataObject:474] Invalid user data object reference
       31[  305.590952] audit: type=1334 audit(1728488890.887:30): prog-id=24 op=LOAD
    4.696083 s:  VX_ZONE_ERROR:[vxCreateNodeByStructure:91] failed t[  305.603270] audit: type=1334 audit(1728488890.899:31): prog-id=25 op=LOAD
    o retrieve kernel enum 0
       314.696098 s:  VX_ZONE_ERROR:[vxSetReferenceName:970] Invalid reference
       314.696107 s:  VX_ZONE_ERROR:[vxSetReferenceName:970] Invalid reference
       314.696114 s:  VX_ZONE_ERROR:[vxSetReferenceName:970] Invalid reference
    infer : od-8220_onnxrt_coco_edgeai-mmdet_yolox_s_lite_640x64|          |     0% 0/100| [< ]./run_benchmarks_evm.sh: line 146:  1523 Segmenta
    tion fault      (core dumped) python3 ${PYARGS2} --model_selection $MODEL_ID
    -------------------------------------------------------------------
    [  609.594296] audit: type=1334 audit(1728489194.892:32): prog-id=23 op=UNLOAD
    settings: {'include_files': None, 'pipeline_type': 'accuracy', 'num_frames': 100, 'calibration_frames': 25, 'calibration_iterations': 25, 'c
    onfigs_path': './configs', 'models_path': '../edgeai-modelzoo/models', 'modelartifacts_path': '../edgeai-modelzoo/modelartifacts/', 'modelpa
    ckage_path': './work_dirs/modelpackage/', 'datasets_path': './dependencies/datasets', 'target_device': None, 'target_machine': 'evm', 'run_s
    uffix': None, 'parallel_devices': None, 'parallel_processes': None, 'tensor_bits': 8, 'runtime_options': None, 'run_import': False, 'run_inf
    erence': True, 'run_missing': True, 'detection_threshold': 0.3, 'detection_top_k': 200, 'detection_nms_threshold': None, 'detection_keep_top
    _k': None, 'save_output': False, 'num_output_frames': 50, 'model_selection': 'od-8220', 'model_shortlist': None, 'model_exclusion': None, 't
    ask_selection': None, 'runtime_selection': None, 'session_type_dict': {'onnx': 'onnxrt', 'tflite': 'tflitert', 'mxnet': 'tvmdlr'}, 'dataset_
    type_dict': {'imagenet': 'imagenetv2c'}, 'dataset_selection': 'coco', 'dataset_loading': True, 'config_range': None, 'enable_logging': True,
     'verbose': False, 'capture_log': False, 'additional_models': False, 'experimental_models': False, 'rewrite_results': False, 'with_udp': Tru
    e, 'flip_test': False, 'model_transformation_dict': None, 'report_perfsim': False, 'tidl_offload': True, 'input_optimization': None, 'run_di
    r_tree_depth': None, 'target_device_preset': True, 'fast_calibration_factor': None, 'param_template_file': None, 'skip_pattern': '_package',
     'settings_file': 'settings_infer_on_evm.yaml', 'basic_keys': ['include_files', 'pipeline_type', 'num_frames', 'calibration_frames', 'calibr
    ation_iterations', 'configs_path', 'models_path', 'modelartifacts_path', 'modelpackage_path', 'datasets_path', 'target_device', 'target_mach
    ine', 'run_suffix', 'parallel_devices', 'parallel_processes', 'tensor_bits', 'runtime_options', 'run_import', 'run_inference', 'run_missing'
    , 'detection_threshold', 'detection_top_k', 'detection_nms_threshold', 'detection_keep_top_k', 'save_output', 'num_output_frames', 'model_se
    lection', 'model_shortlist', 'model_exclusion', 'task_selection', 'runtime_selection', 'session_type_dict', 'dataset_type_dict', 'dataset_se
    lection', 'dataset_loading', 'config_range', 'enable_logging', 'verbose', 'capture_log', 'additional_models', 'experimental_models', 'rewrit
    e_results', 'with_udp', 'flip_test', 'model_transformation_dict', 'report_perfsim', 'tidl_offload', 'input_optimization', 'run_dir_tree_dept
    h', 'target_device_preset', 'fast_calibration_factor', 'param_template_file', 'skip_pattern', 'settings_file'], 'dataset_cache': None}
    results found for 1 models
    Report generated at ../edgeai-modelzoo/modelartifacts/
    -------------------------------------------------------------------
    
    

    The Python environment was:

    root@am69-sk:/mnt/edgeai-benchmark# pip3 list
    Package           Version
    ----------------- ---------------
    aiofiles          23.2.1
    anyio             4.3.0
    cffi              1.16.0
    click             8.1.7
    colorama          0.4.6
    contourpy         1.3.0
    cycler            0.12.1
    Cython            3.0.11
    debugpy           1.8.6
    dlr               1.13.0
    fonttools         4.54.1
    gpiod             2.1.3
    h11               0.14.0
    idna              3.6
    iniconfig         2.0.0
    joblib            1.4.2
    json-tricks       3.17.3
    kiwisolver        1.4.7
    Mako              1.3.2
    MarkupSafe        2.1.5
    matplotlib        3.9.2
    meson             1.3.1
    munkres           1.1.4
    numpy             1.26.4
    onnxruntime-tidl  1.14.0+10000005
    packaging         23.2
    pillow            10.3.0
    pip               24.0
    pluggy            1.5.0
    ply               3.11
    plyfile           1.1
    psutil            5.9.8
    pybind11          2.11.1
    pycairo           1.26.0
    pycocotools       2.0.8
    pycparser         2.21
    pydantic          1.10.16
    Pygments          2.17.2
    PyGObject         3.46.0
    pyparsing         3.1.4
    pytest            8.3.3
    python-dateutil   2.9.0.post0
    python-multipart  0.0.5
    PyYAML            6.0.1
    scikit-learn      1.5.2
    scipy             1.14.1
    setuptools        69.1.1
    six               1.16.0
    sniffio           1.3.0
    starlette         0.37.2
    tflite-runtime    2.12.0
    threadpoolctl     3.5.0
    TI.GPIO           2.0.0
    tqdm              4.66.5
    typing_extensions 4.10.0
    uvicorn           0.30.1
    websocket-client  1.7.0
    websockets        12.0
    wheel             0.42.0
    wurlitzer         3.1.1
    yamlloader        1.4.1
    

    Everything else is the same as in the post at the beginning.

    Something that seems to be the start of the problem is the following line:

    TIDL_RT_OVX: ERROR: Config file size (375832 bytes) does not match size of sTIDL_IOBufDesc_t (378392 bytes)

    After that the VX_ZONE_ERROR errors happen and things go south.

    The target is stuck at iteration zero, and a segmentation fault occurs after about 2 minutes.

    What is the root cause of the VX_ZONE_ERROR?

    Regards,

    --Gunter

  • Hi Gunter,

    I am still working on getting this set up on my end due to a few things that delayed my progress in the office. Have you tried this with git branch r10.0?

    Thank you,

    Fabiana

  • Hi Fabiana,

    yes, I have tested this with branch r10.0 in the second run with the above results. Sorry, I should have mentioned that.

    Regards,

    --Gunter

  • Hi Gunter,

    I don't have the AM69A EVM/StarterKit with me right now, so I tested on AM68A instead using the precompiled model. It seems to be working on AM68A EVM. 

    1. Copied the modelartifacts link od-8220_onnxrt_coco_edgeai-mmdet_yolox_s_lite_640x640_20220221_model_onnx.tar.gz.link

    from edgeai-modelzoo/modelartifacts/AM68A/8bits/

    and placed it under edgeai-benchmark/work_dirs/modelartifacts/AM68A/8bits/

    These are the modifications that I made in edgeai-benchmark/settings_base.yaml:

    2. select only the model of interest instead of all the models:

    model_selection : od-8220

    3. I did the following for a quick test - just run 100 frames inference instead of all 5000 frames:

    num_frames: 100

    4. SSHed into the AM68A EVM, mounted edgeai-benchmark from my PC, and ran the script

    5. Here is the log from the EVM/StarterKit:

    root@am68a-sk:/mnt/edgeai-benchmark# ./run_benchmarks_evm.sh AM68A
    TARGET_SOC: AM68A
    TARGET_MACHINE: evm
    DEBUG MODE: false @ am68a-sk:5678
    Entering: ./work_dirs/modelartifacts/AM68A/8bits/ss-5710_tvmdlr_cocoseg21_edgeai-tv_deeplabv3plus_mobilenetv2_edgeailite_512x512_20210405_onnx.tar.gz.link
    run_set_target_machine.sh: line 94: cd: ./work_dirs/modelartifacts/AM68A/8bits/ss-5710_tvmdlr_cocoseg21_edgeai-tv_deeplabv3plus_mobilenetv2_edgeailite_512x512_20210405_onnx.tar.gz.link/artifacts: Not a directory
    Entering: ./work_dirs/modelartifacts/AM68A/8bits/cl-3090_tvmdlr_imagenet1k_torchvision_mobilenet_v2_tv_onnx.tar.gz.link
    run_set_target_machine.sh: line 94: cd: ./work_dirs/modelartifacts/AM68A/8bits/cl-3090_tvmdlr_imagenet1k_torchvision_mobilenet_v2_tv_onnx.tar.gz.link/artifacts: Not a directory
    Entering: ./work_dirs/modelartifacts/AM68A/8bits/od-5120_tvmdlr_coco_tf1-models_ssdlite_mobiledet_dsp_320x320_coco_20200519_tflite.tar.gz.link
    run_set_target_machine.sh: line 94: cd: ./work_dirs/modelartifacts/AM68A/8bits/od-5120_tvmdlr_coco_tf1-models_ssdlite_mobiledet_dsp_320x320_coco_20200519_tflite.tar.gz.link/artifacts: Not a directory
    TIDL_TOOLS_PATH=/mnt/edgeai-benchmark/tools/AM68A/tidl_tools
    LD_LIBRARY_PATH=/mnt/edgeai-benchmark/tools/AM68A/tidl_tools
    PYTHONPATH=:/usr/lib/python3.12/site-packages/
    ===================================================================
    argv: ['./scripts/generate_models_list.py', 'settings_infer_on_evm.yaml', '--target_device', 'AM68A', '--models_list_file', './work_dirs/modelartifacts/benchmarks_models_list.txt', '--dataset_loading', 'False']
    settings: {'include_files': None, 'pipeline_type': 'accuracy', 'num_frames': 100, 'calibration_frames': 25, 'calibration_iterations': 25, 'configs_path': './configs', 'models_path': '../edgeai-modelzoo/models', 'modelartifacts_path': './work_dirs/modelartifacts/AM68A', 'modelpackage_path': './work_dirs/modelpackage/AM68A', 'datasets_path': './dependencies/datasets', 'target_device': 'AM68A', 'target_machine': 'evm', 'run_suffix': None, 'parallel_devices': None, 'parallel_processes': None, 'tensor_bits': 8, 'runtime_options': {'advanced_options:quantization_scale_type': 4}, 'run_import': False, 'run_inference': True, 'run_missing': True, 'detection_threshold': 0.3, 'detection_top_k': 200, 'detection_nms_threshold': None, 'detection_keep_top_k': None, 'save_output': False, 'num_output_frames': 50, 'model_selection': 'od-8220', 'model_shortlist': None, 'model_exclusion': None, 'task_selection': None, 'runtime_selection': None, 'session_type_dict': {'onnx': 'onnxrt', 'tflite': 'tflitert', 'mxnet': 'tvmdlr'}, 'dataset_type_dict': None, 'dataset_selection': None, 'dataset_loading': False, 'config_range': None, 'enable_logging': True, 'verbose': False, 'capture_log': False, 'additional_models': False, 'experimental_models': False, 'rewrite_results': False, 'with_udp': True, 'flip_test': False, 'model_transformation_dict': None, 'report_perfsim': False, 'tidl_offload': True, 'input_optimization': None, 'run_dir_tree_depth': None, 'target_device_preset': True, 'fast_calibration_factor': 0.5, 'param_template_file': None, 'settings_file': 'settings_infer_on_evm.yaml', 'models_list_file': './work_dirs/modelartifacts/benchmarks_models_list.txt', 'basic_keys': ['include_files', 'pipeline_type', 'num_frames', 'calibration_frames', 'calibration_iterations', 'configs_path', 'models_path', 'modelartifacts_path', 'modelpackage_path', 'datasets_path', 'target_device', 'target_machine', 'run_suffix', 'parallel_devices', 'parallel_processes', 'tensor_bits', 'runtime_options', 
'run_import', 'run_inference', 'run_missing', 'detection_threshold', 'detection_top_k', 'detection_nms_threshold', 'detection_keep_top_k', 'save_output', 'num_output_frames', 'model_selection', 'model_shortlist', 'model_exclusion', 'task_selection', 'runtime_selection', 'session_type_dict', 'dataset_type_dict', 'dataset_selection', 'dataset_loading', 'config_range', 'enable_logging', 'verbose', 'capture_log', 'additional_models', 'experimental_models', 'rewrite_results', 'with_udp', 'flip_test', 'model_transformation_dict', 'report_perfsim', 'tidl_offload', 'input_optimization', 'run_dir_tree_depth', 'target_device_preset', 'fast_calibration_factor', 'param_template_file', 'settings_file', 'models_list_file'], 'dataset_cache': None}
    work_dir: ./work_dirs/modelartifacts/AM68A/8bits
    Using model configs from Python module: ./configs
    1
    -------------------------------------------------------------------
    running MODEL_ID:od-8220
    argv: ['./scripts/benchmark_modelzoo.py', 'settings_infer_on_evm.yaml', '--target_device', 'AM68A', '--run_import', 'False', '--model_selection', 'od-8220']
    settings: {'include_files': None, 'pipeline_type': 'accuracy', 'num_frames': 100, 'calibration_frames': 25, 'calibration_iterations': 25, 'configs_path': './configs', 'models_path': '../edgeai-modelzoo/models', 'modelartifacts_path': './work_dirs/modelartifacts/AM68A', 'modelpackage_path': './work_dirs/modelpackage/AM68A', 'datasets_path': './dependencies/datasets', 'target_device': 'AM68A', 'target_machine': 'evm', 'run_suffix': None, 'parallel_devices': None, 'parallel_processes': None, 'tensor_bits': 8, 'runtime_options': {'advanced_options:quantization_scale_type': 4}, 'run_import': False, 'run_inference': True, 'run_missing': True, 'detection_threshold': 0.3, 'detection_top_k': 200, 'detection_nms_threshold': None, 'detection_keep_top_k': None, 'save_output': False, 'num_output_frames': 50, 'model_selection': ['od-8220'], 'model_shortlist': None, 'model_exclusion': None, 'task_selection': None, 'runtime_selection': None, 'session_type_dict': {'onnx': 'onnxrt', 'tflite': 'tflitert', 'mxnet': 'tvmdlr'}, 'dataset_type_dict': None, 'dataset_selection': None, 'dataset_loading': True, 'config_range': None, 'enable_logging': True, 'verbose': False, 'capture_log': False, 'additional_models': False, 'experimental_models': False, 'rewrite_results': False, 'with_udp': True, 'flip_test': False, 'model_transformation_dict': None, 'report_perfsim': False, 'tidl_offload': True, 'input_optimization': None, 'run_dir_tree_depth': None, 'target_device_preset': True, 'fast_calibration_factor': 0.5, 'param_template_file': None, 'settings_file': 'settings_infer_on_evm.yaml', 'basic_keys': ['include_files', 'pipeline_type', 'num_frames', 'calibration_frames', 'calibration_iterations', 'configs_path', 'models_path', 'modelartifacts_path', 'modelpackage_path', 'datasets_path', 'target_device', 'target_machine', 'run_suffix', 'parallel_devices', 'parallel_processes', 'tensor_bits', 'runtime_options', 'run_import', 'run_inference', 'run_missing', 'detection_threshold', 
'detection_top_k', 'detection_nms_threshold', 'detection_keep_top_k', 'save_output', 'num_output_frames', 'model_selection', 'model_shortlist', 'model_exclusion', 'task_selection', 'runtime_selection', 'session_type_dict', 'dataset_type_dict', 'dataset_selection', 'dataset_loading', 'config_range', 'enable_logging', 'verbose', 'capture_log', 'additional_models', 'experimental_models', 'rewrite_results', 'with_udp', 'flip_test', 'model_transformation_dict', 'report_perfsim', 'tidl_offload', 'input_optimization', 'run_dir_tree_depth', 'target_device_preset', 'fast_calibration_factor', 'param_template_file', 'settings_file'], 'dataset_cache': None}
    work_dir: ./work_dirs/modelartifacts/AM68A/8bits
    Using model configs from Python module: ./configs

    INFO:20241011-103202: loading dataset - category:coco variant:coco

    INFO:20241011-103202: dataset exists - will reuse - ./dependencies/datasets/coco
    loading annotations into memory...
    Done (t=1.48s)
    creating index...
    index created!
    loading annotations into memory...
    Done (t=1.53s)
    creating index...
    index created!
    configs to run: ['od-8220_onnxrt_coco_edgeai-mmdet_yolox_s_lite_640x640_20220221_model_onnx']
    number of configs: 1

    INFO:20241011-103239: starting - od-8220_onnxrt_coco_edgeai-mmdet_yolox_s_lite_640x640_20220221_model_onnx
    Downloading software-dl.ti.com/.../od-8220_onnxrt_coco_edgeai-mmdet_yolox_s_lite_640x640_20220221_model_onnx.tar.gz to /mnt/edgeai-benchmark/work_dirs/modelartifacts/AM68A/8bits/od-8220_onnxrt_coco_edgeai-mmdet_yolox_s_lite_640x640_20220221_model_onnx.tar.gz
    41328640it [00:10, 3894883.00it/s]
    Extracting /mnt/edgeai-benchmark/work_dirs/modelartifacts/AM68A/8bits/od-8220_onnxrt_coco_edgeai-mmdet_yolox_s_lite_640x640_20220221_model_onnx.tar.gz to /mnt/edgeai-benchmark/work_dirs/modelartifacts/AM68A/8bits/od-8220_onnxrt_coco_edgeai-mmdet_yolox_s_lite_640x640_20220221_model_onnx
    INFO:20241011-103252: model_path - /mnt/edgeai-modelzoo/models/vision/detection/coco/edgeai-mmdet/yolox_s_lite_640x640_20220221_model.onnx
    INFO:20241011-103252: model_file - /mnt/edgeai-benchmark/work_dirs/modelartifacts/AM68A/8bits/od-8220_onnxrt_coco_edgeai-mmdet_yolox_s_lite_640x640_20220221_model_onnx/model/yolox_s_lite_640x640_20220221_model.onnx
    INFO:20241011-103252: quant_file - /mnt/edgeai-benchmark/work_dirs/modelartifacts/AM68A/8bits/od-8220_onnxrt_coco_edgeai-mmdet_yolox_s_lite_640x640_20220221_model_onnx/model/yolox_s_lite_640x640_20220221_model_qparams.prototxt

    INFO:20241011-103252: running - od-8220_onnxrt_coco_edgeai-mmdet_yolox_s_lite_640x640_20220221_model_onnx
    INFO:20241011-103252: pipeline_config - {'task_type': 'detection', 'dataset_category': 'coco', 'calibration_dataset': <edgeai_benchmark.datasets.coco_det.COCODetection object at 0xffff7e698c80>, 'input_dataset': <edgeai_benchmark.datasets.coco_det.COCODetection object at 0xffff7e69bbc0>, 'preprocess': <edgeai_benchmark.preprocess.PreProcessTransforms object at 0xffff7e653e90>, 'session': <edgeai_benchmark.sessions.onnxrt_session.ONNXRTSession object at 0xffff7e653ef0>, 'postprocess': <edgeai_benchmark.postprocess.PostProcessTransforms object at 0xffff7e668080>, 'metric': {'label_offset_pred': {0: 1, 1: 2, 2: 3, 3: 4, 4: 5, 5: 6, 6: 7, 7: 8, 8: 9, 9: 10, 10: 11, 11: 13, 12: 14, 13: 15, 14: 16, 15: 17, 16: 18, 17: 19, 18: 20, 19: 21, 20: 22, 21: 23, 22: 24, 23: 25, 24: 27, 25: 28, 26: 31, 27: 32, 28: 33, 29: 34, 30: 35, 31: 36, 32: 37, 33: 38, 34: 39, 35: 40, 36: 41, 37: 42, 38: 43, 39: 44, 40: 46, 41: 47, 42: 48, 43: 49, 44: 50, 45: 51, 46: 52, 47: 53, 48: 54, 49: 55, 50: 56, 51: 57, 52: 58, 53: 59, 54: 60, 55: 61, 56: 62, 57: 63, 58: 64, 59: 65, 60: 67, 61: 70, 62: 72, 63: 73, 64: 74, 65: 75, 66: 76, 67: 77, 68: 78, 69: 79, 70: 80, 71: 81, 72: 82, 73: 84, 74: 85, 75: 86, 76: 87, 77: 88, 78: 89, 79: 90, 80: 91}}, 'model_info': {'metric_reference': {'accuracy_ap[.5:.95]%': 38.3}, 'model_shortlist': 10, 'compact_name': 'yolox-s-lite-mmdet-coco-640x640', 'shortlisted': True, 'recommended': True}}
    INFO:20241011-103252: infer - od-8220_onnxrt_coco_edgeai-mmdet_yolox_s_lite_640x640_20220221_model_onnx - this may take some time...libtidl_onnxrt_EP loaded 0x38904e00
    Final number of subgraphs created are : 1, - Offloaded Nodes - 283, Total Nodes - 283
    APP: Init ... !!!
    2889.468819 s: MEM: Init ... !!!
    2889.468876 s: MEM: Initialized DMA HEAP (fd=6) !!!
    2889.469027 s: MEM: Init ... Done !!!
    2889.469054 s: IPC: Init ... !!!
    2889.514377 s: IPC: Init ... Done !!!
    REMOTE_SERVICE: Init ... !!!
    REMOTE_SERVICE: Init ... Done !!!
    2889.518294 s: GTC Frequency = 200 MHz
    APP: Init ... Done !!!
    2889.518416 s: VX_ZONE_INIT:Enabled
    2889.518431 s: VX_ZONE_ERROR:Enabled
    2889.518437 s: VX_ZONE_WARNING:Enabled
    2889.519250 s: VX_ZONE_INIT:[tivxPlatformCreateTargetId:124] Added target MPU-0
    2889.519440 s: VX_ZONE_INIT:[tivxPlatformCreateTargetId:124] Added target MPU-1
    2889.519603 s: VX_ZONE_INIT:[tivxPlatformCreateTargetId:124] Added target MPU-2
    2889.519715 s: VX_ZONE_INIT:[tivxPlatformCreateTargetId:124] Added target MPU-3
    2889.519729 s: VX_ZONE_INIT:[tivxInitLocal:136] Initialization Done !!!
    2889.522375 s: VX_ZONE_INIT:[tivxHostInitLocal:106] Initialization Done for HOST !!!
    infer : od-8220_onnxrt_coco_edgeai-mmdet_yolox_s_lite_640x64| 100%|##########|| 100/100 [00:02<00:00, 35.18it/s]
    2892.468131 s: VX_ZONE_INIT:[tivxHostDeInitLocal:120] De-Initialization Done for HOST !!!
    2892.472684 s: VX_ZONE_INIT:[tivxDeInitLocal:206] De-Initialization Done !!!
    APP: Deinit ... !!!
    REMOTE_SERVICE: Deinit ... !!!
    REMOTE_SERVICE: Deinit ... Done !!!
    2892.473414 s: IPC: Deinit ... !!!
    2892.475236 s: IPC: DeInit ... Done !!!
    2892.475281 s: MEM: Deinit ... !!!
    2892.475299 s: DDR_SHARED_MEM: Alloc's: 8 alloc's of 12939400 bytes
    2892.475308 s: DDR_SHARED_MEM: Free's : 8 free's of 12939400 bytes
    2892.475317 s: DDR_SHARED_MEM: Open's : 0 allocs of 0 bytes
    2892.475333 s: MEM: Deinit ... Done !!!
    APP: Deinit ... Done !!!

    INFO:20241011-103257: infer completed - od-8220_onnxrt_coco_edgeai-mmdet_yolox_s_lite_640x640_20220221_model_onnx - 6 secLoading and preparing results...
    DONE (t=0.01s)
    creating index...
    index created!
    Running per image evaluation...
    Evaluate annotation type *bbox*
    DONE (t=0.87s).
    Accumulating evaluation results...
    DONE (t=1.27s).
    Average Precision (AP) @[ IoU=0.50:0.95 | area= all | maxDets=100 ] = 0.400
    Average Precision (AP) @[ IoU=0.50 | area= all | maxDets=100 ] = 0.546
    Average Precision (AP) @[ IoU=0.75 | area= all | maxDets=100 ] = 0.431
    Average Precision (AP) @[ IoU=0.50:0.95 | area= small | maxDets=100 ] = 0.179
    Average Precision (AP) @[ IoU=0.50:0.95 | area=medium | maxDets=100 ] = 0.481
    Average Precision (AP) @[ IoU=0.50:0.95 | area= large | maxDets=100 ] = 0.520
    Average Recall (AR) @[ IoU=0.50:0.95 | area= all | maxDets= 1 ] = 0.335
    Average Recall (AR) @[ IoU=0.50:0.95 | area= all | maxDets= 10 ] = 0.439
    Average Recall (AR) @[ IoU=0.50:0.95 | area= all | maxDets=100 ] = 0.444
    Average Recall (AR) @[ IoU=0.50:0.95 | area= small | maxDets=100 ] = 0.194
    Average Recall (AR) @[ IoU=0.50:0.95 | area=medium | maxDets=100 ] = 0.503
    Average Recall (AR) @[ IoU=0.50:0.95 | area= large | maxDets=100 ] = 0.560


    SUCCESS:20241011-103300: benchmark results - {'infer_path': 'od-8220_onnxrt_coco_edgeai-mmdet_yolox_s_lite_640x640_20220221_model_onnx', 'accuracy_ap[.5:.95]%': 40.03901, 'accuracy_ap50%': 54.616241, 'num_subgraphs': 0, 'infer_time_core_ms': 10.721231, 'infer_time_subgraph_ms': 0.0, 'ddr_transfer_mb': 38.717056, 'perfsim_time_ms': 0.0, 'perfsim_ddr_transfer_mb': 0.0, 'perfsim_gmacs': 0.0}
    -------------------------------------------------------------------
    settings: {'include_files': None, 'pipeline_type': 'accuracy', 'num_frames': 100, 'calibration_frames': 25, 'calibration_iterations': 25, 'configs_path': './configs', 'models_path': '../edgeai-modelzoo/models', 'modelartifacts_path': './work_dirs/modelartifacts/', 'modelpackage_path': './work_dirs/modelpackage/', 'datasets_path': './dependencies/datasets', 'target_device': None, 'target_machine': 'evm', 'run_suffix': None, 'parallel_devices': None, 'parallel_processes': None, 'tensor_bits': 8, 'runtime_options': None, 'run_import': False, 'run_inference': True, 'run_missing': True, 'detection_threshold': 0.3, 'detection_top_k': 200, 'detection_nms_threshold': None, 'detection_keep_top_k': None, 'save_output': False, 'num_output_frames': 50, 'model_selection': 'od-8220', 'model_shortlist': None, 'model_exclusion': None, 'task_selection': None, 'runtime_selection': None, 'session_type_dict': {'onnx': 'onnxrt', 'tflite': 'tflitert', 'mxnet': 'tvmdlr'}, 'dataset_type_dict': None, 'dataset_selection': None, 'dataset_loading': True, 'config_range': None, 'enable_logging': True, 'verbose': False, 'capture_log': False, 'additional_models': False, 'experimental_models': False, 'rewrite_results': False, 'with_udp': True, 'flip_test': False, 'model_transformation_dict': None, 'report_perfsim': False, 'tidl_offload': True, 'input_optimization': None, 'run_dir_tree_depth': None, 'target_device_preset': True, 'fast_calibration_factor': None, 'param_template_file': None, 'skip_pattern': '_package', 'settings_file': 'settings_infer_on_evm.yaml', 'basic_keys': ['include_files', 'pipeline_type', 'num_frames', 'calibration_frames', 'calibration_iterations', 'configs_path', 'models_path', 'modelartifacts_path', 'modelpackage_path', 'datasets_path', 'target_device', 'target_machine', 'run_suffix', 'parallel_devices', 'parallel_processes', 'tensor_bits', 'runtime_options', 'run_import', 'run_inference', 'run_missing', 'detection_threshold', 'detection_top_k', 
'detection_nms_threshold', 'detection_keep_top_k', 'save_output', 'num_output_frames', 'model_selection', 'model_shortlist', 'model_exclusion', 'task_selection', 'runtime_selection', 'session_type_dict', 'dataset_type_dict', 'dataset_selection', 'dataset_loading', 'config_range', 'enable_logging', 'verbose', 'capture_log', 'additional_models', 'experimental_models', 'rewrite_results', 'with_udp', 'flip_test', 'model_transformation_dict', 'report_perfsim', 'tidl_offload', 'input_optimization', 'run_dir_tree_depth', 'target_device_preset', 'fast_calibration_factor', 'param_template_file', 'skip_pattern', 'settings_file'], 'dataset_cache': None}
    results found for 1 models
    Report generated at ./work_dirs/modelartifacts/

  • Hi Gunter,

    I don't have the AM69A EVM/StarterKit with me right now, so I tested on AM68A instead using the precompiled model. It seems to be working on AM68A EVM. 

    1. Copied the modelartifacts link od-8220_onnxrt_coco_edgeai-mmdet_yolox_s_lite_640x640_20220221_model_onnx.tar.gz.link

    from edgeai-modelzoo/modelartifacts/AM68A/8bits/

    and placed it under edgeai-benchmark/work_dirs/modelartifacts/AM68A/8bits/

    These are the modifications that I made in edgeai-benchmark/settings_base.yaml:

    2. select only the model of interest instead of all the models:

    model_selection : od-8220

    3. I did the following for a quick test - just run 100 frames inference instead of all 5000 frames:

    num_frames: 100

    4. SSHed into the AM68A EVM, mounted edgeai-benchmark from my PC, and ran the script

    5. Here is the log from the EVM/StarterKit:

    root@am68a-sk:/mnt/edgeai-benchmark# ./run_benchmarks_evm.sh AM68A
    TARGET_SOC: AM68A
    TARGET_MACHINE: evm
    DEBUG MODE: false @ am68a-sk:5678
    Entering: ./work_dirs/modelartifacts/AM68A/8bits/ss-5710_tvmdlr_cocoseg21_edgeai-tv_deeplabv3plus_mobilenetv2_edgeailite_512x512_20210405_onnx.tar.gz.link
    run_set_target_machine.sh: line 94: cd: ./work_dirs/modelartifacts/AM68A/8bits/ss-5710_tvmdlr_cocoseg21_edgeai-tv_deeplabv3plus_mobilenetv2_edgeailite_512x512_20210405_onnx.tar.gz.link/artifacts: Not a directory
    Entering: ./work_dirs/modelartifacts/AM68A/8bits/cl-3090_tvmdlr_imagenet1k_torchvision_mobilenet_v2_tv_onnx.tar.gz.link
    run_set_target_machine.sh: line 94: cd: ./work_dirs/modelartifacts/AM68A/8bits/cl-3090_tvmdlr_imagenet1k_torchvision_mobilenet_v2_tv_onnx.tar.gz.link/artifacts: Not a directory
    Entering: ./work_dirs/modelartifacts/AM68A/8bits/od-5120_tvmdlr_coco_tf1-models_ssdlite_mobiledet_dsp_320x320_coco_20200519_tflite.tar.gz.link
    run_set_target_machine.sh: line 94: cd: ./work_dirs/modelartifacts/AM68A/8bits/od-5120_tvmdlr_coco_tf1-models_ssdlite_mobiledet_dsp_320x320_coco_20200519_tflite.tar.gz.link/artifacts: Not a directory
    TIDL_TOOLS_PATH=/mnt/edgeai-benchmark/tools/AM68A/tidl_tools
    LD_LIBRARY_PATH=/mnt/edgeai-benchmark/tools/AM68A/tidl_tools
    PYTHONPATH=:/usr/lib/python3.12/site-packages/
    ===================================================================
    argv: ['./scripts/generate_models_list.py', 'settings_infer_on_evm.yaml', '--target_device', 'AM68A', '--models_list_file', './work_dirs/modelartifacts/benchmarks_models_list.txt', '--dataset_loading', 'False']
    settings: {'include_files': None, 'pipeline_type': 'accuracy', 'num_frames': 100, 'calibration_frames': 25, 'calibration_iterations': 25, 'configs_path': './configs', 'models_path': '../edgeai-modelzoo/models', 'modelartifacts_path': './work_dirs/modelartifacts/AM68A', 'modelpackage_path': './work_dirs/modelpackage/AM68A', 'datasets_path': './dependencies/datasets', 'target_device': 'AM68A', 'target_machine': 'evm', 'run_suffix': None, 'parallel_devices': None, 'parallel_processes': None, 'tensor_bits': 8, 'runtime_options': {'advanced_options:quantization_scale_type': 4}, 'run_import': False, 'run_inference': True, 'run_missing': True, 'detection_threshold': 0.3, 'detection_top_k': 200, 'detection_nms_threshold': None, 'detection_keep_top_k': None, 'save_output': False, 'num_output_frames': 50, 'model_selection': 'od-8220', 'model_shortlist': None, 'model_exclusion': None, 'task_selection': None, 'runtime_selection': None, 'session_type_dict': {'onnx': 'onnxrt', 'tflite': 'tflitert', 'mxnet': 'tvmdlr'}, 'dataset_type_dict': None, 'dataset_selection': None, 'dataset_loading': False, 'config_range': None, 'enable_logging': True, 'verbose': False, 'capture_log': False, 'additional_models': False, 'experimental_models': False, 'rewrite_results': False, 'with_udp': True, 'flip_test': False, 'model_transformation_dict': None, 'report_perfsim': False, 'tidl_offload': True, 'input_optimization': None, 'run_dir_tree_depth': None, 'target_device_preset': True, 'fast_calibration_factor': 0.5, 'param_template_file': None, 'settings_file': 'settings_infer_on_evm.yaml', 'models_list_file': './work_dirs/modelartifacts/benchmarks_models_list.txt', 'basic_keys': ['include_files', 'pipeline_type', 'num_frames', 'calibration_frames', 'calibration_iterations', 'configs_path', 'models_path', 'modelartifacts_path', 'modelpackage_path', 'datasets_path', 'target_device', 'target_machine', 'run_suffix', 'parallel_devices', 'parallel_processes', 'tensor_bits', 'runtime_options', 
'run_import', 'run_inference', 'run_missing', 'detection_threshold', 'detection_top_k', 'detection_nms_threshold', 'detection_keep_top_k', 'save_output', 'num_output_frames', 'model_selection', 'model_shortlist', 'model_exclusion', 'task_selection', 'runtime_selection', 'session_type_dict', 'dataset_type_dict', 'dataset_selection', 'dataset_loading', 'config_range', 'enable_logging', 'verbose', 'capture_log', 'additional_models', 'experimental_models', 'rewrite_results', 'with_udp', 'flip_test', 'model_transformation_dict', 'report_perfsim', 'tidl_offload', 'input_optimization', 'run_dir_tree_depth', 'target_device_preset', 'fast_calibration_factor', 'param_template_file', 'settings_file', 'models_list_file'], 'dataset_cache': None}
    work_dir: ./work_dirs/modelartifacts/AM68A/8bits
    Using model configs from Python module: ./configs
    1
    -------------------------------------------------------------------
    running MODEL_ID:od-8220
    argv: ['./scripts/benchmark_modelzoo.py', 'settings_infer_on_evm.yaml', '--target_device', 'AM68A', '--run_import', 'False', '--model_selection', 'od-8220']
    settings: {'include_files': None, 'pipeline_type': 'accuracy', 'num_frames': 100, 'calibration_frames': 25, 'calibration_iterations': 25, 'configs_path': './configs', 'models_path': '../edgeai-modelzoo/models', 'modelartifacts_path': './work_dirs/modelartifacts/AM68A', 'modelpackage_path': './work_dirs/modelpackage/AM68A', 'datasets_path': './dependencies/datasets', 'target_device': 'AM68A', 'target_machine': 'evm', 'run_suffix': None, 'parallel_devices': None, 'parallel_processes': None, 'tensor_bits': 8, 'runtime_options': {'advanced_options:quantization_scale_type': 4}, 'run_import': False, 'run_inference': True, 'run_missing': True, 'detection_threshold': 0.3, 'detection_top_k': 200, 'detection_nms_threshold': None, 'detection_keep_top_k': None, 'save_output': False, 'num_output_frames': 50, 'model_selection': ['od-8220'], 'model_shortlist': None, 'model_exclusion': None, 'task_selection': None, 'runtime_selection': None, 'session_type_dict': {'onnx': 'onnxrt', 'tflite': 'tflitert', 'mxnet': 'tvmdlr'}, 'dataset_type_dict': None, 'dataset_selection': None, 'dataset_loading': True, 'config_range': None, 'enable_logging': True, 'verbose': False, 'capture_log': False, 'additional_models': False, 'experimental_models': False, 'rewrite_results': False, 'with_udp': True, 'flip_test': False, 'model_transformation_dict': None, 'report_perfsim': False, 'tidl_offload': True, 'input_optimization': None, 'run_dir_tree_depth': None, 'target_device_preset': True, 'fast_calibration_factor': 0.5, 'param_template_file': None, 'settings_file': 'settings_infer_on_evm.yaml', 'basic_keys': ['include_files', 'pipeline_type', 'num_frames', 'calibration_frames', 'calibration_iterations', 'configs_path', 'models_path', 'modelartifacts_path', 'modelpackage_path', 'datasets_path', 'target_device', 'target_machine', 'run_suffix', 'parallel_devices', 'parallel_processes', 'tensor_bits', 'runtime_options', 'run_import', 'run_inference', 'run_missing', 'detection_threshold', 
'detection_top_k', 'detection_nms_threshold', 'detection_keep_top_k', 'save_output', 'num_output_frames', 'model_selection', 'model_shortlist', 'model_exclusion', 'task_selection', 'runtime_selection', 'session_type_dict', 'dataset_type_dict', 'dataset_selection', 'dataset_loading', 'config_range', 'enable_logging', 'verbose', 'capture_log', 'additional_models', 'experimental_models', 'rewrite_results', 'with_udp', 'flip_test', 'model_transformation_dict', 'report_perfsim', 'tidl_offload', 'input_optimization', 'run_dir_tree_depth', 'target_device_preset', 'fast_calibration_factor', 'param_template_file', 'settings_file'], 'dataset_cache': None}
    work_dir: ./work_dirs/modelartifacts/AM68A/8bits
    Using model configs from Python module: ./configs

    INFO:20241011-103202: loading dataset - category:coco variant:coco

    INFO:20241011-103202: dataset exists - will reuse - ./dependencies/datasets/coco
    loading annotations into memory...
    Done (t=1.48s)
    creating index...
    index created!
    loading annotations into memory...
    Done (t=1.53s)
    creating index...
    index created!
    configs to run: ['od-8220_onnxrt_coco_edgeai-mmdet_yolox_s_lite_640x640_20220221_model_onnx']
    number of configs: 1

    INFO:20241011-103239: starting - od-8220_onnxrt_coco_edgeai-mmdet_yolox_s_lite_640x640_20220221_model_onnx
    Downloading software-dl.ti.com/.../od-8220_onnxrt_coco_edgeai-mmdet_yolox_s_lite_640x640_20220221_model_onnx.tar.gz to /mnt/edgeai-benchmark/work_dirs/modelartifacts/AM68A/8bits/od-8220_onnxrt_coco_edgeai-mmdet_yolox_s_lite_640x640_20220221_model_onnx.tar.gz
    41328640it [00:10, 3894883.00it/s]
    Extracting /mnt/edgeai-benchmark/work_dirs/modelartifacts/AM68A/8bits/od-8220_onnxrt_coco_edgeai-mmdet_yolox_s_lite_640x640_20220221_model_onnx.tar.gz to /mnt/edgeai-benchmark/work_dirs/modelartifacts/AM68A/8bits/od-8220_onnxrt_coco_edgeai-mmdet_yolox_s_lite_640x640_20220221_model_onnx
    INFO:20241011-103252: model_path - /mnt/edgeai-modelzoo/models/vision/detection/coco/edgeai-mmdet/yolox_s_lite_640x640_20220221_model.onnx
    INFO:20241011-103252: model_file - /mnt/edgeai-benchmark/work_dirs/modelartifacts/AM68A/8bits/od-8220_onnxrt_coco_edgeai-mmdet_yolox_s_lite_640x640_20220221_model_onnx/model/yolox_s_lite_640x640_20220221_model.onnx
    INFO:20241011-103252: quant_file - /mnt/edgeai-benchmark/work_dirs/modelartifacts/AM68A/8bits/od-8220_onnxrt_coco_edgeai-mmdet_yolox_s_lite_640x640_20220221_model_onnx/model/yolox_s_lite_640x640_20220221_model_qparams.prototxt

    INFO:20241011-103252: running - od-8220_onnxrt_coco_edgeai-mmdet_yolox_s_lite_640x640_20220221_model_onnx
    INFO:20241011-103252: pipeline_config - {'task_type': 'detection', 'dataset_category': 'coco', 'calibration_dataset': <edgeai_benchmark.datasets.coco_det.COCODetection object at 0xffff7e698c80>, 'input_dataset': <edgeai_benchmark.datasets.coco_det.COCODetection object at 0xffff7e69bbc0>, 'preprocess': <edgeai_benchmark.preprocess.PreProcessTransforms object at 0xffff7e653e90>, 'session': <edgeai_benchmark.sessions.onnxrt_session.ONNXRTSession object at 0xffff7e653ef0>, 'postprocess': <edgeai_benchmark.postprocess.PostProcessTransforms object at 0xffff7e668080>, 'metric': {'label_offset_pred': {0: 1, 1: 2, 2: 3, 3: 4, 4: 5, 5: 6, 6: 7, 7: 8, 8: 9, 9: 10, 10: 11, 11: 13, 12: 14, 13: 15, 14: 16, 15: 17, 16: 18, 17: 19, 18: 20, 19: 21, 20: 22, 21: 23, 22: 24, 23: 25, 24: 27, 25: 28, 26: 31, 27: 32, 28: 33, 29: 34, 30: 35, 31: 36, 32: 37, 33: 38, 34: 39, 35: 40, 36: 41, 37: 42, 38: 43, 39: 44, 40: 46, 41: 47, 42: 48, 43: 49, 44: 50, 45: 51, 46: 52, 47: 53, 48: 54, 49: 55, 50: 56, 51: 57, 52: 58, 53: 59, 54: 60, 55: 61, 56: 62, 57: 63, 58: 64, 59: 65, 60: 67, 61: 70, 62: 72, 63: 73, 64: 74, 65: 75, 66: 76, 67: 77, 68: 78, 69: 79, 70: 80, 71: 81, 72: 82, 73: 84, 74: 85, 75: 86, 76: 87, 77: 88, 78: 89, 79: 90, 80: 91}}, 'model_info': {'metric_reference': {'accuracy_ap[.5:.95]%': 38.3}, 'model_shortlist': 10, 'compact_name': 'yolox-s-lite-mmdet-coco-640x640', 'shortlisted': True, 'recommended': True}}
    INFO:20241011-103252: infer - od-8220_onnxrt_coco_edgeai-mmdet_yolox_s_lite_640x640_20220221_model_onnx - this may take some time...libtidl_onnxrt_EP loaded 0x38904e00
    Final number of subgraphs created are : 1, - Offloaded Nodes - 283, Total Nodes - 283
    APP: Init ... !!!
    2889.468819 s: MEM: Init ... !!!
    2889.468876 s: MEM: Initialized DMA HEAP (fd=6) !!!
    2889.469027 s: MEM: Init ... Done !!!
    2889.469054 s: IPC: Init ... !!!
    2889.514377 s: IPC: Init ... Done !!!
    REMOTE_SERVICE: Init ... !!!
    REMOTE_SERVICE: Init ... Done !!!
    2889.518294 s: GTC Frequency = 200 MHz
    APP: Init ... Done !!!
    2889.518416 s: VX_ZONE_INIT:Enabled
    2889.518431 s: VX_ZONE_ERROR:Enabled
    2889.518437 s: VX_ZONE_WARNING:Enabled
    2889.519250 s: VX_ZONE_INIT:[tivxPlatformCreateTargetId:124] Added target MPU-0
    2889.519440 s: VX_ZONE_INIT:[tivxPlatformCreateTargetId:124] Added target MPU-1
    2889.519603 s: VX_ZONE_INIT:[tivxPlatformCreateTargetId:124] Added target MPU-2
    2889.519715 s: VX_ZONE_INIT:[tivxPlatformCreateTargetId:124] Added target MPU-3
    2889.519729 s: VX_ZONE_INIT:[tivxInitLocal:136] Initialization Done !!!
    2889.522375 s: VX_ZONE_INIT:[tivxHostInitLocal:106] Initialization Done for HOST !!!
    infer : od-8220_onnxrt_coco_edgeai-mmdet_yolox_s_lite_640x64| 100%|##########|| 100/100 [00:02<00:00, 35.18it/s]
    2892.468131 s: VX_ZONE_INIT:[tivxHostDeInitLocal:120] De-Initialization Done for HOST !!!
    2892.472684 s: VX_ZONE_INIT:[tivxDeInitLocal:206] De-Initialization Done !!!
    APP: Deinit ... !!!
    REMOTE_SERVICE: Deinit ... !!!
    REMOTE_SERVICE: Deinit ... Done !!!
    2892.473414 s: IPC: Deinit ... !!!
    2892.475236 s: IPC: DeInit ... Done !!!
    2892.475281 s: MEM: Deinit ... !!!
    2892.475299 s: DDR_SHARED_MEM: Alloc's: 8 alloc's of 12939400 bytes
    2892.475308 s: DDR_SHARED_MEM: Free's : 8 free's of 12939400 bytes
    2892.475317 s: DDR_SHARED_MEM: Open's : 0 allocs of 0 bytes
    2892.475333 s: MEM: Deinit ... Done !!!
    APP: Deinit ... Done !!!

    INFO:20241011-103257: infer completed - od-8220_onnxrt_coco_edgeai-mmdet_yolox_s_lite_640x640_20220221_model_onnx - 6 secLoading and preparing results...
    DONE (t=0.01s)
    creating index...
    index created!
    Running per image evaluation...
    Evaluate annotation type *bbox*
    DONE (t=0.87s).
    Accumulating evaluation results...
    DONE (t=1.27s).
    Average Precision (AP) @[ IoU=0.50:0.95 | area= all | maxDets=100 ] = 0.400
    Average Precision (AP) @[ IoU=0.50 | area= all | maxDets=100 ] = 0.546
    Average Precision (AP) @[ IoU=0.75 | area= all | maxDets=100 ] = 0.431
    Average Precision (AP) @[ IoU=0.50:0.95 | area= small | maxDets=100 ] = 0.179
    Average Precision (AP) @[ IoU=0.50:0.95 | area=medium | maxDets=100 ] = 0.481
    Average Precision (AP) @[ IoU=0.50:0.95 | area= large | maxDets=100 ] = 0.520
    Average Recall (AR) @[ IoU=0.50:0.95 | area= all | maxDets= 1 ] = 0.335
    Average Recall (AR) @[ IoU=0.50:0.95 | area= all | maxDets= 10 ] = 0.439
    Average Recall (AR) @[ IoU=0.50:0.95 | area= all | maxDets=100 ] = 0.444
    Average Recall (AR) @[ IoU=0.50:0.95 | area= small | maxDets=100 ] = 0.194
    Average Recall (AR) @[ IoU=0.50:0.95 | area=medium | maxDets=100 ] = 0.503
    Average Recall (AR) @[ IoU=0.50:0.95 | area= large | maxDets=100 ] = 0.560


    SUCCESS:20241011-103300: benchmark results - {'infer_path': 'od-8220_onnxrt_coco_edgeai-mmdet_yolox_s_lite_640x640_20220221_model_onnx', 'accuracy_ap[.5:.95]%': 40.03901, 'accuracy_ap50%': 54.616241, 'num_subgraphs': 0, 'infer_time_core_ms': 10.721231, 'infer_time_subgraph_ms': 0.0, 'ddr_transfer_mb': 38.717056, 'perfsim_time_ms': 0.0, 'perfsim_ddr_transfer_mb': 0.0, 'perfsim_gmacs': 0.0}
    -------------------------------------------------------------------
    settings: {'include_files': None, 'pipeline_type': 'accuracy', 'num_frames': 100, 'calibration_frames': 25, 'calibration_iterations': 25, 'configs_path': './configs', 'models_path': '../edgeai-modelzoo/models', 'modelartifacts_path': './work_dirs/modelartifacts/', 'modelpackage_path': './work_dirs/modelpackage/', 'datasets_path': './dependencies/datasets', 'target_device': None, 'target_machine': 'evm', 'run_suffix': None, 'parallel_devices': None, 'parallel_processes': None, 'tensor_bits': 8, 'runtime_options': None, 'run_import': False, 'run_inference': True, 'run_missing': True, 'detection_threshold': 0.3, 'detection_top_k': 200, 'detection_nms_threshold': None, 'detection_keep_top_k': None, 'save_output': False, 'num_output_frames': 50, 'model_selection': 'od-8220', 'model_shortlist': None, 'model_exclusion': None, 'task_selection': None, 'runtime_selection': None, 'session_type_dict': {'onnx': 'onnxrt', 'tflite': 'tflitert', 'mxnet': 'tvmdlr'}, 'dataset_type_dict': None, 'dataset_selection': None, 'dataset_loading': True, 'config_range': None, 'enable_logging': True, 'verbose': False, 'capture_log': False, 'additional_models': False, 'experimental_models': False, 'rewrite_results': False, 'with_udp': True, 'flip_test': False, 'model_transformation_dict': None, 'report_perfsim': False, 'tidl_offload': True, 'input_optimization': None, 'run_dir_tree_depth': None, 'target_device_preset': True, 'fast_calibration_factor': None, 'param_template_file': None, 'skip_pattern': '_package', 'settings_file': 'settings_infer_on_evm.yaml', 'basic_keys': ['include_files', 'pipeline_type', 'num_frames', 'calibration_frames', 'calibration_iterations', 'configs_path', 'models_path', 'modelartifacts_path', 'modelpackage_path', 'datasets_path', 'target_device', 'target_machine', 'run_suffix', 'parallel_devices', 'parallel_processes', 'tensor_bits', 'runtime_options', 'run_import', 'run_inference', 'run_missing', 'detection_threshold', 'detection_top_k', 
'detection_nms_threshold', 'detection_keep_top_k', 'save_output', 'num_output_frames', 'model_selection', 'model_shortlist', 'model_exclusion', 'task_selection', 'runtime_selection', 'session_type_dict', 'dataset_type_dict', 'dataset_selection', 'dataset_loading', 'config_range', 'enable_logging', 'verbose', 'capture_log', 'additional_models', 'experimental_models', 'rewrite_results', 'with_udp', 'flip_test', 'model_transformation_dict', 'report_perfsim', 'tidl_offload', 'input_optimization', 'run_dir_tree_depth', 'target_device_preset', 'fast_calibration_factor', 'param_template_file', 'skip_pattern', 'settings_file'], 'dataset_cache': None}
    results found for 1 models
    Report generated at ./work_dirs/modelartifacts/

  • Can you please go through the above steps and see if anything is missing? Also, make sure that we are not missing anything trivial.

    1. Make sure you are indeed using the r10.0 modelartifacts on the r10.0 SDK.

    2. Make sure you are using the modelartifacts for the right device.

    I have also looped in Rekib from my team. Hopefully we can get to the bottom of this issue soon.

  • Hi Manu,

    it is working!!

    I removed all existing tar.gz archives and extracted model artifacts, so that only the links remained in the directory, which forced the download. The branch was at r10.0, but I think the download had already happened under the r9.2 branch, and it was therefore bypassing the download.

    Now the log looks like this:

    root@am69-sk:/mnt/edgeai-benchmark# ./run_benchmarks_evm.sh AM69A
    TARGET_SOC:     AM69A
    TARGET_MACHINE: evm
    DEBUG MODE:     false @ am69-sk:5678
    TIDL_TOOLS_PATH=/mnt/edgeai-benchmark/tools/AM69A/tidl_tools
    LD_LIBRARY_PATH=/mnt/edgeai-benchmark/tools/AM69A/tidl_tools
    PYTHONPATH=:/usr/lib/python3.12/site-packages/
    ===================================================================
    argv: ['./scripts/generate_models_list.py', 'settings_infer_on_evm.yaml', '--target_device', 'AM69A', '--models_list_file', './work_dirs/mod
    elartifacts/benchmarks_models_list.txt', '--dataset_loading', 'False']
    settings: {'include_files': None, 'pipeline_type': 'accuracy', 'num_frames': 100, 'calibration_frames': 25, 'calibration_iterations': 25, 'c
    onfigs_path': './configs', 'models_path': '../edgeai-modelzoo/models', 'modelartifacts_path': '../edgeai-modelzoo/modelartifacts/AM69A', 'mo
    delpackage_path': './work_dirs/modelpackage/AM69A', 'datasets_path': './dependencies/datasets', 'target_device': 'AM69A', 'target_machine': 
    'evm', 'run_suffix': None, 'parallel_devices': None, 'parallel_processes': None, 'tensor_bits': 8, 'runtime_options': {'advanced_options:qua
    ntization_scale_type': 4}, 'run_import': False, 'run_inference': True, 'run_missing': True, 'detection_threshold': 0.3, 'detection_top_k': 2
    00, 'detection_nms_threshold': None, 'detection_keep_top_k': None, 'save_output': False, 'num_output_frames': 50, 'model_selection': 'od-822
    0', 'model_shortlist': None, 'model_exclusion': None, 'task_selection': None, 'runtime_selection': None, 'session_type_dict': {'onnx': 'onnx
    rt', 'tflite': 'tflitert', 'mxnet': 'tvmdlr'}, 'dataset_type_dict': {'imagenet': 'imagenetv2c'}, 'dataset_selection': 'coco', 'dataset_loadi
    ng': False, 'config_range': None, 'enable_logging': True, 'verbose': False, 'capture_log': False, 'additional_models': False, 'experimental_
    models': False, 'rewrite_results': False, 'with_udp': True, 'flip_test': False, 'model_transformation_dict': None, 'report_perfsim': False, 
    'tidl_offload': True, 'input_optimization': None, 'run_dir_tree_depth': None, 'target_device_preset': True, 'fast_calibration_factor': 0.5, 
    'param_template_file': None, 'settings_file': 'settings_infer_on_evm.yaml', 'models_list_file': './work_dirs/modelartifacts/benchmarks_model
    s_list.txt', 'basic_keys': ['include_files', 'pipeline_type', 'num_frames', 'calibration_frames', 'calibration_iterations', 'configs_path', 
    'models_path', 'modelartifacts_path', 'modelpackage_path', 'datasets_path', 'target_device', 'target_machine', 'run_suffix', 'parallel_devic
    es', 'parallel_processes', 'tensor_bits', 'runtime_options', 'run_import', 'run_inference', 'run_missing', 'detection_threshold', 'detection
    _top_k', 'detection_nms_threshold', 'detection_keep_top_k', 'save_output', 'num_output_frames', 'model_selection', 'model_shortlist', 'model
    _exclusion', 'task_selection', 'runtime_selection', 'session_type_dict', 'dataset_type_dict', 'dataset_selection', 'dataset_loading', 'confi
    g_range', 'enable_logging', 'verbose', 'capture_log', 'additional_models', 'experimental_models', 'rewrite_results', 'with_udp', 'flip_test'
    , 'model_transformation_dict', 'report_perfsim', 'tidl_offload', 'input_optimization', 'run_dir_tree_depth', 'target_device_preset', 'fast_c
    alibration_factor', 'param_template_file', 'settings_file', 'models_list_file'], 'dataset_cache': None}
    work_dir: ../edgeai-modelzoo/modelartifacts/AM69A/8bits
    Using model configs from Python module: ./configs
    1
    -------------------------------------------------------------------
    running MODEL_ID:od-8220
    argv: ['./scripts/benchmark_modelzoo.py', 'settings_infer_on_evm.yaml', '--target_device', 'AM69A', '--run_import', 'False', '--model_select
    ion', 'od-8220']
    settings: {'include_files': None, 'pipeline_type': 'accuracy', 'num_frames': 100, 'calibration_frames': 25, 'calibration_iterations': 25, 'c
    onfigs_path': './configs', 'models_path': '../edgeai-modelzoo/models', 'modelartifacts_path': '../edgeai-modelzoo/modelartifacts/AM69A', 'mo
    delpackage_path': './work_dirs/modelpackage/AM69A', 'datasets_path': './dependencies/datasets', 'target_device': 'AM69A', 'target_machine': 
    'evm', 'run_suffix': None, 'parallel_devices': None, 'parallel_processes': None, 'tensor_bits': 8, 'runtime_options': {'advanced_options:qua
    ntization_scale_type': 4}, 'run_import': False, 'run_inference': True, 'run_missing': True, 'detection_threshold': 0.3, 'detection_top_k': 2
    00, 'detection_nms_threshold': None, 'detection_keep_top_k': None, 'save_output': False, 'num_output_frames': 50, 'model_selection': ['od-82
    20'], 'model_shortlist': None, 'model_exclusion': None, 'task_selection': None, 'runtime_selection': None, 'session_type_dict': {'onnx': 'on
    nxrt', 'tflite': 'tflitert', 'mxnet': 'tvmdlr'}, 'dataset_type_dict': {'imagenet': 'imagenetv2c'}, 'dataset_selection': 'coco', 'dataset_loa
    ding': True, 'config_range': None, 'enable_logging': True, 'verbose': False, 'capture_log': False, 'additional_models': False, 'experimental
    _models': False, 'rewrite_results': False, 'with_udp': True, 'flip_test': False, 'model_transformation_dict': None, 'report_perfsim': False,
     'tidl_offload': True, 'input_optimization': None, 'run_dir_tree_depth': None, 'target_device_preset': True, 'fast_calibration_factor': 0.5,
     'param_template_file': None, 'settings_file': 'settings_infer_on_evm.yaml', 'basic_keys': ['include_files', 'pipeline_type', 'num_frames', 
    'calibration_frames', 'calibration_iterations', 'configs_path', 'models_path', 'modelartifacts_path', 'modelpackage_path', 'datasets_path', 
    'target_device', 'target_machine', 'run_suffix', 'parallel_devices', 'parallel_processes', 'tensor_bits', 'runtime_options', 'run_import', '
    run_inference', 'run_missing', 'detection_threshold', 'detection_top_k', 'detection_nms_threshold', 'detection_keep_top_k', 'save_output', '
    num_output_frames', 'model_selection', 'model_shortlist', 'model_exclusion', 'task_selection', 'runtime_selection', 'session_type_dict', 'da
    taset_type_dict', 'dataset_selection', 'dataset_loading', 'config_range', 'enable_logging', 'verbose', 'capture_log', 'additional_models', '
    experimental_models', 'rewrite_results', 'with_udp', 'flip_test', 'model_transformation_dict', 'report_perfsim', 'tidl_offload', 'input_opti
    mization', 'run_dir_tree_depth', 'target_device_preset', 'fast_calibration_factor', 'param_template_file', 'settings_file'], 'dataset_cache'
    : None}
    work_dir: ../edgeai-modelzoo/modelartifacts/AM69A/8bits
    Using model configs from Python module: ./configs
    
    INFO:20241014-212407: loading dataset - category:coco variant:coco
    
    INFO:20241014-212407: dataset exists - will reuse - ./dependencies/datasets/coco
    loading annotations into memory...
    Done (t=2.09s)
    creating index...
    index created!
    loading annotations into memory...
    Done (t=1.53s)
    creating index...
    index created!
    configs to run: ['od-8220_onnxrt_coco_edgeai-mmdet_yolox_s_lite_640x640_20220221_model_onnx']
    number of configs: 1
    
    INFO:20241014-212445: starting - od-8220_onnxrt_coco_edgeai-mmdet_yolox_s_lite_640x640_20220221_model_onnx
    Downloading http://software-dl.ti.com/jacinto7/esd/modelzoo/10_00_00/modelartifacts/AM69A/8bits/od-8220_onnxrt_coco_edgeai-mmdet_yolox_s_lit
    e_640x640_20220221_model_onnx.tar.gz to /mnt/edgeai-modelzoo/modelartifacts/AM69A/8bits/od-8220_onnxrt_coco_edgeai-mmdet_yolox_s_lite_640x64
    0_20220221_model_onnx.tar.gz
     49%|█████████████████████████████████████████▊                                            | 20062208/41321734 [00:07<00:04, 4598309.25it/s]
     51%|███████████████████████████████████████████▋                                          | 20979712/41321734 [00:07<00:05, 3439805.66it/
     54%|██████████████████████████████████████████████▎                                       | 22241280/41321734 [00:08<00:04, 4466432.33it/
     56%|████████████████████████████████████████████████                                      | 23076864/41321734 [00:08<00:05, 3495530.01it/
     59%|██████████████████████████████████████████████████▉                                   | 24494080/41321734 [00:08<00:03, 4789226.94it/
     61%|████████████████████████████████████████████████████▊                                 | 25354240/41321734 [00:08<00:04, 3669746.92it/
     65%|████████████████████████████████████████████████████████▎                             | 27041792/41321734 [00:09<00:02, 5334501.36it/
     68%|██████████████████████████████████████████████████████████▎                           | 28016640/41321734 [00:09<00:03, 4058618.83it/
     71%|█████████████████████████████████████████████████████████████                         | 29368320/41321734 [00:09<00:03, 3579407.52it/
     75%|████████████████████████████████████████████████████████████████▎                     | 30924800/41321734 [00:10<00:02, 4906282.83it/
     77%|██████████████████████████████████████████████████████████████████▏                   | 31825920/41321734 [00:10<00:02, 3525260.63it/
     80%|████████████████████████████████████████████████████████████████████▍                 | 32907264/41321734 [00:10<00:01, 4337882.50it/
     82%|██████████████████████████████████████████████████████████████████████▏               | 33710080/41321734 [00:11<00:02, 3400147.91it/
     86%|█████████████████████████████████████████████████████████████████████████▊            | 35463168/41321734 [00:11<00:01, 5107792.38it/
     88%|███████████████████████████████████████████████████████████████████████████▊          | 36421632/41321734 [00:11<00:01, 3642275.91it/
     91%|██████████████████████████████████████████████████████████████████████████████▌       | 37756928/41321734 [00:12<00:01, 3414102.58it/
     95%|█████████████████████████████████████████████████████████████████████████████████▉    | 39387136/41321734 [00:12<00:00, 4789268.93it/
     98%|███████████████████████████████████████████████████████████████████████████████████▊  | 40296448/41321734 [00:12<00:00, 3789292.8
    41328640it [00:13, 3140090.88it/s]                                                                                                          
    Extracting /mnt/edgeai-modelzoo/modelartifacts/AM69A/8bits/od-8220_onnxrt_coco_edgeai-mmdet_yolox_s_lite_640x640_20220221_model_onnx.tar.gz 
    to /mnt/edgeai-modelzoo/modelartifacts/AM69A/8bits/od-8220_onnxrt_coco_edgeai-mmdet_yolox_s_lite_640x640_20220221_model_onnx
    INFO:20241014-212500: model_path - /mnt/edgeai-modelzoo/models/vision/detection/coco/edgeai-mmdet/yolox_s_lite_640x640_20220221_model.onnx
    INFO:20241014-212500: model_file - /mnt/edgeai-modelzoo/modelartifacts/AM69A/8bits/od-8220_onnxrt_coco_edgeai-mmdet_yolox_s_lite_640x640_202
    20221_model_onnx/model/yolox_s_lite_640x640_20220221_model.onnx
    INFO:20241014-212500: quant_file - /mnt/edgeai-modelzoo/modelartifacts/AM69A/8bits/od-8220_onnxrt_coco_edgeai-mmdet_yolox_s_lite_640x640_202
    20221_model_onnx/model/yolox_s_lite_640x640_20220221_model_qparams.prototxt
    
    INFO:20241014-212500: running - od-8220_onnxrt_coco_edgeai-mmdet_yolox_s_lite_640x640_20220221_model_onnx
    INFO:20241014-212500: pipeline_config - {'task_type': 'detection', 'dataset_category': 'coco', 'calibration_dataset': <edgeai_benchmark.data
    sets.coco_det.COCODetection object at 0xffff8269e000>, 'input_dataset': <edgeai_benchmark.datasets.coco_det.COCODetection object at 0xffff82
    63a990>, 'preprocess': <edgeai_benchmark.preprocess.PreProcessTransforms object at 0xffff8268b860>, 'session': <edgeai_benchmark.sessions.on
    nxrt_session.ONNXRTSession object at 0xffff8268b8c0>, 'postprocess': <edgeai_benchmark.postprocess.PostProcessTransforms object at 0xffff826
    8ba10>, 'metric': {'label_offset_pred': {0: 1, 1: 2, 2: 3, 3: 4, 4: 5, 5: 6, 6: 7, 7: 8, 8: 9, 9: 10, 10: 11, 11: 13, 12: 14, 13: 15, 14: 16
    , 15: 17, 16: 18, 17: 19, 18: 20, 19: 21, 20: 22, 21: 23, 22: 24, 23: 25, 24: 27, 25: 28, 26: 31, 27: 32, 28: 33, 29: 34, 30: 35, 31: 36, 32
    : 37, 33: 38, 34: 39, 35: 40, 36: 41, 37: 42, 38: 43, 39: 44, 40: 46, 41: 47, 42: 48, 43: 49, 44: 50, 45: 51, 46: 52, 47: 53, 48: 54, 49: 55
    , 50: 56, 51: 57, 52: 58, 53: 59, 54: 60, 55: 61, 56: 62, 57: 63, 58: 64, 59: 65, 60: 67, 61: 70, 62: 72, 63: 73, 64: 74, 65: 75, 66: 76, 67
    : 77, 68: 78, 69: 79, 70: 80, 71: 81, 72: 82, 73: 84, 74: 85, 75: 86, 76: 87, 77: 88, 78: 89, 79: 90, 80: 91}}, 'model_info': {'metric_refer
    ence': {'accuracy_ap[.5:.95]%': 38.3}, 'model_shortlist': 10, 'compact_name': 'yolox-s-lite-mmdet-coco-640x640', 'shortlisted': True, 'recom
    mended': True}}
    INFO:20241014-212500: infer  - od-8220_onnxrt_coco_edgeai-mmdet_yolox_s_lite_640x640_20220221_model_onnx - this may take some time...libtidl
    _onnxrt_EP loaded 0x349adec0 
    Final number of subgraphs created are : 1, - Offloaded Nodes - 283, Total Nodes - 283 
    APP: Init ... !!!
      1069.993881 s: MEM: Init ... !!!
      1069.993930 s: MEM: Initialized DMA HEAP (fd=6) !!!
      1069.994075 s: MEM: Init ... Done !!!
      1069.994096 s: IPC: Init ... !!!
      1070.027606 s: IPC: Init ... Done !!!
    REMOTE_SERVICE: Init ... !!!
    REMOTE_SERVICE: Init ... Done !!!
      1070.036165 s: GTC Frequency = 200 MHz
    APP: Init ... Done !!!
      1070.037971 s:  VX_ZONE_INIT:Enabled
      1070.037988 s:  VX_ZONE_ERROR:Enabled
      1070.037995 s:  VX_ZONE_WARNING:Enabled
      1070.040103 s:  VX_ZONE_INIT:[tivxPlatformCreateTargetId:124] Added target MPU-0 
      1070.040204 s:  VX_ZONE_INIT:[tivxPlatformCreateTargetId:124] Added target MPU-1 
      1070.040290 s:  VX_ZONE_INIT:[tivxPlatformCreateTargetId:124] Added target MPU-2 
      1070.040364 s:  VX_ZONE_INIT:[tivxPlatformCreateTargetId:124] Added target MPU-3 
      1070.040374 s:  VX_ZONE_INIT:[tivxInitLocal:136] Initialization Done !!!
      1070.043042 s:  VX_ZONE_INIT:[tivxHostInitLocal:106] Initialization Done for HOST !!!
    infer : od-8220_onnxrt_coco_edgeai-mmdet_yolox_s_lite_640x64| 100%|##########|| 100/100 [00:03<00:00, 25.29it/s]
      1074.108201 s:  VX_ZONE_INIT:[tivxHostDeInitLocal:120] De-Initialization Done for HOST !!!
      1074.112758 s:  VX_ZONE_INIT:[tivxDeInitLocal:206] De-Initialization Done !!!
    APP: Deinit ... !!!
    REMOTE_SERVICE: Deinit ... !!!
    REMOTE_SERVICE: Deinit ... Done !!!
      1074.113627 s: IPC: Deinit ... !!!
      1074.114322 s: IPC: DeInit ... Done !!!
      1074.114343 s: MEM: Deinit ... !!!
      1074.114355 s: DDR_SHARED_MEM: Alloc's: 8 alloc's of 13225096 bytes 
      1074.114362 s: DDR_SHARED_MEM: Free's : 8 free's  of 13225096 bytes 
      1074.114369 s: DDR_SHARED_MEM: Open's : 0 allocs  of 0 bytes 
      1074.114380 s: MEM: Deinit ... Done !!!
    APP: Deinit ... Done !!!
    
    INFO:20241014-212508: infer completed  - od-8220_onnxrt_coco_edgeai-mmdet_yolox_s_lite_640x640_20220221_model_onnx - 7 secLoading and prepar
    ing results...
    DONE (t=0.01s)
    creating index...
    index created!
    Running per image evaluation...
    Evaluate annotation type *bbox*
    DONE (t=0.81s).
    Accumulating evaluation results...
    DONE (t=1.18s).
     Average Precision  (AP) @[ IoU=0.50:0.95 | area=   all | maxDets=100 ] = 0.400
     Average Precision  (AP) @[ IoU=0.50      | area=   all | maxDets=100 ] = 0.546
     Average Precision  (AP) @[ IoU=0.75      | area=   all | maxDets=100 ] = 0.431
     Average Precision  (AP) @[ IoU=0.50:0.95 | area= small | maxDets=100 ] = 0.179
     Average Precision  (AP) @[ IoU=0.50:0.95 | area=medium | maxDets=100 ] = 0.481
     Average Precision  (AP) @[ IoU=0.50:0.95 | area= large | maxDets=100 ] = 0.520
     Average Recall     (AR) @[ IoU=0.50:0.95 | area=   all | maxDets=  1 ] = 0.335
     Average Recall     (AR) @[ IoU=0.50:0.95 | area=   all | maxDets= 10 ] = 0.439
     Average Recall     (AR) @[ IoU=0.50:0.95 | area=   all | maxDets=100 ] = 0.444
     Average Recall     (AR) @[ IoU=0.50:0.95 | area= small | maxDets=100 ] = 0.194
     Average Recall     (AR) @[ IoU=0.50:0.95 | area=medium | maxDets=100 ] = 0.503
     Average Recall     (AR) @[ IoU=0.50:0.95 | area= large | maxDets=100 ] = 0.560
    
    
    SUCCESS:20241014-212510: benchmark results - {'infer_path': 'od-8220_onnxrt_coco_edgeai-mmdet_yolox_s_lite_640x640_20220221_model_onnx', 'ac
    curacy_ap[.5:.95]%': 40.03901, 'accuracy_ap50%': 54.616241, 'num_subgraphs': 0, 'infer_time_core_ms': 11.123727, 'infer_time_subgraph_ms': 0
    .0, 'ddr_transfer_mb': 37.148828, 'perfsim_time_ms': 0.0, 'perfsim_ddr_transfer_mb': 0.0, 'perfsim_gmacs': 0.0}
    -------------------------------------------------------------------
    settings: {'include_files': None, 'pipeline_type': 'accuracy', 'num_frames': 100, 'calibration_frames': 25, 'calibration_iterations': 25, 'c
    onfigs_path': './configs', 'models_path': '../edgeai-modelzoo/models', 'modelartifacts_path': '../edgeai-modelzoo/modelartifacts/', 'modelpa
    ckage_path': './work_dirs/modelpackage/', 'datasets_path': './dependencies/datasets', 'target_device': None, 'target_machine': 'evm', 'run_s
    uffix': None, 'parallel_devices': None, 'parallel_processes': None, 'tensor_bits': 8, 'runtime_options': None, 'run_import': False, 'run_inf
    erence': True, 'run_missing': True, 'detection_threshold': 0.3, 'detection_top_k': 200, 'detection_nms_threshold': None, 'detection_keep_top
    _k': None, 'save_output': False, 'num_output_frames': 50, 'model_selection': 'od-8220', 'model_shortlist': None, 'model_exclusion': None, 't
    ask_selection': None, 'runtime_selection': None, 'session_type_dict': {'onnx': 'onnxrt', 'tflite': 'tflitert', 'mxnet': 'tvmdlr'}, 'dataset_
    type_dict': {'imagenet': 'imagenetv2c'}, 'dataset_selection': 'coco', 'dataset_loading': True, 'config_range': None, 'enable_logging': True,
     'verbose': False, 'capture_log': False, 'additional_models': False, 'experimental_models': False, 'rewrite_results': False, 'with_udp': Tru
    e, 'flip_test': False, 'model_transformation_dict': None, 'report_perfsim': False, 'tidl_offload': True, 'input_optimization': None, 'run_di
    r_tree_depth': None, 'target_device_preset': True, 'fast_calibration_factor': None, 'param_template_file': None, 'skip_pattern': '_package',
     'settings_file': 'settings_infer_on_evm.yaml', 'basic_keys': ['include_files', 'pipeline_type', 'num_frames', 'calibration_frames', 'calibr
    ation_iterations', 'configs_path', 'models_path', 'modelartifacts_path', 'modelpackage_path', 'datasets_path', 'target_device', 'target_mach
    ine', 'run_suffix', 'parallel_devices', 'parallel_processes', 'tensor_bits', 'runtime_options', 'run_import', 'run_inference', 'run_missing'
    , 'detection_threshold', 'detection_top_k', 'detection_nms_threshold', 'detection_keep_top_k', 'save_output', 'num_output_frames', 'model_se
    lection', 'model_shortlist', 'model_exclusion', 'task_selection', 'runtime_selection', 'session_type_dict', 'dataset_type_dict', 'dataset_se
    lection', 'dataset_loading', 'config_range', 'enable_logging', 'verbose', 'capture_log', 'additional_models', 'experimental_models', 'rewrit
    e_results', 'with_udp', 'flip_test', 'model_transformation_dict', 'report_perfsim', 'tidl_offload', 'input_optimization', 'run_dir_tree_dept
    h', 'target_device_preset', 'fast_calibration_factor', 'param_template_file', 'skip_pattern', 'settings_file'], 'dataset_cache': None}
    results found for 1 models
    Report generated at ../edgeai-modelzoo/modelartifacts/
    -------------------------------------------------------------------
    

    With this the inference time for the od-8220 model is

    'infer_time_core_ms': 11.123727

    Regards,

    --Gunter