123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174 |
- nohup: ignoring input
- [W Context.cpp:69] Warning: torch.set_deterministic is in beta, and its design and functionality may change in the future. (function operator())
- [36m[15 03:44:50 <frozen super_pulsar.proto.configuration_super_pulsar_manip>:39] [0m[1;31mWRN migrate all stand-alone args into a single task[0m
- [36m[15 03:44:50 <frozen super_pulsar.proto.configuration_super_pulsar_manip>:159] [0mset task task_0's 0th input model path as /root/axera/axera-quan-hjj/model/yolov8n-pose.onnx
- [36m[15 03:44:50 <frozen super_pulsar.proto.configuration_super_pulsar_manip>:178] [0mset task task_0's 0th output model path as /root/axera/axera-quan-hjj/joint/yolov8n-pose.joint
- [36m[15 03:44:50 <frozen super_pulsar.proto.configuration_super_pulsar_manip>:297] [0mset task task_0's pulsar_conf.output_dir as /root/axera/axera-quan-hjj
- /opt/venv/lib/python3.6/site-packages/torch/cuda/__init__.py:52: UserWarning: CUDA initialization: Found no NVIDIA driver on your system. Please check that you have an NVIDIA GPU and installed a driver from http://www.nvidia.com/Download/index.aspx (Triggered internally at /pytorch/c10/cuda/CUDAFunctions.cpp:100.)
- return torch._C._cuda_getDeviceCount() > 0
- [36m[15 03:44:51 <frozen super_pulsar.func_wrappers.wrapper_pulsar_build>:17] [0mplanning task task_0
- [36m[15 03:44:51 <frozen super_pulsar.func_wrappers.pulsar_build.neuwizard_step>:459] [0m[1;31mWRN affine_preprocess at QAT model compiling is deprecated, insert enforce_integers at front, please use scale_to_integers instead.[0m
- [36m[15 03:44:51 <frozen super_pulsar.func_wrappers.wrapper_pulsar_build>:340] [0m################## Running task task_0 ##################
- [36m[15 03:44:51 <frozen super_pulsar.toolchain_wrappers.wrapper_neuwizard>:30] [0mpython3 /root/python_modules/super_pulsar/super_pulsar/toolchain_wrappers/wrapper_neuwizard.py --config /tmp/tmppybjgzd8.prototxt
- [36m[15 03:44:52 <frozen super_pulsar.toolchain_wrappers.wrapper_neuwizard>:36] [0m[32mDBG [neuwizard] [W Context.cpp:69] Warning: torch.set_deterministic is in beta, and its design and functionality may change in the future. (function operator())[0m
- [36m[15 03:45:20 <frozen super_pulsar.toolchain_wrappers.wrapper_neuwizard>:36] [0m[32mDBG [neuwizard] ONNX Model Version 12 for "/root/axera/axera-quan-hjj/model/yolov8n-pose.onnx"[0m
- [36m[15 03:45:20 <frozen super_pulsar.toolchain_wrappers.wrapper_neuwizard>:36] [0m[32mDBG [neuwizard] Planning load step finished; elapsed time: 0.01s[0m
- [36m[15 03:45:20 <frozen super_pulsar.toolchain_wrappers.wrapper_neuwizard>:36] [0m[32mDBG [neuwizard] Planning transform step finished; elapsed time: 0.01s[0m
- [36m[15 03:45:20 <frozen super_pulsar.toolchain_wrappers.wrapper_neuwizard>:36] [0m[32mDBG [neuwizard] Planning transform step finished; elapsed time: 0.00s[0m
- [36m[15 03:45:20 <frozen super_pulsar.toolchain_wrappers.wrapper_neuwizard>:36] [0m[32mDBG [neuwizard] Planning transform step finished; elapsed time: 0.00s[0m
- [36m[15 03:45:20 <frozen super_pulsar.toolchain_wrappers.wrapper_neuwizard>:36] [0m[32mDBG [neuwizard] Planning transform step to "native" finished; elapsed time: 0.18s[0m
- [36m[15 03:45:20 <frozen super_pulsar.toolchain_wrappers.wrapper_neuwizard>:36] [0m[32mDBG [neuwizard] Planning transform step to "native_no_bn" finished; elapsed time: 0.00s[0m
- [36m[15 03:45:20 <frozen super_pulsar.toolchain_wrappers.wrapper_neuwizard>:36] [0m[32mDBG [neuwizard] Planning transform step to "pretransformed" finished; elapsed time: 0.33s[0m
- [36m[15 03:45:20 <frozen super_pulsar.toolchain_wrappers.wrapper_neuwizard>:36] [0m[32mDBG [neuwizard] Planning calibrate step finished; elapsed time: 0.00s[0m
- [36m[15 03:45:20 <frozen super_pulsar.toolchain_wrappers.wrapper_neuwizard>:36] [0m[32mDBG [neuwizard] Planning transform step to "transformed" finished; elapsed time: 21.52s[0m
- [36m[15 03:45:20 <frozen super_pulsar.toolchain_wrappers.wrapper_neuwizard>:36] [0m[32mDBG [neuwizard] Planning transform step to "posttransformed" finished; elapsed time: 1.51s[0m
- [36m[15 03:45:20 <frozen super_pulsar.toolchain_wrappers.wrapper_neuwizard>:36] [0m[32mDBG [neuwizard] Planning transform step to "magma" finished; elapsed time: 0.45s[0m
- [36m[15 03:45:20 <frozen super_pulsar.toolchain_wrappers.wrapper_neuwizard>:36] [0m[32mDBG [neuwizard] Planning transform step to "magma_validified" finished; elapsed time: 0.12s[0m
- [36m[15 03:45:20 <frozen super_pulsar.toolchain_wrappers.wrapper_neuwizard>:36] [0m[32mDBG [neuwizard] Planning transform step to "lava_with_rtv" finished; elapsed time: 2.70s[0m
- [36m[15 03:45:20 <frozen super_pulsar.toolchain_wrappers.wrapper_neuwizard>:36] [0m[32mDBG [neuwizard] Planning dump_joint_model step finished; elapsed time: 0.00s[0m
- [36m[15 03:45:20 <frozen super_pulsar.toolchain_wrappers.wrapper_neuwizard>:36] [0m[32mDBG [neuwizard] Planning evaluate step finished; elapsed time: 0.00s[0m
- [36m[15 03:45:20 <frozen super_pulsar.toolchain_wrappers.wrapper_neuwizard>:36] [0m[32mDBG [neuwizard] Planning ir_bit_macs step finished; elapsed time: 0.00s[0m
- [36m[15 03:45:20 <frozen super_pulsar.toolchain_wrappers.wrapper_neuwizard>:36] [0m[32mDBG [neuwizard] Planning ir_bit_float_params step finished; elapsed time: 0.00s[0m
- [36m[15 03:45:20 <frozen super_pulsar.toolchain_wrappers.wrapper_neuwizard>:36] [0m[32mDBG [neuwizard] Planning ir_bit_quantized_params step finished; elapsed time: 0.00s[0m
- [36m[15 03:45:20 <frozen super_pulsar.toolchain_wrappers.wrapper_neuwizard>:36] [0m[32mDBG [neuwizard] Loading model finished; elapsed time: 0.00s[0m
- [36m[15 03:45:20 <frozen super_pulsar.toolchain_wrappers.wrapper_neuwizard>:36] [0m[32mDBG [neuwizard] Transforming to "onnx_step_1" finished; elapsed time: 0.01s[0m
- [36m[15 03:45:20 <frozen super_pulsar.toolchain_wrappers.wrapper_neuwizard>:36] [0m[32mDBG [neuwizard] Transforming to "onnx_step_2" finished; elapsed time: 0.00s[0m
- [36m[15 03:45:20 <frozen super_pulsar.toolchain_wrappers.wrapper_neuwizard>:36] [0m[32mDBG [neuwizard] Transforming to "onnx" finished; elapsed time: 0.00s[0m
- [36m[15 03:45:20 <frozen super_pulsar.toolchain_wrappers.wrapper_neuwizard>:36] [0m[32mDBG [neuwizard] Transforming to "native" finished; elapsed time: 0.08s[0m
- [36m[15 03:45:20 <frozen super_pulsar.toolchain_wrappers.wrapper_neuwizard>:36] [0m[32mDBG [neuwizard] Transforming to "native_no_bn" finished; elapsed time: 0.00s[0m
- [36m[15 03:45:20 <frozen super_pulsar.toolchain_wrappers.wrapper_neuwizard>:36] [0m[32mDBG [neuwizard] Transforming to "pretransformed" finished; elapsed time: 0.12s[0m
- [36m[15 03:45:20 <frozen super_pulsar.toolchain_wrappers.wrapper_neuwizard>:36] [0m[32mDBG [neuwizard] /opt/venv/lib/python3.6/site-packages/torch/cuda/__init__.py:52: UserWarning: CUDA initialization: Found no NVIDIA driver on your system. Please check that you have an NVIDIA GPU and installed a driver from http://www.nvidia.com/Download/index.aspx (Triggered internally at /pytorch/c10/cuda/CUDAFunctions.cpp:100.)[0m
- [36m[15 03:45:20 <frozen super_pulsar.toolchain_wrappers.wrapper_neuwizard>:36] [0m[32mDBG [neuwizard] return torch._C._cuda_getDeviceCount() > 0[0m
- [36m[15 03:47:55 <frozen super_pulsar.toolchain_wrappers.wrapper_neuwizard>:36] [0m[32mDBG [neuwizard] Calibrating finished; elapsed time: 154.35s[0m
- [36m[15 03:47:55 <frozen super_pulsar.toolchain_wrappers.wrapper_neuwizard>:36] [0m[32mDBG [neuwizard] Recalibrating for op_267_FeatureQuantization_Global_Backward, op_266:cat is missing[0m
- [36m[15 04:21:16 <frozen super_pulsar.toolchain_wrappers.wrapper_neuwizard>:36] [0m[32mDBG [neuwizard] Recalibrating for op_311_FeatureQuantization_Global_Backward, op_310:cat is missing[0m
- [36m[15 05:12:19 <frozen super_pulsar.toolchain_wrappers.wrapper_neuwizard>:36] [0m[32mDBG [neuwizard] Recalibrating for op_333_FeatureQuantization_Global_Backward, op_332:cat is missing[0m
- [36m[15 06:02:36 <frozen super_pulsar.toolchain_wrappers.wrapper_neuwizard>:36] [0m[32mDBG [neuwizard] Recalibrating for op_380_FeatureQuantization_Global_Backward, op_379:cat is missing[0m
- [36m[15 06:53:01 <frozen super_pulsar.toolchain_wrappers.wrapper_neuwizard>:36] [0m[32mDBG [neuwizard] Recalibrating for op_402_FeatureQuantization_Global_Backward, op_401:cat is missing[0m
- [36m[15 07:44:43 <frozen super_pulsar.toolchain_wrappers.wrapper_neuwizard>:36] [0m[32mDBG [neuwizard] Transforming to "transformed" finished; elapsed time: 14206.47s[0m
- [36m[15 07:44:43 <frozen super_pulsar.toolchain_wrappers.wrapper_neuwizard>:36] [0m[32mDBG [neuwizard] Transforming to "posttransformed" finished; elapsed time: 0.63s[0m
- [36m[15 07:44:43 <frozen super_pulsar.toolchain_wrappers.wrapper_neuwizard>:36] [0m[32mDBG [neuwizard] Transforming to "magma" finished; elapsed time: 0.21s[0m
- [36m[15 07:44:43 <frozen super_pulsar.toolchain_wrappers.wrapper_neuwizard>:36] [0m[32mDBG [neuwizard] Transforming to "magma_validified" finished; elapsed time: 0.04s[0m
- [36m[15 07:44:43 <frozen super_pulsar.toolchain_wrappers.wrapper_neuwizard>:36] [0m[32mDBG [neuwizard] Transforming to "lava_with_rtv" finished; elapsed time: 1.31s[0m
- [36m[15 07:44:43 <frozen super_pulsar.toolchain_wrappers.wrapper_neuwizard>:36] [0m[32mDBG [neuwizard] Dynamically planning transform step to "lava" finished; elapsed time: 0.01s[0m
- [36m[15 07:44:43 <frozen super_pulsar.toolchain_wrappers.wrapper_neuwizard>:36] [0m[32mDBG [neuwizard] Transforming to "lava" dynamically finished; elapsed time: 0.02s[0m
- [36m[15 07:44:43 <frozen super_pulsar.toolchain_wrappers.wrapper_neuwizard>:36] [0m[32mDBG [neuwizard] Dynamically planning transform step to "lava_onnx" finished; elapsed time: 0.13s[0m
- [36m[15 07:44:43 <frozen super_pulsar.toolchain_wrappers.wrapper_neuwizard>:36] [0m[32mDBG [neuwizard] Transforming to "lava_onnx" dynamically finished; elapsed time: 0.18s[0m
- [36m[15 07:44:43 <frozen super_pulsar.toolchain_wrappers.wrapper_neuwizard>:36] [0m[32mDBG [neuwizard] Dynamically planning transform step to "lava_onnx_axe" finished; elapsed time: 0.01s[0m
- [36m[15 07:44:43 <frozen super_pulsar.toolchain_wrappers.wrapper_neuwizard>:36] [0m[32mDBG [neuwizard] Transforming to "lava_onnx_axe" dynamically finished; elapsed time: 0.02s[0m
- [36m[15 07:44:51 <frozen super_pulsar.toolchain_wrappers.wrapper_neuwizard>:36] [0m[32mDBG [neuwizard] /root/python_modules/neuwizard-latest/neuwizard/operators/lava/AX620/Conv2d.py:141: UserWarning: The given NumPy array is not writeable, and PyTorch does not support non-writeable tensors. This means you can write to the underlying (supposedly non-writeable) NumPy array using the tensor. You may want to copy the array to protect its data or make it writeable before converting it to a tensor. This type of warning will be suppressed for the rest of this program. (Triggered internally at /pytorch/torch/csrc/utils/tensor_numpy.cpp:141.)[0m
- [36m[15 07:44:51 <frozen super_pulsar.toolchain_wrappers.wrapper_neuwizard>:36] [0m[32mDBG [neuwizard] Joint model dumpped as "/root/axera/axera-quan-hjj/joint/model.lava_joint"[0m
- [36m[15 07:44:51 <frozen super_pulsar.toolchain_wrappers.wrapper_neuwizard>:36] [0m[32mDBG [neuwizard] Dumping Joint Model finished; elapsed time: 6.19s[0m
- [36m[15 07:44:51 <frozen super_pulsar.toolchain_wrappers.wrapper_neuwizard>:36] [0m[32mDBG [neuwizard] Evaluation is not performed.[0m
- [36m[15 07:44:51 <frozen super_pulsar.toolchain_wrappers.wrapper_neuwizard>:36] [0m[32mDBG [neuwizard] Evaluating finished; elapsed time: 0.00s[0m
- [36m[15 07:44:51 <frozen super_pulsar.toolchain_wrappers.wrapper_neuwizard>:36] [0m[32mDBG [neuwizard] Overview Table of Bit MACs[0m
- [36m[15 07:44:51 <frozen super_pulsar.toolchain_wrappers.wrapper_neuwizard>:36] [0m[32mDBG [neuwizard] | Domain | native | pretransformed | transformed | posttransformed | magma | lava |[0m
- [36m[15 07:44:51 <frozen super_pulsar.toolchain_wrappers.wrapper_neuwizard>:36] [0m[32mDBG [neuwizard] |----------|----------|------------------|---------------|-------------------|---------|--------|[0m
- [36m[15 07:44:51 <frozen super_pulsar.toolchain_wrappers.wrapper_neuwizard>:36] [0m[32mDBG [neuwizard] | Bit MACs | 294G | 299G | 303G | 340G | 317G | 328G |[0m
- [36m[15 07:44:51 <frozen super_pulsar.toolchain_wrappers.wrapper_neuwizard>:36] [0m[32mDBG [neuwizard] Bit MACs measurement for each domain finished; elapsed time: 0.12s[0m
- [36m[15 07:44:51 <frozen super_pulsar.toolchain_wrappers.wrapper_neuwizard>:36] [0m[32mDBG [neuwizard] Overview Table of parameter size[0m
- [36m[15 07:44:51 <frozen super_pulsar.toolchain_wrappers.wrapper_neuwizard>:36] [0m[32mDBG [neuwizard] | Domain | native | pretransformed | transformed | posttransformed | magma | lava |[0m
- [36m[15 07:44:51 <frozen super_pulsar.toolchain_wrappers.wrapper_neuwizard>:36] [0m[32mDBG [neuwizard] |----------------------|----------|------------------|---------------|-------------------|---------|--------|[0m
- [36m[15 07:44:51 <frozen super_pulsar.toolchain_wrappers.wrapper_neuwizard>:36] [0m[32mDBG [neuwizard] | Parameter Size(bits) | 105M | 107M | 108M | 115M | 115M | 144M |[0m
- [36m[15 07:44:51 <frozen super_pulsar.toolchain_wrappers.wrapper_neuwizard>:36] [0m[32mDBG [neuwizard] Float Parameter size measurement for each domain finished; elapsed time: 0.20s[0m
- [36m[15 07:44:51 <frozen super_pulsar.toolchain_wrappers.wrapper_neuwizard>:36] [0m[32mDBG [neuwizard] Overview Table of parameter size[0m
- [36m[15 07:44:51 <frozen super_pulsar.toolchain_wrappers.wrapper_neuwizard>:36] [0m[32mDBG [neuwizard] | Domain | native | pretransformed | transformed | posttransformed | magma | lava |[0m
- [36m[15 07:44:51 <frozen super_pulsar.toolchain_wrappers.wrapper_neuwizard>:36] [0m[32mDBG [neuwizard] |----------------------|----------|------------------|---------------|-------------------|---------|--------|[0m
- [36m[15 07:44:51 <frozen super_pulsar.toolchain_wrappers.wrapper_neuwizard>:36] [0m[32mDBG [neuwizard] | Parameter Size(bits) | 26M | 27M | 27M | 29M | 28M | 29M |[0m
- [36m[15 07:44:51 <frozen super_pulsar.toolchain_wrappers.wrapper_neuwizard>:36] [0m[32mDBG [neuwizard] Quantized Parameter size measurement for each domain finished; elapsed time: 0.40s[0m
- [36m[15 07:44:55 <frozen super_pulsar.toolchain_wrappers.wrapper_toolchain>:535] [0m[32mDBG working in "/root/tmp_45ri310"[0m
- [36m[15 07:44:55 <frozen super_pulsar.toolchain_wrappers.wrapper_pulsar_compiler>:227] [0mpython3 pulsar.py gen /root/tmp_45ri310/part_0.lava/part_0.lava env/ax620a_virtual_111_config.ini -b 1 -pe 16 --times_thres 0 --job_stealing 3 --checkall --param_compress --continuous_input --no_sim --hyper_params run_cf.wait_mode=True
- [36m[15 07:49:01 <frozen super_pulsar.toolchain_wrappers.wrapper_pulsar_compiler>:250] [0m[32mDBG [pulsar] [0m
- [36m[15 07:49:01 <frozen super_pulsar.toolchain_wrappers.wrapper_pulsar_compiler>:250] [0m[32mDBG [pulsar] inference_report.log:[0m
- [36m[15 07:49:01 <frozen super_pulsar.toolchain_wrappers.wrapper_pulsar_compiler>:250] [0m[32mDBG [pulsar] [0m
- [36m[15 07:49:01 <frozen super_pulsar.toolchain_wrappers.wrapper_pulsar_compiler>:250] [0m[32mDBG [pulsar] |:-------------------------|:-----------------------------|:-------------|:-------------------|[0m
- [36m[15 07:49:01 <frozen super_pulsar.toolchain_wrappers.wrapper_pulsar_compiler>:250] [0m[32mDBG [pulsar] [0m
- [36m[15 07:49:01 <frozen super_pulsar.toolchain_wrappers.wrapper_pulsar_compiler>:250] [0m[32mDBG [pulsar] |:---------------|:-----------------|:--------------|:--------------|:------------|:--------------|:----------------|:-------------------|:----------------|[0m
- [36m[15 07:49:01 <frozen super_pulsar.toolchain_wrappers.wrapper_pulsar_compiler>:250] [0m[32mDBG [pulsar] [0m
- [36m[15 07:49:01 <frozen super_pulsar.toolchain_wrappers.wrapper_pulsar_compiler>:250] [0m[32mDBG [pulsar] |:-----------------------|:-----------------|:------------------|:------------------|:--------------------|[0m
- [36m[15 07:49:01 <frozen super_pulsar.toolchain_wrappers.wrapper_pulsar_compiler>:250] [0m[32mDBG [pulsar] [0m
- [36m[15 07:49:01 <frozen super_pulsar.toolchain_wrappers.wrapper_pulsar_compiler>:250] [0m[32mDBG [pulsar] |:-----------------------|:-----------------|:--------------------|:--------------------|:--------------------|:------------------|:-----------------|:--------------|:-------------|[0m
- [36m[15 07:49:01 <frozen super_pulsar.toolchain_wrappers.wrapper_pulsar_compiler>:250] [0m[32mDBG [pulsar] [0m
- [36m[15 07:49:01 <frozen super_pulsar.toolchain_wrappers.wrapper_pulsar_compiler>:250] [0m[32mDBG [pulsar] profile stream EU: ld/st_ratio might include ringbuf/linebuf/feature_swap parts; mv_ratio migth have ringbuf part.[0m
- [36m[15 07:49:01 <frozen super_pulsar.toolchain_wrappers.wrapper_pulsar_compiler>:250] [0m[32mDBG [pulsar] [0m
- [36m[15 07:49:01 <frozen super_pulsar.toolchain_wrappers.wrapper_pulsar_compiler>:250] [0m[32mDBG [pulsar] |:--------------------|-----------:|:-------------|:-----------------|:---------------|:----------------------|:---------------|[0m
- [36m[15 07:49:01 <frozen super_pulsar.toolchain_wrappers.wrapper_pulsar_compiler>:250] [0m[32mDBG [pulsar] [0m
- [36m[15 07:49:01 <frozen super_pulsar.toolchain_wrappers.wrapper_pulsar_compiler>:250] [0m[32mDBG [pulsar] |:---------------------------------------------|:----------------|:-----------------------|[0m
- [36m[15 07:49:01 <frozen super_pulsar.toolchain_wrappers.wrapper_pulsar_compiler>:250] [0m[32mDBG [pulsar] [0m
- [36m[15 07:49:01 <frozen super_pulsar.toolchain_wrappers.wrapper_pulsar_compiler>:250] [0m[32mDBG [pulsar] |:-----------|-----------:|----------:|:--------|-------:|----------:|[0m
- [36m[15 07:49:01 <frozen super_pulsar.toolchain_wrappers.wrapper_pulsar_compiler>:250] [0m[32mDBG [pulsar] [0m
- [36m[15 07:49:01 <frozen super_pulsar.toolchain_wrappers.wrapper_pulsar_compiler>:250] [0m[32mDBG [pulsar] inference: 16.8 ms, 59.59 fps[0m
- [36m[15 07:49:01 <frozen super_pulsar.toolchain_wrappers.wrapper_pulsar_compiler>:250] [0m[32mDBG [pulsar] qps = fps * batch_size = 59.59[0m
- [36m[15 07:49:01 <frozen super_pulsar.toolchain_wrappers.wrapper_pulsar_compiler>:250] [0m[32mDBG [pulsar] [0m
- [36m[15 07:49:01 <frozen super_pulsar.toolchain_wrappers.wrapper_pulsar_compiler>:250] [0m[32mDBG [pulsar] simulated fps is based on DDR_BW: 1.59 GB/s[0m
- [36m[15 07:49:01 <frozen super_pulsar.toolchain_wrappers.wrapper_pulsar_compiler>:250] [0m[32mDBG [pulsar] [0m
- [36m[15 07:49:01 <frozen super_pulsar.toolchain_wrappers.wrapper_pulsar_compiler>:250] [0m[32mDBG [pulsar] DDR IO stats:[0m
- [36m[15 07:49:01 <frozen super_pulsar.toolchain_wrappers.wrapper_pulsar_compiler>:250] [0m[32mDBG [pulsar] ideal_input_data_size: 4441088 Byte,[0m
- [36m[15 07:49:01 <frozen super_pulsar.toolchain_wrappers.wrapper_pulsar_compiler>:250] [0m[32mDBG [pulsar] ideal_output_data_size: 3897600 Byte,[0m
- [36m[15 07:49:01 <frozen super_pulsar.toolchain_wrappers.wrapper_pulsar_compiler>:250] [0m[32mDBG [pulsar] extra_mid_io_data_size: 5366528 Byte,[0m
- [36m[15 07:49:01 <frozen super_pulsar.toolchain_wrappers.wrapper_pulsar_compiler>:250] [0m[32mDBG [pulsar] total_io_data_size: 13705216 Byte[0m
- [36m[15 07:49:01 <frozen super_pulsar.toolchain_wrappers.wrapper_pulsar_compiler>:250] [0m[32mDBG [pulsar] [0m
- [36m[15 07:49:01 <frozen super_pulsar.toolchain_wrappers.wrapper_pulsar_compiler>:250] [0m[32mDBG [pulsar] MAC per inference: 5119759360 MAC@int8[0m
- [36m[15 07:49:01 <frozen super_pulsar.toolchain_wrappers.wrapper_pulsar_compiler>:250] [0m[32mDBG [pulsar] MAC utils: 33.10 %[0m
- [36m[15 07:49:01 <frozen super_pulsar.toolchain_wrappers.wrapper_pulsar_compiler>:250] [0m[32mDBG [pulsar] [0m
- [36m[15 07:49:01 <frozen super_pulsar.toolchain_wrappers.wrapper_pulsar_compiler>:250] [0m[32mDBG [pulsar] commit_id:[0m
- [36m[15 07:49:01 <frozen super_pulsar.toolchain_wrappers.wrapper_pulsar_compiler>:250] [0m[32mDBG [pulsar] [0m
- [36m[15 07:49:01 <frozen super_pulsar.toolchain_wrappers.wrapper_pulsar_compiler>:250] [0m[32mDBG [pulsar] |:----------------------------------------------|-----------:|:-------------|[0m
- [36m[15 07:49:01 <frozen super_pulsar.toolchain_wrappers.wrapper_pulsar_compiler>:250] [0m[32mDBG [pulsar] [0m
- [36m[15 07:49:01 <frozen super_pulsar.toolchain_wrappers.wrapper_pulsar_compiler>:250] [0m[32mDBG [pulsar] subgraph num: 5[0m
- [36m[15 07:49:01 <frozen super_pulsar.toolchain_wrappers.wrapper_pulsar_compiler>:250] [0m[32mDBG [pulsar] [0m
- [36m[15 07:49:01 <frozen super_pulsar.toolchain_wrappers.wrapper_pulsar_compiler>:250] [0m[32mDBG [pulsar] pulsar.py totally used 245s[0m
- [36m[15 07:49:20 <frozen super_pulsar.toolchain_wrappers.wrapper_toolchain>:582] [0mFile saved: /root/axera/axera-quan-hjj/joint/yolov8n-pose.joint
- [36m[15 07:49:20 <frozen super_pulsar.toolchain_wrappers.wrapper_toolchain>:587] [0m[32mDBG cleared /root/tmp_45ri310[0m
- [0;32m| Pre_alloc OCM | linebuffer(may SWAP later) | ringbuffer | parameter |[0m
- [0;32m| size(ratio of whole OCM) | 72960(3.5)% | 0(0.0)% | 112128(5.3)% |[0m
- [0;32m| range | (1912064, 1985024) | (None, None) | (1985024, 2097152) |[0m
- [0;32m| profile conv | work_cyc | linebuf | warmup_tail | core_idle | io_idle | stride2_idle | standalone_fetch | MAC |[0m
- [0;32m| ratio in conv | 6977493 (100.0%) | 167731 (2.4%) | 260365 (3.7%) | 0 (0.0%) | 180533 (2.6%) | 1499023 (21.5%) | 285 (0.0%) | 4444235 (63.7%) |[0m
- [0;32m| profile ideal DDR_IO | min_io_sum | min_params_read | min_inputs_read | min_outputs_write |[0m
- [0;32m| DDR IO size (Byte) | 8338688 (100.0%) | 4031488 (48.3%) | 409600 (4.9%) | 3897600 (46.7%) |[0m
- [0;32m| profile extra DDR_IO | extra_ddr_io | extra_params_read | extra_inputs_read | extra_outputs_wrt | extra_swap_read | extra_swap_wrt | ddr_rb_read | ddr_rb_wrt |[0m
- [0;32m| DDR IO size (Byte) | 5366528 (100.0%) | 2499328 (46.6%) | 1484800 (27.7%) | 1382400 (25.8%) | 0 (0.0%) | 0 (0.0%) | 0 (0.0%) | 0 (0.0%) |[0m
- [0;32m| profile stream EU | work_cyc | ld_ratio | ld_param_ratio | mv_ratio | mv_linebuffer_ratio | st_ratio |[0m
- [0;32m| teng | 11685635 | 958075(8.2%) | 3473475(29.7%) | 4462406(38.2%) | 126068(1.1%) | 2665610(22.8%) |[0m
- [0;32m| breakdown of mv_ratio in profile stream EU | teng | all_eus with mv-cmds |[0m
- [0;32m| total_cyc_num | 4462406(100.0%) | 4462406(100.0%) |[0m
- [0;32m| mv,affine,unpack_lsb | 2099343(47.0%) | 2099343(47.0%) |[0m
- [0;32m| weight0_mode,convNxM,mode23,nopad | 729952(16.4%) | 729952(16.4%) |[0m
- [0;32m| mv,subtensor | 541404(12.1%) | 541404(12.1%) |[0m
- [0;32m| mv,concat_c | 291234(6.5%) | 291234(6.5%) |[0m
- [0;32m| mv_patch | 262377(5.9%) | 262377(5.9%) |[0m
- [0;32m| weight0_mode,convNxM,mode20,nopad | 214922(4.8%) | 214922(4.8%) |[0m
- [0;32m| mv,padding_ch | 175951(3.9%) | 175951(3.9%) |[0m
- [0;32m| mv,upsample | 125316(2.8%) | 125316(2.8%) |[0m
- [0;32m| mv,padding | 21678(0.5%) | 21678(0.5%) |[0m
- [0;32m| revert_split | 229(0.0%) | 229(0.0%) |[0m
- [0;32m| EU | work_cyc | tot_cyc | ratio | fps | fps_bnd |[0m
- [0;32m| conv-1core | 6977494 | 13425465 | 51.0% | 59.590 | 114.650 |[0m
- [0;32m| teng | 11685635 | 13425465 | 87.0% | 59.590 | 68.460 |[0m
- [0;32m| breakdown of cmds_num for each op | cmds_num | percentage |[0m
- [0;32m| mv,affine,unpack_lsb | 1478 | 28.63% |[0m
- [0;32m| weight0_mode,mode23 | 1394 | 27.00% |[0m
- [0;32m| weight0_mode,mode23,nopad | 398 | 7.71% |[0m
- [0;32m| weight0_mode,convNxM,mode23,nopad | 328 | 6.35% |[0m
- [0;32m| pool,weight0_mode,mode20,conv_align,subtensor | 288 | 5.58% |[0m
- [0;32m| weight0_mode,mode20 | 220 | 4.26% |[0m
- [0;32m| mv,subtensor | 211 | 4.09% |[0m
- [0;32m| weight0_mode,convNxM,mode20,nopad | 144 | 2.79% |[0m
- [0;32m| revert_split | 138 | 2.67% |[0m
- [0;32m| weight0_mode,convNxM,mode26,nopad | 132 | 2.56% |[0m
- [0;32m| mv,concat_c | 99 | 1.92% |[0m
- [0;32m| pool,weight0_mode,mode20,subtensor | 96 | 1.86% |[0m
- [0;32m| weight0_mode,mode20,nopad | 94 | 1.82% |[0m
- [0;32m| mv,upsample | 49 | 0.95% |[0m
- [0;32m| mv,padding_ch | 47 | 0.91% |[0m
- [0;32m| mv_patch | 30 | 0.58% |[0m
- [0;32m| yuv42xto444,yuv2bgr0 | 11 | 0.21% |[0m
- [0;32m| mv,padding | 6 | 0.12% |[0m
- [0;32m| total_num | 5163 | 100% |[0m
- [34m07:49:19 [I]final_check: FINAL_CHECK: output op_1119 check successed![0m
- [34m07:49:19 [I]final_check: FINAL_CHECK: output op_1120 check successed![0m
- [34m07:49:19 [I]final_check: FINAL_CHECK: output op_1121 check successed![0m
- [34m07:49:19 [I]final_check: FINAL_CHECK: output op_1500 check successed![0m
- [34m07:49:19 [I]final_check: FINAL_CHECK: output op_1502 check successed![0m
- [34m07:49:19 [I]final_check: FINAL_CHECK: output op_1504 check successed![0m
|