iswaalex commited on
Commit
d5c9c7a
·
verified ·
1 Parent(s): c8ca13d

Add files using upload-large-folder tool

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_3/lcp/0_3_119.bin +3 -0
  2. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_3/lcp/0_3_12.bin +3 -0
  3. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_3/lcp/0_3_120.bin +3 -0
  4. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_3/lcp/0_3_121.bin +3 -0
  5. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_3/lcp/0_3_122.bin +3 -0
  6. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_3/lcp/0_3_123.bin +3 -0
  7. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_3/lcp/0_3_124.bin +3 -0
  8. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_3/lcp/0_3_125.bin +3 -0
  9. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_3/lcp/0_3_126.bin +3 -0
  10. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_3/lcp/0_3_127.bin +3 -0
  11. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_3/lcp/0_3_128.bin +3 -0
  12. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_3/lcp/0_3_129.bin +3 -0
  13. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_3/lcp/0_3_13.bin +3 -0
  14. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_3/lcp/0_3_130.bin +3 -0
  15. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_3/lcp/0_3_133.bin +3 -0
  16. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_3/lcp/0_3_134.bin +3 -0
  17. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/ir/Makefile +34 -0
  18. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/ir/i802_wrap_resize_adf_wrapper.cpp +3 -0
  19. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/ir/i802_wrap_resize_adf_wrapper_analysis.json +0 -0
  20. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/ir/i802_wrap_resize_adf_wrapper_dependence_guidance.json +1607 -0
  21. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/ir/i802_wrap_resize_adf_wrapper_results.json +640 -0
  22. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/ir/i802_wrap_resize_adf_wrapper_spec.json +50 -0
  23. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/ir/i852_wrap_slice_adf_wrapper.cpp +3 -0
  24. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/ir/i852_wrap_slice_adf_wrapper_analysis.json +435 -0
  25. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/ir/i852_wrap_slice_adf_wrapper_dependence_guidance.json +403 -0
  26. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/ir/i852_wrap_slice_adf_wrapper_results.json +331 -0
  27. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/ir/i852_wrap_slice_adf_wrapper_spec.json +114 -0
  28. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/ir/i897_wrap_concat_adf_wrapper.cpp +3 -0
  29. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/ir/i897_wrap_concat_adf_wrapper_analysis.json +278 -0
  30. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/ir/i897_wrap_concat_adf_wrapper_dependence_guidance.json +158 -0
  31. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/ir/i897_wrap_concat_adf_wrapper_results.json +176 -0
  32. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/ir/i897_wrap_concat_adf_wrapper_spec.json +66 -0
  33. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/ir/pm_reload_analysis0_guidance.json +90 -0
  34. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/pm_reload_analysis0/Release/pm_reload_analysis0.# +2 -0
  35. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/pm_reload_analysis0/Release/pm_reload_analysis0.## +2 -0
  36. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/pm_reload_analysis0/Release/pm_reload_analysis0.calltree +186 -0
  37. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/pm_reload_analysis0/Release/pm_reload_analysis0.cmic2 +0 -0
  38. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/pm_reload_analysis0/Release/pm_reload_analysis0.cmico +1 -0
  39. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/pm_reload_analysis0/Release/pm_reload_analysis0.lst +0 -0
  40. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/pm_reload_analysis0/Release/pm_reload_analysis0.map +568 -0
  41. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/pm_reload_analysis0/Release/pm_reload_analysis0.o.lst +0 -0
  42. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/pm_reload_analysis0/Release/pm_reload_analysis0.sdr +164 -0
  43. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/pm_reload_analysis0/Release/pm_reload_analysis0.srv +0 -0
  44. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/pm_reload_analysis0/pm_reload_analysis0.log +0 -0
  45. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/pm_reload_analysis0/scripts/pm_reload_analysis0.bcf +11 -0
  46. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/pm_reload_analysis0/scripts/pm_reload_analysis0.prx +13 -0
  47. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/pm_reload_analysis0/src/pm_reload_analysis0.cc +131 -0
  48. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/pm_reload_analysis0/timestamped_log/pm_reload_analysis0.log +0 -0
  49. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/pm_reload_analysis0/xlopt.log +623 -0
  50. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/ps/c_rts/aie_control.cpp +293 -0
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_3/lcp/0_3_119.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b1d9a436fa9741688edb3f6df0e6d9b825832bedf41161bd734fe165d752a83d
3
+ size 296
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_3/lcp/0_3_12.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:10d2066bccb121517c6b4d28200bc0597bc7bbf83f16edd1a4319af9aed0028e
3
+ size 384
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_3/lcp/0_3_120.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:478d081156bfda6633592671c628bbafad86a6610dd3b13d0377d30ab15f7038
3
+ size 384
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_3/lcp/0_3_121.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:123e30415aba5df1803a236518436c196433223de867d613b5d677d22ffbab9a
3
+ size 384
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_3/lcp/0_3_122.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e9cb44904cddab76168851801794dd62149f3293c61d89d395516def1168b6d3
3
+ size 296
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_3/lcp/0_3_123.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:51a5d087b214a6996037451e928946277a3639f64111929703839fc43a79addb
3
+ size 296
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_3/lcp/0_3_124.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d5a73e4da4d2bed15b96c8157fb7e388578bdff5031935c95c316ccf8ac954b6
3
+ size 296
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_3/lcp/0_3_125.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f619e69fde91b471157ec9c346b4db36e4e60abab07a18bd4603d963745bf305
3
+ size 376
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_3/lcp/0_3_126.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:26ea9bb127fbe20d90c3b632cbb2518f492b1ed7feefebc9b04a2c360b570c36
3
+ size 756
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_3/lcp/0_3_127.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:403a029188e743f7f1814a2d4703915229d5918c8dff3a3659c4bf467f7374da
3
+ size 384
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_3/lcp/0_3_128.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:20f981486199a1fd39c8e1b9bc35f9e94cfc370e6f9118356c998a6a65b627a5
3
+ size 296
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_3/lcp/0_3_129.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4397744f8a9cfc47351c46cb8af4fb81bb0b7ae8c0344bb48c0ec79b652a662d
3
+ size 296
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_3/lcp/0_3_13.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f8f934e3c8eff7f247501faf863a7a5eb40acf737e1e2c4aa6d334bbd3df3810
3
+ size 384
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_3/lcp/0_3_130.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c3bdc639c33344b53f4bca60e29da64d4c1b477a8cf6c9a830b7c6fb40e96e85
3
+ size 296
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_3/lcp/0_3_133.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:20f981486199a1fd39c8e1b9bc35f9e94cfc370e6f9118356c998a6a65b627a5
3
+ size 296
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_3/lcp/0_3_134.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4397744f8a9cfc47351c46cb8af4fb81bb0b7ae8c0344bb48c0ec79b652a662d
3
+ size 296
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/ir/Makefile ADDED
@@ -0,0 +1,34 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ .PHONY: all i719_wrap_transpose4d_adf_wrapper.rule i802_wrap_resize_adf_wrapper.rule i852_wrap_slice_adf_wrapper.rule i897_wrap_concat_adf_wrapper.rule i1009_wrap_resize_adf_wrapper.rule i1100_superkernels.rule clean
2
+
3
+ ifeq ($(XILINX_VITIS_AIETOOLS),)
4
+ XILINX_VITIS_AIETOOLS:=${XILINX_VITIS}/aietools
5
+ endif
6
+ ifeq ($(CARDANO_AIE_ARCH_MODEL_DIR),)
7
+ CARDANO_AIE_ARCH_MODEL_DIR := ${XILINX_VITIS_AIETOOLS}/data/aie2p/lib
8
+ endif
9
+ XCHESSCC := xchesscc -aiearch aie2p
10
+
11
+ INCLUDE_PATH := -I ../../.. -I ${XILINX_VITIS_AIETOOLS}/include -I /app/vaiml_1.3_examples/camo/segmentation_1_4_0_fp32_combined/vaiml_par_0/0/backend -I /usr/local/lib/python3.10/dist-packages/include/aie_api -I /usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/common -I /usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/include/common -I /usr/local/lib/python3.10/dist-packages/vitis_mllib -I /usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/misc -I /usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/src/ml_adf -I ${CARDANO_AIE_ARCH_MODEL_DIR}/runtime_cxx/libcxx-lite/include -I ${CARDANO_AIE_ARCH_MODEL_DIR}/runtime_cxx/libs/libcxx-9.0.0/include-lite -I ${CARDANO_AIE_ARCH_MODEL_DIR}/runtime/include
12
+
13
+ all: i719_wrap_transpose4d_adf_wrapper.rule i802_wrap_resize_adf_wrapper.rule i852_wrap_slice_adf_wrapper.rule i897_wrap_concat_adf_wrapper.rule i1009_wrap_resize_adf_wrapper.rule i1100_superkernels.rule
14
+
15
+ i719_wrap_transpose4d_adf_wrapper.rule:
16
+ ${XCHESSCC} +f +s -p me -P ${CARDANO_AIE_ARCH_MODEL_DIR} +Wllvm,-O2,-fno-jump-tables,-fno-discard-value-names,-Xclang,-chess-only-info-critical-passes,-g -D__AIENGINE__ -D__AIE_ARCH__=21 -D__LOCK_FENCE_MODE__=0 -D__IO_BUFFER_FORCE_LIGHT_WEIGHT__ -DAIE_API_EMULATE_BFLOAT16_MMUL_WITH_BFP16=1 -DAIE_OPTION_SCALAR_FLOAT_ON_VECTOR ${INCLUDE_PATH} /app/vaiml_1.3_examples/camo/segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/ir/i719_wrap_transpose4d_adf_wrapper.cpp -o i719_wrap_transpose4d_adf_wrapper.ll
17
+
18
+ i802_wrap_resize_adf_wrapper.rule:
19
+ ${XCHESSCC} +f +s -p me -P ${CARDANO_AIE_ARCH_MODEL_DIR} +Wllvm,-O2,-fno-jump-tables,-fno-discard-value-names,-Xclang,-chess-only-info-critical-passes,-g -D__AIENGINE__ -D__AIE_ARCH__=21 -D__LOCK_FENCE_MODE__=0 -D__IO_BUFFER_FORCE_LIGHT_WEIGHT__ -DAIE_API_EMULATE_BFLOAT16_MMUL_WITH_BFP16=1 -DAIE_OPTION_SCALAR_FLOAT_ON_VECTOR ${INCLUDE_PATH} /app/vaiml_1.3_examples/camo/segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/ir/i802_wrap_resize_adf_wrapper.cpp -o i802_wrap_resize_adf_wrapper.ll
20
+
21
+ i852_wrap_slice_adf_wrapper.rule:
22
+ ${XCHESSCC} +f +s -p me -P ${CARDANO_AIE_ARCH_MODEL_DIR} +Wllvm,-O2,-fno-jump-tables,-fno-discard-value-names,-Xclang,-chess-only-info-critical-passes,-g -D__AIENGINE__ -D__AIE_ARCH__=21 -D__LOCK_FENCE_MODE__=0 -D__IO_BUFFER_FORCE_LIGHT_WEIGHT__ -DAIE_API_EMULATE_BFLOAT16_MMUL_WITH_BFP16=1 -DAIE_OPTION_SCALAR_FLOAT_ON_VECTOR ${INCLUDE_PATH} /app/vaiml_1.3_examples/camo/segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/ir/i852_wrap_slice_adf_wrapper.cpp -o i852_wrap_slice_adf_wrapper.ll
23
+
24
+ i897_wrap_concat_adf_wrapper.rule:
25
+ ${XCHESSCC} +f +s -p me -P ${CARDANO_AIE_ARCH_MODEL_DIR} +Wllvm,-O2,-fno-jump-tables,-fno-discard-value-names,-Xclang,-chess-only-info-critical-passes,-g -D__AIENGINE__ -D__AIE_ARCH__=21 -D__LOCK_FENCE_MODE__=0 -D__IO_BUFFER_FORCE_LIGHT_WEIGHT__ -DAIE_API_EMULATE_BFLOAT16_MMUL_WITH_BFP16=1 -DAIE_OPTION_SCALAR_FLOAT_ON_VECTOR ${INCLUDE_PATH} /app/vaiml_1.3_examples/camo/segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/ir/i897_wrap_concat_adf_wrapper.cpp -o i897_wrap_concat_adf_wrapper.ll
26
+
27
+ i1009_wrap_resize_adf_wrapper.rule:
28
+ ${XCHESSCC} +f +s -p me -P ${CARDANO_AIE_ARCH_MODEL_DIR} +Wllvm,-O2,-fno-jump-tables,-fno-discard-value-names,-Xclang,-chess-only-info-critical-passes,-g -D__AIENGINE__ -D__AIE_ARCH__=21 -D__LOCK_FENCE_MODE__=0 -D__IO_BUFFER_FORCE_LIGHT_WEIGHT__ -DAIE_API_EMULATE_BFLOAT16_MMUL_WITH_BFP16=1 -DAIE_OPTION_SCALAR_FLOAT_ON_VECTOR ${INCLUDE_PATH} /app/vaiml_1.3_examples/camo/segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/ir/i1009_wrap_resize_adf_wrapper.cpp -o i1009_wrap_resize_adf_wrapper.ll
29
+
30
+ i1100_superkernels.rule:
31
+ ${XCHESSCC} +f +s -p me -P ${CARDANO_AIE_ARCH_MODEL_DIR} +Wllvm,-O2,-fno-jump-tables,-fno-discard-value-names,-Xclang,-chess-only-info-critical-passes,-g -D__AIENGINE__ -D__AIE_ARCH__=21 -D__LOCK_FENCE_MODE__=0 -D__IO_BUFFER_FORCE_LIGHT_WEIGHT__ -DAIE_API_EMULATE_BFLOAT16_MMUL_WITH_BFP16=1 -DAIE_OPTION_SCALAR_FLOAT_ON_VECTOR ${INCLUDE_PATH} /app/vaiml_1.3_examples/camo/segmentation_1_4_0_fp32_combined/vaiml_par_0/0/backend/superkernels.cpp -o i1100_superkernels.ll
32
+
33
+ clean:
34
+ rm -rf i719_wrap_transpose4d_adf_wrapper.ll i802_wrap_resize_adf_wrapper.ll i852_wrap_slice_adf_wrapper.ll i897_wrap_concat_adf_wrapper.ll i1009_wrap_resize_adf_wrapper.ll i1100_superkernels.ll
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/ir/i802_wrap_resize_adf_wrapper.cpp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ #include "/usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/src/ml_adf/resize_adf_wrapper.cpp"
2
+ template void mllib_graphs::resize_adf_wrapper<bfloat16, adf::io_buffer_config<adf::extents<>>, adf::io_buffer_config<adf::extents<>>, 1, 0, 0>(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict,adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>>> &__restrict,const unsigned int (&)[16]);
3
+
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/ir/i802_wrap_resize_adf_wrapper_analysis.json ADDED
The diff for this file is too large to render. See raw diff
 
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/ir/i802_wrap_resize_adf_wrapper_dependence_guidance.json ADDED
@@ -0,0 +1,1607 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "DependenceAnalysisHints": [
3
+ {
4
+ "FunctionName": "void mllib_graphs::resize_adf_wrapper<bfloat16, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> >, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> >, 1, 0, 0>(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> > >&, adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> > >&, unsigned int const (&) [16])",
5
+ "Var1": "src_ptr",
6
+ "ArgIndex1": "NotArgIndex",
7
+ "Var2": "arrayidx",
8
+ "ArgIndex2": "NotArgIndex"
9
+ },
10
+ {
11
+ "FunctionName": "void mllib_graphs::resize_adf_wrapper<bfloat16, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> >, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> >, 1, 0, 0>(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> > >&, adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> > >&, unsigned int const (&) [16])",
12
+ "Var1": "i",
13
+ "ArgIndex1": "NotArgIndex",
14
+ "Var2": "arrayidx",
15
+ "ArgIndex2": "NotArgIndex"
16
+ },
17
+ {
18
+ "FunctionName": "void mllib_graphs::resize_adf_wrapper<bfloat16, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> >, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> >, 1, 0, 0>(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> > >&, adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> > >&, unsigned int const (&) [16])",
19
+ "Var1": "layer_params.addr",
20
+ "ArgIndex1": "1",
21
+ "Var2": "arrayidx10",
22
+ "ArgIndex2": "NotArgIndex"
23
+ },
24
+ {
25
+ "FunctionName": "void mllib_graphs::resize_adf_wrapper<bfloat16, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> >, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> >, 1, 0, 0>(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> > >&, adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> > >&, unsigned int const (&) [16])",
26
+ "Var1": "layer_params.addr",
27
+ "ArgIndex1": "1",
28
+ "Var2": "arrayidx33",
29
+ "ArgIndex2": "NotArgIndex"
30
+ },
31
+ {
32
+ "FunctionName": "_Z15resize_bilinearI8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_aS0_EEvPS1_S2_R29resize_common_internal_params",
33
+ "Var1": "param.addr",
34
+ "ArgIndex1": "1",
35
+ "Var2": "kernel_ofm_width",
36
+ "ArgIndex2": "NotArgIndex"
37
+ },
38
+ {
39
+ "FunctionName": "_Z15resize_bilinearI8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_aS0_EEvPS1_S2_R29resize_common_internal_params",
40
+ "Var1": "param.addr",
41
+ "ArgIndex1": "1",
42
+ "Var2": "kernel_ofm_height",
43
+ "ArgIndex2": "NotArgIndex"
44
+ },
45
+ {
46
+ "FunctionName": "_Z15resize_bilinearI8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_aS0_EEvPS1_S2_R29resize_common_internal_params",
47
+ "Var1": "param.addr",
48
+ "ArgIndex1": "1",
49
+ "Var2": "step_w7",
50
+ "ArgIndex2": "NotArgIndex"
51
+ },
52
+ {
53
+ "FunctionName": "_Z15resize_bilinearI8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_aS0_EEvPS1_S2_R29resize_common_internal_params",
54
+ "Var1": "param.addr",
55
+ "ArgIndex1": "1",
56
+ "Var2": "step_h8",
57
+ "ArgIndex2": "NotArgIndex"
58
+ },
59
+ {
60
+ "FunctionName": "_Z15resize_bilinearI8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_aS0_EEvPS1_S2_R29resize_common_internal_params",
61
+ "Var1": "param.addr",
62
+ "ArgIndex1": "1",
63
+ "Var2": "offset_scale_height",
64
+ "ArgIndex2": "NotArgIndex"
65
+ },
66
+ {
67
+ "FunctionName": "_Z15resize_bilinearI8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_aS0_EEvPS1_S2_R29resize_common_internal_params",
68
+ "Var1": "param.addr",
69
+ "ArgIndex1": "1",
70
+ "Var2": "offset_scale_width",
71
+ "ArgIndex2": "NotArgIndex"
72
+ },
73
+ {
74
+ "FunctionName": "_Z15resize_bilinearI8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_aS0_EEvPS1_S2_R29resize_common_internal_params",
75
+ "Var1": "param.addr",
76
+ "ArgIndex1": "1",
77
+ "Var2": "overlay_rows",
78
+ "ArgIndex2": "NotArgIndex"
79
+ },
80
+ {
81
+ "FunctionName": "_Z15resize_bilinearI8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_aS0_EEvPS1_S2_R29resize_common_internal_params",
82
+ "Var1": "param.addr",
83
+ "ArgIndex1": "1",
84
+ "Var2": "kernel_ifm_width",
85
+ "ArgIndex2": "NotArgIndex"
86
+ },
87
+ {
88
+ "FunctionName": "_Z15resize_bilinearI8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_aS0_EEvPS1_S2_R29resize_common_internal_params",
89
+ "Var1": "param.addr",
90
+ "ArgIndex1": "1",
91
+ "Var2": "offset_idx_out_height12",
92
+ "ArgIndex2": "NotArgIndex"
93
+ },
94
+ {
95
+ "FunctionName": "_Z15resize_bilinearI8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_aS0_EEvPS1_S2_R29resize_common_internal_params",
96
+ "Var1": "param.addr",
97
+ "ArgIndex1": "1",
98
+ "Var2": "offset_idx_out_width14",
99
+ "ArgIndex2": "NotArgIndex"
100
+ },
101
+ {
102
+ "FunctionName": "_Z15resize_bilinearI8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_aS0_EEvPS1_S2_R29resize_common_internal_params",
103
+ "Var1": "param.addr",
104
+ "ArgIndex1": "1",
105
+ "Var2": "offset_idx_in_height16",
106
+ "ArgIndex2": "NotArgIndex"
107
+ },
108
+ {
109
+ "FunctionName": "_Z15resize_bilinearI8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_aS0_EEvPS1_S2_R29resize_common_internal_params",
110
+ "Var1": "param.addr",
111
+ "ArgIndex1": "1",
112
+ "Var2": "offset_idx_in_width19",
113
+ "ArgIndex2": "NotArgIndex"
114
+ },
115
+ {
116
+ "FunctionName": "_Z15resize_bilinearI8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_aS0_EEvPS1_S2_R29resize_common_internal_params",
117
+ "Var1": "param.addr",
118
+ "ArgIndex1": "1",
119
+ "Var2": "kernel_ofm_width23",
120
+ "ArgIndex2": "NotArgIndex"
121
+ },
122
+ {
123
+ "FunctionName": "_Z15resize_bilinearI8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_aS0_EEvPS1_S2_R29resize_common_internal_params",
124
+ "Var1": "param.addr",
125
+ "ArgIndex1": "1",
126
+ "Var2": "kernel_ofm_height26",
127
+ "ArgIndex2": "NotArgIndex"
128
+ },
129
+ {
130
+ "FunctionName": "_Z15resize_bilinearI8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_aS0_EEvPS1_S2_R29resize_common_internal_params",
131
+ "Var1": "param.addr",
132
+ "ArgIndex1": "1",
133
+ "Var2": "total_ifm_height28",
134
+ "ArgIndex2": "NotArgIndex"
135
+ },
136
+ {
137
+ "FunctionName": "_Z15resize_bilinearI8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_aS0_EEvPS1_S2_R29resize_common_internal_params",
138
+ "Var1": "param.addr",
139
+ "ArgIndex1": "1",
140
+ "Var2": "total_ifm_width30",
141
+ "ArgIndex2": "NotArgIndex"
142
+ },
143
+ {
144
+ "FunctionName": "_Z15resize_bilinearI8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_aS0_EEvPS1_S2_R29resize_common_internal_params",
145
+ "Var1": "y_idx_vect",
146
+ "ArgIndex1": "NotArgIndex",
147
+ "Var2": "x_idx_vect",
148
+ "ArgIndex2": "NotArgIndex"
149
+ },
150
+ {
151
+ "FunctionName": "_Z15resize_bilinearI8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_aS0_EEvPS1_S2_R29resize_common_internal_params",
152
+ "Var1": "tmp",
153
+ "ArgIndex1": "NotArgIndex",
154
+ "Var2": "y_idx_vect",
155
+ "ArgIndex2": "NotArgIndex"
156
+ },
157
+ {
158
+ "FunctionName": "_Z15resize_bilinearI8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_aS0_EEvPS1_S2_R29resize_common_internal_params",
159
+ "Var1": "tmp36",
160
+ "ArgIndex1": "NotArgIndex",
161
+ "Var2": "x_idx_vect",
162
+ "ArgIndex2": "NotArgIndex"
163
+ },
164
+ {
165
+ "FunctionName": "_Z15resize_bilinearI8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_aS0_EEvPS1_S2_R29resize_common_internal_params",
166
+ "Var1": "tmp49",
167
+ "ArgIndex1": "NotArgIndex",
168
+ "Var2": "y_idx_vect",
169
+ "ArgIndex2": "NotArgIndex"
170
+ },
171
+ {
172
+ "FunctionName": "_Z15resize_bilinearI8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_aS0_EEvPS1_S2_R29resize_common_internal_params",
173
+ "Var1": "tmp50",
174
+ "ArgIndex1": "NotArgIndex",
175
+ "Var2": "y_idx_vect",
176
+ "ArgIndex2": "NotArgIndex"
177
+ },
178
+ {
179
+ "FunctionName": "_Z15resize_bilinearI8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_aS0_EEvPS1_S2_R29resize_common_internal_params",
180
+ "Var1": "tmp61",
181
+ "ArgIndex1": "NotArgIndex",
182
+ "Var2": "v_wy_bottom",
183
+ "ArgIndex2": "NotArgIndex"
184
+ },
185
+ {
186
+ "FunctionName": "_Z15resize_bilinearI8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_aS0_EEvPS1_S2_R29resize_common_internal_params",
187
+ "Var1": "tmp65",
188
+ "ArgIndex1": "NotArgIndex",
189
+ "Var2": "v_wy_top",
190
+ "ArgIndex2": "NotArgIndex"
191
+ },
192
+ {
193
+ "FunctionName": "_Z15resize_bilinearI8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_aS0_EEvPS1_S2_R29resize_common_internal_params",
194
+ "Var1": "tmp70",
195
+ "ArgIndex1": "NotArgIndex",
196
+ "Var2": "y_idx_vect",
197
+ "ArgIndex2": "NotArgIndex"
198
+ },
199
+ {
200
+ "FunctionName": "_Z15resize_bilinearI8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_aS0_EEvPS1_S2_R29resize_common_internal_params",
201
+ "Var1": "tmp71",
202
+ "ArgIndex1": "NotArgIndex",
203
+ "Var2": "y_idx_vect_d1x",
204
+ "ArgIndex2": "NotArgIndex"
205
+ },
206
+ {
207
+ "FunctionName": "_Z15resize_bilinearI8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_aS0_EEvPS1_S2_R29resize_common_internal_params",
208
+ "Var1": "tmp72",
209
+ "ArgIndex1": "NotArgIndex",
210
+ "Var2": "y_idx_vect_d1x",
211
+ "ArgIndex2": "NotArgIndex"
212
+ },
213
+ {
214
+ "FunctionName": "_Z15resize_bilinearI8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_aS0_EEvPS1_S2_R29resize_common_internal_params",
215
+ "Var1": "tmp84",
216
+ "ArgIndex1": "NotArgIndex",
217
+ "Var2": "x_idx_vect",
218
+ "ArgIndex2": "NotArgIndex"
219
+ },
220
+ {
221
+ "FunctionName": "_Z15resize_bilinearI8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_aS0_EEvPS1_S2_R29resize_common_internal_params",
222
+ "Var1": "tmp85",
223
+ "ArgIndex1": "NotArgIndex",
224
+ "Var2": "x_idx_vect",
225
+ "ArgIndex2": "NotArgIndex"
226
+ },
227
+ {
228
+ "FunctionName": "_Z15resize_bilinearI8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_aS0_EEvPS1_S2_R29resize_common_internal_params",
229
+ "Var1": "tmp96",
230
+ "ArgIndex1": "NotArgIndex",
231
+ "Var2": "v_wx_right",
232
+ "ArgIndex2": "NotArgIndex"
233
+ },
234
+ {
235
+ "FunctionName": "_Z15resize_bilinearI8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_aS0_EEvPS1_S2_R29resize_common_internal_params",
236
+ "Var1": "tmp100",
237
+ "ArgIndex1": "NotArgIndex",
238
+ "Var2": "v_wx_left",
239
+ "ArgIndex2": "NotArgIndex"
240
+ },
241
+ {
242
+ "FunctionName": "_Z15resize_bilinearI8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_aS0_EEvPS1_S2_R29resize_common_internal_params",
243
+ "Var1": "tmp105",
244
+ "ArgIndex1": "NotArgIndex",
245
+ "Var2": "x_idx_vect",
246
+ "ArgIndex2": "NotArgIndex"
247
+ },
248
+ {
249
+ "FunctionName": "_Z15resize_bilinearI8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_aS0_EEvPS1_S2_R29resize_common_internal_params",
250
+ "Var1": "tmp106",
251
+ "ArgIndex1": "NotArgIndex",
252
+ "Var2": "x_idx_vect_dx1",
253
+ "ArgIndex2": "NotArgIndex"
254
+ },
255
+ {
256
+ "FunctionName": "_Z15resize_bilinearI8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_aS0_EEvPS1_S2_R29resize_common_internal_params",
257
+ "Var1": "tmp107",
258
+ "ArgIndex1": "NotArgIndex",
259
+ "Var2": "x_idx_vect_dx1",
260
+ "ArgIndex2": "NotArgIndex"
261
+ },
262
+ {
263
+ "FunctionName": "_Z15resize_bilinearI8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_aS0_EEvPS1_S2_R29resize_common_internal_params",
264
+ "Var1": "d00_in",
265
+ "ArgIndex1": "NotArgIndex",
266
+ "Var2": "d00",
267
+ "ArgIndex2": "NotArgIndex"
268
+ },
269
+ {
270
+ "FunctionName": "_Z15resize_bilinearI8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_aS0_EEvPS1_S2_R29resize_common_internal_params",
271
+ "Var1": "d01_in",
272
+ "ArgIndex1": "NotArgIndex",
273
+ "Var2": "d01",
274
+ "ArgIndex2": "NotArgIndex"
275
+ },
276
+ {
277
+ "FunctionName": "_Z15resize_bilinearI8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_aS0_EEvPS1_S2_R29resize_common_internal_params",
278
+ "Var1": "d10_in",
279
+ "ArgIndex1": "NotArgIndex",
280
+ "Var2": "d10",
281
+ "ArgIndex2": "NotArgIndex"
282
+ },
283
+ {
284
+ "FunctionName": "_Z15resize_bilinearI8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_aS0_EEvPS1_S2_R29resize_common_internal_params",
285
+ "Var1": "d11_in",
286
+ "ArgIndex1": "NotArgIndex",
287
+ "Var2": "d11",
288
+ "ArgIndex2": "NotArgIndex"
289
+ },
290
+ {
291
+ "FunctionName": "_Z15resize_bilinearI8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_aS0_EEvPS1_S2_R29resize_common_internal_params",
292
+ "Var1": "tmp162",
293
+ "ArgIndex1": "NotArgIndex",
294
+ "Var2": "temp_acc_d00",
295
+ "ArgIndex2": "NotArgIndex"
296
+ },
297
+ {
298
+ "FunctionName": "_Z15resize_bilinearI8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_aS0_EEvPS1_S2_R29resize_common_internal_params",
299
+ "Var1": "tmp164",
300
+ "ArgIndex1": "NotArgIndex",
301
+ "Var2": "temp_acc_d01",
302
+ "ArgIndex2": "NotArgIndex"
303
+ },
304
+ {
305
+ "FunctionName": "_Z15resize_bilinearI8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_aS0_EEvPS1_S2_R29resize_common_internal_params",
306
+ "Var1": "tmp166",
307
+ "ArgIndex1": "NotArgIndex",
308
+ "Var2": "temp_acc_d10",
309
+ "ArgIndex2": "NotArgIndex"
310
+ },
311
+ {
312
+ "FunctionName": "_Z15resize_bilinearI8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_aS0_EEvPS1_S2_R29resize_common_internal_params",
313
+ "Var1": "tmp168",
314
+ "ArgIndex1": "NotArgIndex",
315
+ "Var2": "temp_acc_d11",
316
+ "ArgIndex2": "NotArgIndex"
317
+ },
318
+ {
319
+ "FunctionName": "_Z15resize_bilinearI8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_aS0_EEvPS1_S2_R29resize_common_internal_params",
320
+ "Var1": "tmp170",
321
+ "ArgIndex1": "NotArgIndex",
322
+ "Var2": "temp_add_d0",
323
+ "ArgIndex2": "NotArgIndex"
324
+ },
325
+ {
326
+ "FunctionName": "_Z15resize_bilinearI8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_aS0_EEvPS1_S2_R29resize_common_internal_params",
327
+ "Var1": "tmp172",
328
+ "ArgIndex1": "NotArgIndex",
329
+ "Var2": "temp_add_d1",
330
+ "ArgIndex2": "NotArgIndex"
331
+ },
332
+ {
333
+ "FunctionName": "_Z15resize_bilinearI8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_aS0_EEvPS1_S2_R29resize_common_internal_params",
334
+ "Var1": "tmp174",
335
+ "ArgIndex1": "NotArgIndex",
336
+ "Var2": "temp_add_dt",
337
+ "ArgIndex2": "NotArgIndex"
338
+ },
339
+ {
340
+ "FunctionName": "_Z15resize_bilinearI8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_aS0_EEvPS1_S2_R29resize_common_internal_params",
341
+ "Var1": "tmp178",
342
+ "ArgIndex1": "NotArgIndex",
343
+ "Var2": "temp_add_db",
344
+ "ArgIndex2": "NotArgIndex"
345
+ },
346
+ {
347
+ "FunctionName": "_Z15resize_bilinearI8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_aS0_EEvPS1_S2_R29resize_common_internal_params",
348
+ "Var1": "tmp182",
349
+ "ArgIndex1": "NotArgIndex",
350
+ "Var2": "temp_add_v",
351
+ "ArgIndex2": "NotArgIndex"
352
+ },
353
+ {
354
+ "FunctionName": "_Z15resize_bilinearI8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_aS0_EEvPS1_S2_R29resize_common_internal_params",
355
+ "Var1": "dst_out",
356
+ "ArgIndex1": "NotArgIndex",
357
+ "Var2": "dst_v",
358
+ "ArgIndex2": "NotArgIndex"
359
+ },
360
+ {
361
+ "FunctionName": "set_satmode(unsigned int)",
362
+ "Var1": "tmp",
363
+ "ArgIndex1": "NotArgIndex",
364
+ "Var2": "_ZN12me_primitive11control_satE",
365
+ "ArgIndex2": "NotArgIndex"
366
+ },
367
+ {
368
+ "FunctionName": "set_rnd(unsigned int)",
369
+ "Var1": "tmp",
370
+ "ArgIndex1": "NotArgIndex",
371
+ "Var2": "_ZN12me_primitive11control_rndE",
372
+ "ArgIndex2": "NotArgIndex"
373
+ },
374
+ {
375
+ "FunctionName": "aie::vector_elem_ref<int, 32u>::operator=(int const&)",
376
+ "Var1": "this.addr",
377
+ "ArgIndex1": "0",
378
+ "Var2": "offset",
379
+ "ArgIndex2": "NotArgIndex"
380
+ },
381
+ {
382
+ "FunctionName": "aie::vector_elem_ref<int, 32u>::operator=(int const&)",
383
+ "Var1": "this.addr",
384
+ "ArgIndex1": "0",
385
+ "Var2": "parent",
386
+ "ArgIndex2": "NotArgIndex"
387
+ },
388
+ {
389
+ "FunctionName": "v32accfloat::v32accfloat(v32float)",
390
+ "Var1": "tmp",
391
+ "ArgIndex1": "NotArgIndex",
392
+ "Var2": "this1",
393
+ "ArgIndex2": "0"
394
+ },
395
+ {
396
+ "FunctionName": "_ZN3aiemiINS_15vector_elem_refIiLj32EEEiQoosr6detailE20is_vector_elem_ref_vIT_Esr6detailE20is_vector_elem_ref_vIT0_EEEDaS3_S4_",
397
+ "Var1": "v1",
398
+ "ArgIndex1": "NotArgIndex",
399
+ "Var2": "agg.tmp",
400
+ "ArgIndex2": "NotArgIndex"
401
+ },
402
+ {
403
+ "FunctionName": "aie::detail::vector_base<int, 16u>::vector_base(v16int32)",
404
+ "Var1": "data",
405
+ "ArgIndex1": "NotArgIndex",
406
+ "Var2": "data2",
407
+ "ArgIndex2": "NotArgIndex"
408
+ },
409
+ {
410
+ "FunctionName": "void aie::detail::vector_base<int, 32u>::insert_helper<16u>(unsigned int, aie::detail::vector_base<int, 16u> const&)",
411
+ "Var1": "tmp",
412
+ "ArgIndex1": "NotArgIndex",
413
+ "Var2": "call2",
414
+ "ArgIndex2": "NotArgIndex"
415
+ },
416
+ {
417
+ "FunctionName": "_ZNK3aie6detail11vector_baseIiLj16EE9to_nativeEvQleclL_ZNS0_11vector_base4bitsEvEELi1024E",
418
+ "Var1": "this.addr",
419
+ "ArgIndex1": "0",
420
+ "Var2": "data",
421
+ "ArgIndex2": "NotArgIndex"
422
+ },
423
+ {
424
+ "FunctionName": "aie::unary_op_common<aie::vector<int, 32u>, (aie::Operation)0>::parent1() const",
425
+ "Var1": "this.addr",
426
+ "ArgIndex1": "0",
427
+ "Var2": "parent_",
428
+ "ArgIndex2": "NotArgIndex"
429
+ },
430
+ {
431
+ "FunctionName": "aie::unary_op_common<aie::vector<int, 32u>, (aie::Operation)0>::parent1() const",
432
+ "Var1": "parent_",
433
+ "ArgIndex1": "NotArgIndex",
434
+ "Var2": "agg.result",
435
+ "ArgIndex2": "0"
436
+ },
437
+ {
438
+ "FunctionName": "aie::detail::elementary_vector_bits_impl<(aie::detail::ElementaryOp)7, 32u, float, int, 32u>::run(aie::vector<int, 32u> const&, int, bool)",
439
+ "Var1": "tmp20",
440
+ "ArgIndex1": "NotArgIndex",
441
+ "Var2": "vint_h",
442
+ "ArgIndex2": "0"
443
+ },
444
+ {
445
+ "FunctionName": "aie::detail::elementary_vector_bits_impl<(aie::detail::ElementaryOp)7, 32u, float, int, 32u>::run(aie::vector<int, 32u> const&, int, bool)",
446
+ "Var1": "tmp24",
447
+ "ArgIndex1": "NotArgIndex",
448
+ "Var2": "vint_l",
449
+ "ArgIndex2": "0"
450
+ },
451
+ {
452
+ "FunctionName": "aie::detail::elementary_vector_bits_impl<(aie::detail::ElementaryOp)7, 32u, float, int, 32u>::run(aie::vector<int, 32u> const&, int, bool)",
453
+ "Var1": "tmp28",
454
+ "ArgIndex1": "NotArgIndex",
455
+ "Var2": "tmp",
456
+ "ArgIndex2": "NotArgIndex"
457
+ },
458
+ {
459
+ "FunctionName": "aie::detail::elementary_vector_bits_impl<(aie::detail::ElementaryOp)7, 32u, float, int, 32u>::run(aie::vector<int, 32u> const&, int, bool)",
460
+ "Var1": "tmp32",
461
+ "ArgIndex1": "NotArgIndex",
462
+ "Var2": "vfp",
463
+ "ArgIndex2": "0"
464
+ },
465
+ {
466
+ "FunctionName": "aie::detail::elementary_vector_bits_impl<(aie::detail::ElementaryOp)7, 32u, float, int, 32u>::run(aie::vector<int, 32u> const&, int, bool)",
467
+ "Var1": "tmp36",
468
+ "ArgIndex1": "NotArgIndex",
469
+ "Var2": "vfp",
470
+ "ArgIndex2": "0"
471
+ },
472
+ {
473
+ "FunctionName": "aie::detail::vector_base<short, 32u>::vector_base(v32int16)",
474
+ "Var1": "data",
475
+ "ArgIndex1": "NotArgIndex",
476
+ "Var2": "data2",
477
+ "ArgIndex2": "NotArgIndex"
478
+ },
479
+ {
480
+ "FunctionName": "aie::detail::vector_base<bfloat16, 32u>::vector_base(v32bfloat16)",
481
+ "Var1": "data",
482
+ "ArgIndex1": "NotArgIndex",
483
+ "Var2": "data2",
484
+ "ArgIndex2": "NotArgIndex"
485
+ },
486
+ {
487
+ "FunctionName": "v32bfloat16::v32bfloat16(v32int16)",
488
+ "Var1": "tmp",
489
+ "ArgIndex1": "NotArgIndex",
490
+ "Var2": "this1",
491
+ "ArgIndex2": "0"
492
+ },
493
+ {
494
+ "FunctionName": "v32bfloat16::v32bfloat16(chessllvmInternal, v128int4)",
495
+ "Var1": "aw",
496
+ "ArgIndex1": "NotArgIndex",
497
+ "Var2": "mw",
498
+ "ArgIndex2": "NotArgIndex"
499
+ },
500
+ {
501
+ "FunctionName": "void aie::detail::accum_base<(aie::detail::AccumClass)2, 32u, 32u>::from_vector_sign<bfloat16>(aie::vector<bfloat16, 32u> const&, bool, int)",
502
+ "Var1": "tmp",
503
+ "ArgIndex1": "NotArgIndex",
504
+ "Var2": "data",
505
+ "ArgIndex2": "NotArgIndex"
506
+ },
507
+ {
508
+ "FunctionName": "aie::detail::accum_base<(aie::detail::AccumClass)2, 32u, 32u>::operator v32accfloat() const",
509
+ "Var1": "this.addr",
510
+ "ArgIndex1": "0",
511
+ "Var2": "data",
512
+ "ArgIndex2": "NotArgIndex"
513
+ },
514
+ {
515
+ "FunctionName": "_ZNK3aie6detail11vector_baseI8bfloat16Lj32EE9to_nativeEvQleclL_ZNS0_11vector_base4bitsEvEELi1024E",
516
+ "Var1": "this.addr",
517
+ "ArgIndex1": "0",
518
+ "Var2": "data",
519
+ "ArgIndex2": "NotArgIndex"
520
+ },
521
+ {
522
+ "FunctionName": "void aie::detail::accum_base<(aie::detail::AccumClass)0, 32u, 32u>::from_vector_sign<unsigned short>(aie::vector<unsigned short, 32u> const&, bool, int)",
523
+ "Var1": "tmp",
524
+ "ArgIndex1": "NotArgIndex",
525
+ "Var2": "data",
526
+ "ArgIndex2": "NotArgIndex"
527
+ },
528
+ {
529
+ "FunctionName": "aie::detail::accum_base<(aie::detail::AccumClass)0, 32u, 32u>::operator v32acc32() const",
530
+ "Var1": "this.addr",
531
+ "ArgIndex1": "0",
532
+ "Var2": "data",
533
+ "ArgIndex2": "NotArgIndex"
534
+ },
535
+ {
536
+ "FunctionName": "get_satmode()",
537
+ "Var1": "_ZN12me_primitive11control_satE",
538
+ "ArgIndex1": "NotArgIndex",
539
+ "Var2": "ref.tmp",
540
+ "ArgIndex2": "NotArgIndex"
541
+ },
542
+ {
543
+ "FunctionName": "uint2_t::operator unsigned int() const",
544
+ "Var1": "this.addr",
545
+ "ArgIndex1": "0",
546
+ "Var2": "this1",
547
+ "ArgIndex2": "0"
548
+ },
549
+ {
550
+ "FunctionName": "uint2_t::operator unsigned int() const",
551
+ "Var1": "this1",
552
+ "ArgIndex1": "0",
553
+ "Var2": "tmp",
554
+ "ArgIndex2": "NotArgIndex"
555
+ },
556
+ {
557
+ "FunctionName": "_ZNK3aie6detail11vector_baseItLj32EE9to_nativeEvQleclL_ZNS0_11vector_base4bitsEvEELi1024E",
558
+ "Var1": "this.addr",
559
+ "ArgIndex1": "0",
560
+ "Var2": "data",
561
+ "ArgIndex2": "NotArgIndex"
562
+ },
563
+ {
564
+ "FunctionName": "aie::detail::filter_bits_impl_common<16u, unsigned short, 64u, (aie::detail::FilterOp)2>::run(aie::vector<unsigned short, 64u> const&, aie::detail::filter_mode<16u, 64u> const&)",
565
+ "Var1": "filter.addr",
566
+ "ArgIndex1": "0",
567
+ "Var2": "mode",
568
+ "ArgIndex2": "NotArgIndex"
569
+ },
570
+ {
571
+ "FunctionName": "aie::detail::shuffle_mode<16u, 64u>::high() const",
572
+ "Var1": "this.addr",
573
+ "ArgIndex1": "0",
574
+ "Var2": "mode",
575
+ "ArgIndex2": "NotArgIndex"
576
+ },
577
+ {
578
+ "FunctionName": "aie::detail::vector_base<unsigned short, 32u>::vector_base(v32uint16)",
579
+ "Var1": "data",
580
+ "ArgIndex1": "NotArgIndex",
581
+ "Var2": "data2",
582
+ "ArgIndex2": "NotArgIndex"
583
+ },
584
+ {
585
+ "FunctionName": "v32uint16::v32uint16(v16int32)",
586
+ "Var1": "tmp",
587
+ "ArgIndex1": "NotArgIndex",
588
+ "Var2": "this1",
589
+ "ArgIndex2": "0"
590
+ },
591
+ {
592
+ "FunctionName": "v32uint16::v32uint16(chessllvmInternal, v128int4)",
593
+ "Var1": "aw",
594
+ "ArgIndex1": "NotArgIndex",
595
+ "Var2": "mw",
596
+ "ArgIndex2": "NotArgIndex"
597
+ },
598
+ {
599
+ "FunctionName": "aie::detail::shuffle_mode<16u, 64u>::low() const",
600
+ "Var1": "this.addr",
601
+ "ArgIndex1": "0",
602
+ "Var2": "mode",
603
+ "ArgIndex2": "NotArgIndex"
604
+ },
605
+ {
606
+ "FunctionName": "aie::detail::add_sub_accum_bits_impl_common<acc32, 32u, (aie::detail::AddSubOperation)0>::run(aie::accum<acc32, 32u> const&, bool, aie::accum<acc32, 32u> const&)",
607
+ "Var1": "tmp1",
608
+ "ArgIndex1": "NotArgIndex",
609
+ "Var2": "tmp",
610
+ "ArgIndex2": "NotArgIndex"
611
+ },
612
+ {
613
+ "FunctionName": "aie::detail::accum_base<(aie::detail::AccumClass)0, 32u, 64u>::operator v64acc32() const",
614
+ "Var1": "this.addr",
615
+ "ArgIndex1": "0",
616
+ "Var2": "data",
617
+ "ArgIndex2": "NotArgIndex"
618
+ },
619
+ {
620
+ "FunctionName": "aie::detail::accum_base<(aie::detail::AccumClass)0, 32u, 64u> aie::detail::accum_base<(aie::detail::AccumClass)0, 32u, 32u>::grow<64u>() const",
621
+ "Var1": "tmp",
622
+ "ArgIndex1": "NotArgIndex",
623
+ "Var2": "data2",
624
+ "ArgIndex2": "NotArgIndex"
625
+ },
626
+ {
627
+ "FunctionName": "auto aie::detail::accum_base<(aie::detail::AccumClass)2, 32u, 32u>::cast_to<acc32>() const",
628
+ "Var1": "tmp",
629
+ "ArgIndex1": "NotArgIndex",
630
+ "Var2": "data2",
631
+ "ArgIndex2": "NotArgIndex"
632
+ },
633
+ {
634
+ "FunctionName": "v32acc32::v32acc32(v32accfloat)",
635
+ "Var1": "mw",
636
+ "ArgIndex1": "NotArgIndex",
637
+ "Var2": "this1",
638
+ "ArgIndex2": "0"
639
+ },
640
+ {
641
+ "FunctionName": "aie::detail::add_sub_accum_bits_impl<accfloat, 32u, (aie::detail::AddSubOperation)1>::run(aie::accum<accfloat, 32u> const&, bool, aie::accum<accfloat, 32u> const&)",
642
+ "Var1": "tmp1",
643
+ "ArgIndex1": "NotArgIndex",
644
+ "Var2": "tmp",
645
+ "ArgIndex2": "NotArgIndex"
646
+ },
647
+ {
648
+ "FunctionName": "uint5_t::operator unsigned int() const",
649
+ "Var1": "this.addr",
650
+ "ArgIndex1": "0",
651
+ "Var2": "this1",
652
+ "ArgIndex2": "0"
653
+ },
654
+ {
655
+ "FunctionName": "uint5_t::operator unsigned int() const",
656
+ "Var1": "this1",
657
+ "ArgIndex1": "0",
658
+ "Var2": "tmp",
659
+ "ArgIndex2": "NotArgIndex"
660
+ },
661
+ {
662
+ "FunctionName": "auto aie::detail::accum_base<(aie::detail::AccumClass)0, 32u, 32u>::cast_to<accfloat>() const",
663
+ "Var1": "tmp",
664
+ "ArgIndex1": "NotArgIndex",
665
+ "Var2": "data2",
666
+ "ArgIndex2": "NotArgIndex"
667
+ },
668
+ {
669
+ "FunctionName": "v32accfloat::v32accfloat(v32acc32)",
670
+ "Var1": "tmp",
671
+ "ArgIndex1": "NotArgIndex",
672
+ "Var2": "this1",
673
+ "ArgIndex2": "0"
674
+ },
675
+ {
676
+ "FunctionName": "v32accfloat::v32accfloat(chessllvmInternal, v32acc32)",
677
+ "Var1": "aw",
678
+ "ArgIndex1": "NotArgIndex",
679
+ "Var2": "mw",
680
+ "ArgIndex2": "NotArgIndex"
681
+ },
682
+ {
683
+ "FunctionName": "aie::detail::add_sub_accum_bits_impl<accfloat, 32u, (aie::detail::AddSubOperation)0>::run(aie::accum<accfloat, 32u> const&, bool, aie::accum<accfloat, 32u> const&)",
684
+ "Var1": "tmp1",
685
+ "ArgIndex1": "NotArgIndex",
686
+ "Var2": "tmp",
687
+ "ArgIndex2": "NotArgIndex"
688
+ },
689
+ {
690
+ "FunctionName": "aie::vector<float, 32u> aie::detail::accum_base<(aie::detail::AccumClass)2, 32u, 32u>::to_vector_sign<float>(bool, int) const",
691
+ "Var1": "tmp",
692
+ "ArgIndex1": "NotArgIndex",
693
+ "Var2": "agg.result",
694
+ "ArgIndex2": "0"
695
+ },
696
+ {
697
+ "FunctionName": "v32float::v32float(v32accfloat)",
698
+ "Var1": "tmp",
699
+ "ArgIndex1": "NotArgIndex",
700
+ "Var2": "this1",
701
+ "ArgIndex2": "0"
702
+ },
703
+ {
704
+ "FunctionName": "_ZN3aie6detail11vector_baseIfLj32EEC2ERK8v32floatQaaeqclL_ZNS0_11vector_base4bitsEvEELi1024Entsr3stdE9is_same_vINS0_18native_vector_typeIT_XT0_EE4typeENS0_14vector_storageIS8_XT0_EE4typeEE",
705
+ "Var1": "tmp",
706
+ "ArgIndex1": "NotArgIndex",
707
+ "Var2": "call3",
708
+ "ArgIndex2": "NotArgIndex"
709
+ },
710
+ {
711
+ "FunctionName": "_ZN3aie6detail11vector_baseIfLj32EEC2ERK8v32floatQaaeqclL_ZNS0_11vector_base4bitsEvEELi1024Entsr3stdE9is_same_vINS0_18native_vector_typeIT_XT0_EE4typeENS0_14vector_storageIS8_XT0_EE4typeEE",
712
+ "Var1": "tmp4",
713
+ "ArgIndex1": "NotArgIndex",
714
+ "Var2": "call7",
715
+ "ArgIndex2": "NotArgIndex"
716
+ },
717
+ {
718
+ "FunctionName": "aie::unary_op_common<aie::vector<int, 32u>, (aie::Operation)0>::unary_op_common(aie::vector<int, 32u>)",
719
+ "Var1": "parent",
720
+ "ArgIndex1": "0",
721
+ "Var2": "parent_",
722
+ "ArgIndex2": "0"
723
+ },
724
+ {
725
+ "FunctionName": "_ZN3aie3mulITkNS_17AccumElemBaseTypeE8accfloatTkNS_10VectorOrOpENS_8unary_opINS_6vectorIfLj32EEELNS_9OperationE0EEETkNS_8ElemOrOpENS2_IfLS5_0EEEQaa15is_valid_size_vIT0_T1_E17is_valid_mul_op_vINS8_10value_typeES9_EEENS_5accumIT_XclsrS8_4sizeEEEERKS8_S9_",
726
+ "Var1": "a",
727
+ "ArgIndex1": "NotArgIndex",
728
+ "Var2": "agg.tmp3",
729
+ "ArgIndex2": "NotArgIndex"
730
+ },
731
+ {
732
+ "FunctionName": "aie::unary_op_common<aie::vector<float, 32u>, (aie::Operation)0>::parent1() const",
733
+ "Var1": "this.addr",
734
+ "ArgIndex1": "0",
735
+ "Var2": "parent_",
736
+ "ArgIndex2": "NotArgIndex"
737
+ },
738
+ {
739
+ "FunctionName": "aie::unary_op_common<aie::vector<float, 32u>, (aie::Operation)0>::parent1() const",
740
+ "Var1": "parent_",
741
+ "ArgIndex1": "NotArgIndex",
742
+ "Var2": "agg.result",
743
+ "ArgIndex2": "0"
744
+ },
745
+ {
746
+ "FunctionName": "aie::unary_op_common<float, (aie::Operation)0>::parent1() const",
747
+ "Var1": "this.addr",
748
+ "ArgIndex1": "0",
749
+ "Var2": "parent_",
750
+ "ArgIndex2": "NotArgIndex"
751
+ },
752
+ {
753
+ "FunctionName": "me_detail::mul_elem_32_accuracy_safe_inner(v32float, v32float, int)",
754
+ "Var1": "dummy0",
755
+ "ArgIndex1": "NotArgIndex",
756
+ "Var2": "dummy0",
757
+ "ArgIndex2": "NotArgIndex"
758
+ },
759
+ {
760
+ "FunctionName": "me_detail::mul_elem_32_accuracy_safe_inner(v32float, v32float, int)",
761
+ "Var1": "dummy0",
762
+ "ArgIndex1": "NotArgIndex",
763
+ "Var2": "dummy0",
764
+ "ArgIndex2": "NotArgIndex"
765
+ },
766
+ {
767
+ "FunctionName": "me_detail::mul_elem_32_accuracy_safe_inner(v32float, v32float, int)",
768
+ "Var1": "dummy0",
769
+ "ArgIndex1": "NotArgIndex",
770
+ "Var2": "dummy0",
771
+ "ArgIndex2": "NotArgIndex"
772
+ },
773
+ {
774
+ "FunctionName": "me_detail::mul_elem_32_accuracy_safe_inner(v32float, v32float, int)",
775
+ "Var1": "dummy0",
776
+ "ArgIndex1": "NotArgIndex",
777
+ "Var2": "dummy0",
778
+ "ArgIndex2": "NotArgIndex"
779
+ },
780
+ {
781
+ "FunctionName": "me_detail::mul_elem_32_accuracy_safe_inner(v32float, v32float, int)",
782
+ "Var1": "f",
783
+ "ArgIndex1": "NotArgIndex",
784
+ "Var2": "f",
785
+ "ArgIndex2": "NotArgIndex"
786
+ },
787
+ {
788
+ "FunctionName": "me_detail::mul_elem_32_accuracy_safe_inner(v32float, v32float, int)",
789
+ "Var1": "f",
790
+ "ArgIndex1": "NotArgIndex",
791
+ "Var2": "f",
792
+ "ArgIndex2": "NotArgIndex"
793
+ },
794
+ {
795
+ "FunctionName": "me_detail::mul_elem_32_accuracy_safe_inner(v32float, v32float, int)",
796
+ "Var1": "b",
797
+ "ArgIndex1": "NotArgIndex",
798
+ "Var2": "b",
799
+ "ArgIndex2": "NotArgIndex"
800
+ },
801
+ {
802
+ "FunctionName": "me_detail::mul_elem_32_accuracy_safe_inner(v32float, v32float, int)",
803
+ "Var1": "b",
804
+ "ArgIndex1": "NotArgIndex",
805
+ "Var2": "b",
806
+ "ArgIndex2": "NotArgIndex"
807
+ },
808
+ {
809
+ "FunctionName": "me_detail::mul_elem_32_accuracy_safe_inner(v32float, v32float, int)",
810
+ "Var1": "e",
811
+ "ArgIndex1": "NotArgIndex",
812
+ "Var2": "e",
813
+ "ArgIndex2": "NotArgIndex"
814
+ },
815
+ {
816
+ "FunctionName": "me_detail::mul_elem_32_accuracy_safe_inner(v32float, v32float, int)",
817
+ "Var1": "e",
818
+ "ArgIndex1": "NotArgIndex",
819
+ "Var2": "e",
820
+ "ArgIndex2": "NotArgIndex"
821
+ },
822
+ {
823
+ "FunctionName": "me_detail::mul_elem_32_accuracy_safe_inner(v32float, v32float, int)",
824
+ "Var1": "c",
825
+ "ArgIndex1": "NotArgIndex",
826
+ "Var2": "c",
827
+ "ArgIndex2": "NotArgIndex"
828
+ },
829
+ {
830
+ "FunctionName": "me_detail::mul_elem_32_accuracy_safe_inner(v32float, v32float, int)",
831
+ "Var1": "c",
832
+ "ArgIndex1": "NotArgIndex",
833
+ "Var2": "c",
834
+ "ArgIndex2": "NotArgIndex"
835
+ },
836
+ {
837
+ "FunctionName": "me_detail::mul_elem_32_accuracy_safe_inner(v32float, v32float, int)",
838
+ "Var1": "b",
839
+ "ArgIndex1": "NotArgIndex",
840
+ "Var2": "b",
841
+ "ArgIndex2": "NotArgIndex"
842
+ },
843
+ {
844
+ "FunctionName": "me_detail::mul_elem_32_accuracy_safe_inner(v32float, v32float, int)",
845
+ "Var1": "b",
846
+ "ArgIndex1": "NotArgIndex",
847
+ "Var2": "b",
848
+ "ArgIndex2": "NotArgIndex"
849
+ },
850
+ {
851
+ "FunctionName": "me_detail::mul_elem_32_accuracy_safe_inner(v32float, v32float, int)",
852
+ "Var1": "d",
853
+ "ArgIndex1": "NotArgIndex",
854
+ "Var2": "d",
855
+ "ArgIndex2": "NotArgIndex"
856
+ },
857
+ {
858
+ "FunctionName": "me_detail::mul_elem_32_accuracy_safe_inner(v32float, v32float, int)",
859
+ "Var1": "d",
860
+ "ArgIndex1": "NotArgIndex",
861
+ "Var2": "d",
862
+ "ArgIndex2": "NotArgIndex"
863
+ },
864
+ {
865
+ "FunctionName": "me_detail::mul_elem_32_accuracy_safe_inner(v32float, v32float, int)",
866
+ "Var1": "a",
867
+ "ArgIndex1": "NotArgIndex",
868
+ "Var2": "a",
869
+ "ArgIndex2": "NotArgIndex"
870
+ },
871
+ {
872
+ "FunctionName": "me_detail::mul_elem_32_accuracy_safe_inner(v32float, v32float, int)",
873
+ "Var1": "a",
874
+ "ArgIndex1": "NotArgIndex",
875
+ "Var2": "a",
876
+ "ArgIndex2": "NotArgIndex"
877
+ },
878
+ {
879
+ "FunctionName": "me_detail::mul_elem_32_accuracy_safe_inner(v32float, v32float, int)",
880
+ "Var1": "e",
881
+ "ArgIndex1": "NotArgIndex",
882
+ "Var2": "e",
883
+ "ArgIndex2": "NotArgIndex"
884
+ },
885
+ {
886
+ "FunctionName": "me_detail::mul_elem_32_accuracy_safe_inner(v32float, v32float, int)",
887
+ "Var1": "e",
888
+ "ArgIndex1": "NotArgIndex",
889
+ "Var2": "e",
890
+ "ArgIndex2": "NotArgIndex"
891
+ },
892
+ {
893
+ "FunctionName": "me_detail::mul_elem_32_accuracy_safe_inner(v32float, v32float, int)",
894
+ "Var1": "a",
895
+ "ArgIndex1": "NotArgIndex",
896
+ "Var2": "a",
897
+ "ArgIndex2": "NotArgIndex"
898
+ },
899
+ {
900
+ "FunctionName": "me_detail::mul_elem_32_accuracy_safe_inner(v32float, v32float, int)",
901
+ "Var1": "a",
902
+ "ArgIndex1": "NotArgIndex",
903
+ "Var2": "a",
904
+ "ArgIndex2": "NotArgIndex"
905
+ },
906
+ {
907
+ "FunctionName": "me_detail::mul_elem_32_accuracy_safe_inner(v32float, v32float, int)",
908
+ "Var1": "d",
909
+ "ArgIndex1": "NotArgIndex",
910
+ "Var2": "d",
911
+ "ArgIndex2": "NotArgIndex"
912
+ },
913
+ {
914
+ "FunctionName": "me_detail::mul_elem_32_accuracy_safe_inner(v32float, v32float, int)",
915
+ "Var1": "d",
916
+ "ArgIndex1": "NotArgIndex",
917
+ "Var2": "d",
918
+ "ArgIndex2": "NotArgIndex"
919
+ },
920
+ {
921
+ "FunctionName": "v32accfloat::operator+=(v32accfloat)",
922
+ "Var1": "this.addr",
923
+ "ArgIndex1": "0",
924
+ "Var2": "this1",
925
+ "ArgIndex2": "0"
926
+ },
927
+ {
928
+ "FunctionName": "v32accfloat::operator+=(v32accfloat)",
929
+ "Var1": "this.addr",
930
+ "ArgIndex1": "0",
931
+ "Var2": "this1",
932
+ "ArgIndex2": "0"
933
+ },
934
+ {
935
+ "FunctionName": "v32accfloat::operator+=(v32accfloat)",
936
+ "Var1": "tmp",
937
+ "ArgIndex1": "NotArgIndex",
938
+ "Var2": "this1",
939
+ "ArgIndex2": "0"
940
+ },
941
+ {
942
+ "FunctionName": "v32bfloat16::v32bfloat16(v32uint16)",
943
+ "Var1": "tmp",
944
+ "ArgIndex1": "NotArgIndex",
945
+ "Var2": "this1",
946
+ "ArgIndex2": "0"
947
+ },
948
+ {
949
+ "FunctionName": "get_rnd()",
950
+ "Var1": "_ZN12me_primitive11control_rndE",
951
+ "ArgIndex1": "NotArgIndex",
952
+ "Var2": "ref.tmp",
953
+ "ArgIndex2": "NotArgIndex"
954
+ },
955
+ {
956
+ "FunctionName": "uint4_t::operator unsigned int() const",
957
+ "Var1": "this.addr",
958
+ "ArgIndex1": "0",
959
+ "Var2": "this1",
960
+ "ArgIndex2": "0"
961
+ },
962
+ {
963
+ "FunctionName": "uint4_t::operator unsigned int() const",
964
+ "Var1": "this1",
965
+ "ArgIndex1": "0",
966
+ "Var2": "tmp",
967
+ "ArgIndex2": "NotArgIndex"
968
+ },
969
+ {
970
+ "FunctionName": "_ZN3aie6detail10accum_baseILNS0_10AccumClassE2ELj32ELj32EE6insertILj32ELj32EQleTL0__T1_EERS3_jRKNS1_ILS2_2EXT0_EXT_EEE",
971
+ "Var1": "acc.addr",
972
+ "ArgIndex1": "1",
973
+ "Var2": "data",
974
+ "ArgIndex2": "NotArgIndex"
975
+ },
976
+ {
977
+ "FunctionName": "_ZN3aie6detail10accum_baseILNS0_10AccumClassE2ELj32ELj32EE6insertILj32ELj32EQleTL0__T1_EERS3_jRKNS1_ILS2_2EXT0_EXT_EEE",
978
+ "Var1": "data",
979
+ "ArgIndex1": "NotArgIndex",
980
+ "Var2": "data2",
981
+ "ArgIndex2": "NotArgIndex"
982
+ },
983
+ {
984
+ "FunctionName": "v16float::v16float(v16int32)",
985
+ "Var1": "tmp",
986
+ "ArgIndex1": "NotArgIndex",
987
+ "Var2": "this1",
988
+ "ArgIndex2": "0"
989
+ },
990
+ {
991
+ "FunctionName": "v16float::v16float(chessllvmInternal, v128int4)",
992
+ "Var1": "aw",
993
+ "ArgIndex1": "NotArgIndex",
994
+ "Var2": "mw",
995
+ "ArgIndex2": "NotArgIndex"
996
+ },
997
+ {
998
+ "FunctionName": "void aie::detail::vector_base<float, 32u>::insert_helper<16u>(unsigned int, aie::detail::vector_base<float, 16u> const&)",
999
+ "Var1": "tmp",
1000
+ "ArgIndex1": "NotArgIndex",
1001
+ "Var2": "call2",
1002
+ "ArgIndex2": "NotArgIndex"
1003
+ },
1004
+ {
1005
+ "FunctionName": "_ZNK3aie6detail11vector_baseIfLj16EE9to_nativeEvQleclL_ZNS0_11vector_base4bitsEvEELi1024E",
1006
+ "Var1": "this.addr",
1007
+ "ArgIndex1": "0",
1008
+ "Var2": "data",
1009
+ "ArgIndex2": "NotArgIndex"
1010
+ },
1011
+ {
1012
+ "FunctionName": "aie::unary_op_common<aie::vector<float, 32u>, (aie::Operation)0>::unary_op_common(aie::vector<float, 32u>)",
1013
+ "Var1": "parent",
1014
+ "ArgIndex1": "0",
1015
+ "Var2": "parent_",
1016
+ "ArgIndex2": "0"
1017
+ },
1018
+ {
1019
+ "FunctionName": "aie::unary_op_common<aie::accum<accfloat, 32u>, (aie::Operation)0>::parent1() const",
1020
+ "Var1": "this.addr",
1021
+ "ArgIndex1": "0",
1022
+ "Var2": "parent_",
1023
+ "ArgIndex2": "NotArgIndex"
1024
+ },
1025
+ {
1026
+ "FunctionName": "aie::unary_op_common<aie::accum<accfloat, 32u>, (aie::Operation)0>::unary_op_common(aie::accum<accfloat, 32u>)",
1027
+ "Var1": "parent",
1028
+ "ArgIndex1": "NotArgIndex",
1029
+ "Var2": "parent_",
1030
+ "ArgIndex2": "NotArgIndex"
1031
+ },
1032
+ {
1033
+ "FunctionName": "void aie::detail::accum_base<(aie::detail::AccumClass)2, 32u, 32u>::from_vector_sign<float>(aie::vector<float, 32u> const&, bool, int)",
1034
+ "Var1": "tmp",
1035
+ "ArgIndex1": "NotArgIndex",
1036
+ "Var2": "data",
1037
+ "ArgIndex2": "NotArgIndex"
1038
+ },
1039
+ {
1040
+ "FunctionName": "_ZN3aie6detail10accum_baseILNS0_10AccumClassE2ELj32ELj32EE7upd_allILj16EJLj16EEQaaeqT1_plTL0__frplTL0_0_fraaeqTL0__TL0_0_EEvRKNS1_ILS2_2ELj32EXT_EEEDpRKNS1_ILS2_2ELj32EXT0_EEE",
1041
+ "Var1": "tmp",
1042
+ "ArgIndex1": "NotArgIndex",
1043
+ "Var2": "data",
1044
+ "ArgIndex2": "NotArgIndex"
1045
+ },
1046
+ {
1047
+ "FunctionName": "aie::detail::accum_base<(aie::detail::AccumClass)2, 32u, 16u>::operator v16accfloat() const",
1048
+ "Var1": "this.addr",
1049
+ "ArgIndex1": "0",
1050
+ "Var2": "data",
1051
+ "ArgIndex2": "NotArgIndex"
1052
+ },
1053
+ {
1054
+ "FunctionName": "v16accfloat::v16accfloat(v16float)",
1055
+ "Var1": "tmp",
1056
+ "ArgIndex1": "NotArgIndex",
1057
+ "Var2": "this1",
1058
+ "ArgIndex2": "0"
1059
+ },
1060
+ {
1061
+ "FunctionName": "aie::detail::vector_base<float, 16u>::vector_base(v16float)",
1062
+ "Var1": "data",
1063
+ "ArgIndex1": "NotArgIndex",
1064
+ "Var2": "data2",
1065
+ "ArgIndex2": "NotArgIndex"
1066
+ },
1067
+ {
1068
+ "FunctionName": "aie::detail::max_min_bits_impl_common<float, 16u, (aie::detail::MaxMinOperation)0>::run(aie::vector<float, 16u> const&, aie::vector<float, 16u> const&, bool)",
1069
+ "Var1": "tmp1",
1070
+ "ArgIndex1": "NotArgIndex",
1071
+ "Var2": "tmp",
1072
+ "ArgIndex2": "NotArgIndex"
1073
+ },
1074
+ {
1075
+ "FunctionName": "lt(v16float, v16float)",
1076
+ "Var1": "tmp",
1077
+ "ArgIndex1": "NotArgIndex",
1078
+ "Var2": "a",
1079
+ "ArgIndex2": "NotArgIndex"
1080
+ },
1081
+ {
1082
+ "FunctionName": "lt(v16float, v16float)",
1083
+ "Var1": "a",
1084
+ "ArgIndex1": "NotArgIndex",
1085
+ "Var2": "a",
1086
+ "ArgIndex2": "NotArgIndex"
1087
+ },
1088
+ {
1089
+ "FunctionName": "v16int32::v16int32(v16float)",
1090
+ "Var1": "tmp",
1091
+ "ArgIndex1": "NotArgIndex",
1092
+ "Var2": "this1",
1093
+ "ArgIndex2": "0"
1094
+ },
1095
+ {
1096
+ "FunctionName": "v16int32::v16int32(chessllvmInternal, v128int4)",
1097
+ "Var1": "aw",
1098
+ "ArgIndex1": "NotArgIndex",
1099
+ "Var2": "mw",
1100
+ "ArgIndex2": "NotArgIndex"
1101
+ },
1102
+ {
1103
+ "FunctionName": "aie::detail::vector_base<float, 16u> aie::detail::vector_base<float, 16u>::grow<16u>(unsigned int) const",
1104
+ "Var1": "this.addr",
1105
+ "ArgIndex1": "0",
1106
+ "Var2": "data",
1107
+ "ArgIndex2": "NotArgIndex"
1108
+ },
1109
+ {
1110
+ "FunctionName": "aie::detail::max_min_bits_impl_common<float, 16u, (aie::detail::MaxMinOperation)1>::run(aie::vector<float, 16u> const&, aie::vector<float, 16u> const&, bool)",
1111
+ "Var1": "tmp1",
1112
+ "ArgIndex1": "NotArgIndex",
1113
+ "Var2": "tmp",
1114
+ "ArgIndex2": "NotArgIndex"
1115
+ },
1116
+ {
1117
+ "FunctionName": "ge(v16float, v16float)",
1118
+ "Var1": "tmp",
1119
+ "ArgIndex1": "NotArgIndex",
1120
+ "Var2": "a",
1121
+ "ArgIndex2": "NotArgIndex"
1122
+ },
1123
+ {
1124
+ "FunctionName": "ge(v16float, v16float)",
1125
+ "Var1": "a",
1126
+ "ArgIndex1": "NotArgIndex",
1127
+ "Var2": "a",
1128
+ "ArgIndex2": "NotArgIndex"
1129
+ },
1130
+ {
1131
+ "FunctionName": "aie::detail::elementary_vector_bits_impl<(aie::detail::ElementaryOp)8, 32u, int, float, 32u>::run(aie::vector<float, 32u> const&, int, bool)",
1132
+ "Var1": "acc_input",
1133
+ "ArgIndex1": "NotArgIndex",
1134
+ "Var2": "vfp",
1135
+ "ArgIndex2": "0"
1136
+ },
1137
+ {
1138
+ "FunctionName": "aie::detail::elementary_vector_bits_impl<(aie::detail::ElementaryOp)8, 32u, int, float, 32u>::run(aie::vector<float, 32u> const&, int, bool)",
1139
+ "Var1": "tmp17",
1140
+ "ArgIndex1": "NotArgIndex",
1141
+ "Var2": "vfp",
1142
+ "ArgIndex2": "0"
1143
+ },
1144
+ {
1145
+ "FunctionName": "aie::detail::elementary_vector_bits_impl<(aie::detail::ElementaryOp)8, 32u, int, float, 32u>::run(aie::vector<float, 32u> const&, int, bool)",
1146
+ "Var1": "tmp19",
1147
+ "ArgIndex1": "NotArgIndex",
1148
+ "Var2": "vint",
1149
+ "ArgIndex2": "0"
1150
+ },
1151
+ {
1152
+ "FunctionName": "aie::detail::elementary_vector_bits_impl<(aie::detail::ElementaryOp)8, 32u, int, float, 32u>::run(aie::vector<float, 32u> const&, int, bool)",
1153
+ "Var1": "tmp25",
1154
+ "ArgIndex1": "NotArgIndex",
1155
+ "Var2": "out_h",
1156
+ "ArgIndex2": "NotArgIndex"
1157
+ },
1158
+ {
1159
+ "FunctionName": "aie::detail::elementary_vector_bits_impl<(aie::detail::ElementaryOp)8, 32u, int, float, 32u>::run(aie::vector<float, 32u> const&, int, bool)",
1160
+ "Var1": "tmp27",
1161
+ "ArgIndex1": "NotArgIndex",
1162
+ "Var2": "vint",
1163
+ "ArgIndex2": "0"
1164
+ },
1165
+ {
1166
+ "FunctionName": "aie::detail::elementary_vector_bits_impl<(aie::detail::ElementaryOp)8, 32u, int, float, 32u>::run(aie::vector<float, 32u> const&, int, bool)",
1167
+ "Var1": "tmp32",
1168
+ "ArgIndex1": "NotArgIndex",
1169
+ "Var2": "tmp",
1170
+ "ArgIndex2": "NotArgIndex"
1171
+ },
1172
+ {
1173
+ "FunctionName": "aie::detail::elementary_vector_bits_impl<(aie::detail::ElementaryOp)8, 32u, int, float, 32u>::run(aie::vector<float, 32u> const&, int, bool)",
1174
+ "Var1": "tmp36",
1175
+ "ArgIndex1": "NotArgIndex",
1176
+ "Var2": "vfp",
1177
+ "ArgIndex2": "0"
1178
+ },
1179
+ {
1180
+ "FunctionName": "aie::detail::elementary_vector_bits_impl<(aie::detail::ElementaryOp)8, 32u, int, float, 32u>::run(aie::vector<float, 32u> const&, int, bool)",
1181
+ "Var1": "tmp38",
1182
+ "ArgIndex1": "NotArgIndex",
1183
+ "Var2": "vfp",
1184
+ "ArgIndex2": "0"
1185
+ },
1186
+ {
1187
+ "FunctionName": "aie::detail::elementary_vector_bits_impl<(aie::detail::ElementaryOp)8, 32u, int, float, 32u>::run(aie::vector<float, 32u> const&, int, bool)",
1188
+ "Var1": "tmp40",
1189
+ "ArgIndex1": "NotArgIndex",
1190
+ "Var2": "vint",
1191
+ "ArgIndex2": "0"
1192
+ },
1193
+ {
1194
+ "FunctionName": "aie::detail::elementary_vector_bits_impl<(aie::detail::ElementaryOp)8, 32u, int, float, 32u>::run(aie::vector<float, 32u> const&, int, bool)",
1195
+ "Var1": "tmp52",
1196
+ "ArgIndex1": "NotArgIndex",
1197
+ "Var2": "tmp51",
1198
+ "ArgIndex2": "NotArgIndex"
1199
+ },
1200
+ {
1201
+ "FunctionName": "aie::detail::elementary_vector_bits_impl<(aie::detail::ElementaryOp)8, 32u, int, float, 32u>::run(aie::vector<float, 32u> const&, int, bool)",
1202
+ "Var1": "tmp58",
1203
+ "ArgIndex1": "NotArgIndex",
1204
+ "Var2": "agg.result",
1205
+ "ArgIndex2": "0"
1206
+ },
1207
+ {
1208
+ "FunctionName": "aie::detail::add_sub_accum_bits_impl_common<acc32, 32u, (aie::detail::AddSubOperation)1>::run(aie::accum<acc32, 32u> const&, bool, aie::accum<acc32, 32u> const&)",
1209
+ "Var1": "tmp1",
1210
+ "ArgIndex1": "NotArgIndex",
1211
+ "Var2": "tmp",
1212
+ "ArgIndex2": "NotArgIndex"
1213
+ },
1214
+ {
1215
+ "FunctionName": "void aie::detail::accum_base<(aie::detail::AccumClass)0, 32u, 32u>::from_vector_sign<short>(aie::vector<short, 32u> const&, bool, int)",
1216
+ "Var1": "tmp",
1217
+ "ArgIndex1": "NotArgIndex",
1218
+ "Var2": "data",
1219
+ "ArgIndex2": "NotArgIndex"
1220
+ },
1221
+ {
1222
+ "FunctionName": "_ZNK3aie6detail11vector_baseIsLj32EE9to_nativeEvQleclL_ZNS0_11vector_base4bitsEvEELi1024E",
1223
+ "Var1": "this.addr",
1224
+ "ArgIndex1": "0",
1225
+ "Var2": "data",
1226
+ "ArgIndex2": "NotArgIndex"
1227
+ },
1228
+ {
1229
+ "FunctionName": "_ZN3aie6detail10accum_baseILNS0_10AccumClassE0ELj32ELj64EE6insertILj64ELj32EQleTL0__T1_EERS3_jRKNS1_ILS2_0EXT0_EXT_EEE",
1230
+ "Var1": "acc.addr",
1231
+ "ArgIndex1": "1",
1232
+ "Var2": "data",
1233
+ "ArgIndex2": "NotArgIndex"
1234
+ },
1235
+ {
1236
+ "FunctionName": "_ZN3aie6detail10accum_baseILNS0_10AccumClassE0ELj32ELj64EE6insertILj64ELj32EQleTL0__T1_EERS3_jRKNS1_ILS2_0EXT0_EXT_EEE",
1237
+ "Var1": "data",
1238
+ "ArgIndex1": "NotArgIndex",
1239
+ "Var2": "data2",
1240
+ "ArgIndex2": "NotArgIndex"
1241
+ },
1242
+ {
1243
+ "FunctionName": "aie::detail::add_sub_accum_bits_impl_common<acc64, 32u, (aie::detail::AddSubOperation)0>::run(aie::accum<acc64, 32u> const&, bool, aie::accum<acc64, 32u> const&)",
1244
+ "Var1": "tmp1",
1245
+ "ArgIndex1": "NotArgIndex",
1246
+ "Var2": "tmp",
1247
+ "ArgIndex2": "NotArgIndex"
1248
+ },
1249
+ {
1250
+ "FunctionName": "aie::detail::accum_base<(aie::detail::AccumClass)0, 64u, 32u>::operator v32acc64() const",
1251
+ "Var1": "this.addr",
1252
+ "ArgIndex1": "0",
1253
+ "Var2": "data",
1254
+ "ArgIndex2": "NotArgIndex"
1255
+ },
1256
+ {
1257
+ "FunctionName": "void aie::detail::accum_base<(aie::detail::AccumClass)0, 64u, 32u>::from_vector_sign<short>(aie::vector<short, 32u> const&, bool, int)",
1258
+ "Var1": "tmp",
1259
+ "ArgIndex1": "NotArgIndex",
1260
+ "Var2": "data",
1261
+ "ArgIndex2": "NotArgIndex"
1262
+ },
1263
+ {
1264
+ "FunctionName": "void aie::detail::accum_base<(aie::detail::AccumClass)0, 64u, 32u>::from_vector_sign<unsigned short>(aie::vector<unsigned short, 32u> const&, bool, int)",
1265
+ "Var1": "tmp",
1266
+ "ArgIndex1": "NotArgIndex",
1267
+ "Var2": "data",
1268
+ "ArgIndex2": "NotArgIndex"
1269
+ },
1270
+ {
1271
+ "FunctionName": "aie::detail::add_sub_accum_bits_impl_common<acc64, 32u, (aie::detail::AddSubOperation)1>::run(aie::accum<acc64, 32u> const&, bool, aie::accum<acc64, 32u> const&)",
1272
+ "Var1": "tmp1",
1273
+ "ArgIndex1": "NotArgIndex",
1274
+ "Var2": "tmp",
1275
+ "ArgIndex2": "NotArgIndex"
1276
+ },
1277
+ {
1278
+ "FunctionName": "aie::detail::accum_base<(aie::detail::AccumClass)2, 32u, 64u>::operator v64accfloat() const",
1279
+ "Var1": "this.addr",
1280
+ "ArgIndex1": "0",
1281
+ "Var2": "data",
1282
+ "ArgIndex2": "NotArgIndex"
1283
+ },
1284
+ {
1285
+ "FunctionName": "aie::detail::accum_base<(aie::detail::AccumClass)2, 32u, 64u> aie::detail::accum_base<(aie::detail::AccumClass)2, 32u, 32u>::grow<64u>() const",
1286
+ "Var1": "tmp",
1287
+ "ArgIndex1": "NotArgIndex",
1288
+ "Var2": "data2",
1289
+ "ArgIndex2": "NotArgIndex"
1290
+ },
1291
+ {
1292
+ "FunctionName": "_ZN3aie3mulITkNS_17AccumElemBaseTypeE5acc64TkNS_10VectorOrOpENS_8unary_opINS_6vectorIiLj32EEELNS_9OperationE0EEETkNS_8ElemOrOpENS2_IiLS5_0EEEQaa15is_valid_size_vIT0_T1_E17is_valid_mul_op_vINS8_10value_typeES9_EEENS_5accumIT_XclsrS8_4sizeEEEERKS8_S9_",
1293
+ "Var1": "a",
1294
+ "ArgIndex1": "NotArgIndex",
1295
+ "Var2": "agg.tmp3",
1296
+ "ArgIndex2": "NotArgIndex"
1297
+ },
1298
+ {
1299
+ "FunctionName": "aie::unary_op_common<int, (aie::Operation)0>::parent1() const",
1300
+ "Var1": "this.addr",
1301
+ "ArgIndex1": "0",
1302
+ "Var2": "parent_",
1303
+ "ArgIndex2": "NotArgIndex"
1304
+ },
1305
+ {
1306
+ "FunctionName": "_ZN3aie6detail13mul_bits_implILNS0_10MulMacroOpE0ELj64ELj32EiLj32EiE3runILj32EJEQfraa10is_accum_vITL0_0_EEENS_5accumI5acc64XT_EEERKNS_6vectorIiXT_EEEbSC_bDpRKT0_",
1307
+ "Var1": "tmp",
1308
+ "ArgIndex1": "NotArgIndex",
1309
+ "Var2": "ret",
1310
+ "ArgIndex2": "NotArgIndex"
1311
+ },
1312
+ {
1313
+ "FunctionName": "mul_elem_32(v16int32, v16int32, int, v16int32, v16int32, int)",
1314
+ "Var1": "a_hi",
1315
+ "ArgIndex1": "NotArgIndex",
1316
+ "Var2": "b_hi",
1317
+ "ArgIndex2": "NotArgIndex"
1318
+ },
1319
+ {
1320
+ "FunctionName": "mul_elem_32(v16int32, v16int32, int, v16int32, v16int32, int)",
1321
+ "Var1": "tmp",
1322
+ "ArgIndex1": "NotArgIndex",
1323
+ "Var2": "retval",
1324
+ "ArgIndex2": "NotArgIndex"
1325
+ },
1326
+ {
1327
+ "FunctionName": "mul_elem_32(v16int32, v16int32, int, v16int32, v16int32, int)",
1328
+ "Var1": "a_lo",
1329
+ "ArgIndex1": "NotArgIndex",
1330
+ "Var2": "b_lo",
1331
+ "ArgIndex2": "NotArgIndex"
1332
+ },
1333
+ {
1334
+ "FunctionName": "mul_elem_32(v16int32, v16int32, int, v16int32, v16int32, int)",
1335
+ "Var1": "retval",
1336
+ "ArgIndex1": "NotArgIndex",
1337
+ "Var2": "retval",
1338
+ "ArgIndex2": "NotArgIndex"
1339
+ },
1340
+ {
1341
+ "FunctionName": "mul_elem_32(v16int32, v16int32, int, v16int32, v16int32, int)",
1342
+ "Var1": "tmp9",
1343
+ "ArgIndex1": "NotArgIndex",
1344
+ "Var2": "retval",
1345
+ "ArgIndex2": "NotArgIndex"
1346
+ },
1347
+ {
1348
+ "FunctionName": "mul_elem_32(v16int32, v16int32, int, v16int32, v16int32, int)",
1349
+ "Var1": "retval",
1350
+ "ArgIndex1": "NotArgIndex",
1351
+ "Var2": "retval",
1352
+ "ArgIndex2": "NotArgIndex"
1353
+ },
1354
+ {
1355
+ "FunctionName": "v32int16::v32int16(v16int32)",
1356
+ "Var1": "tmp",
1357
+ "ArgIndex1": "NotArgIndex",
1358
+ "Var2": "this1",
1359
+ "ArgIndex2": "0"
1360
+ },
1361
+ {
1362
+ "FunctionName": "v32int16::v32int16(chessllvmInternal, v128int4)",
1363
+ "Var1": "aw",
1364
+ "ArgIndex1": "NotArgIndex",
1365
+ "Var2": "mw",
1366
+ "ArgIndex2": "NotArgIndex"
1367
+ },
1368
+ {
1369
+ "FunctionName": "aie::detail::accum_base<(aie::detail::AccumClass)0, 64u, 16u>::operator v16acc64() const",
1370
+ "Var1": "this.addr",
1371
+ "ArgIndex1": "0",
1372
+ "Var2": "data",
1373
+ "ArgIndex2": "NotArgIndex"
1374
+ },
1375
+ {
1376
+ "FunctionName": "aie::detail::max_min_bits_impl_common<int, 16u, (aie::detail::MaxMinOperation)1>::run(aie::vector<int, 16u> const&, aie::vector<int, 16u> const&, bool)",
1377
+ "Var1": "tmp1",
1378
+ "ArgIndex1": "NotArgIndex",
1379
+ "Var2": "tmp",
1380
+ "ArgIndex2": "NotArgIndex"
1381
+ },
1382
+ {
1383
+ "FunctionName": "aie::detail::vector_base<int, 16u> aie::detail::vector_base<int, 16u>::grow<16u>(unsigned int) const",
1384
+ "Var1": "this.addr",
1385
+ "ArgIndex1": "0",
1386
+ "Var2": "data",
1387
+ "ArgIndex2": "NotArgIndex"
1388
+ },
1389
+ {
1390
+ "FunctionName": "aie::vector_elem_ref<int, 32u>::get() const",
1391
+ "Var1": "this.addr",
1392
+ "ArgIndex1": "0",
1393
+ "Var2": "offset",
1394
+ "ArgIndex2": "NotArgIndex"
1395
+ },
1396
+ {
1397
+ "FunctionName": "aie::vector_elem_ref<int, 32u>::get() const",
1398
+ "Var1": "this.addr",
1399
+ "ArgIndex1": "0",
1400
+ "Var2": "parent",
1401
+ "ArgIndex2": "NotArgIndex"
1402
+ },
1403
+ {
1404
+ "FunctionName": "aie::detail::vector_base<int, 16u>::get(unsigned int) const",
1405
+ "Var1": "this.addr",
1406
+ "ArgIndex1": "0",
1407
+ "Var2": "data",
1408
+ "ArgIndex2": "NotArgIndex"
1409
+ },
1410
+ {
1411
+ "FunctionName": "_ZN3aie6detail11vector_baseI8bfloat16Lj16EE14load_unalignedIL15aie_dm_resource0ES2_Qsr3stdE9is_same_vIN22aie_dm_resource_removeITL0_0_E4typeET_EEEvPKT0_j",
1412
+ "Var1": "tmp14",
1413
+ "ArgIndex1": "NotArgIndex",
1414
+ "Var2": "data",
1415
+ "ArgIndex2": "NotArgIndex"
1416
+ },
1417
+ {
1418
+ "FunctionName": "aie::detail::vector_base<bfloat16, 16u>::vector_base(v16bfloat16)",
1419
+ "Var1": "data",
1420
+ "ArgIndex1": "NotArgIndex",
1421
+ "Var2": "data2",
1422
+ "ArgIndex2": "NotArgIndex"
1423
+ },
1424
+ {
1425
+ "FunctionName": "void aie::detail::vector_base<bfloat16, 32u>::insert_helper<16u>(unsigned int, aie::detail::vector_base<bfloat16, 16u> const&)",
1426
+ "Var1": "this.addr",
1427
+ "ArgIndex1": "0",
1428
+ "Var2": "data",
1429
+ "ArgIndex2": "NotArgIndex"
1430
+ },
1431
+ {
1432
+ "FunctionName": "void aie::detail::vector_base<bfloat16, 32u>::insert_helper<16u>(unsigned int, aie::detail::vector_base<bfloat16, 16u> const&)",
1433
+ "Var1": "tmp",
1434
+ "ArgIndex1": "NotArgIndex",
1435
+ "Var2": "data3",
1436
+ "ArgIndex2": "NotArgIndex"
1437
+ },
1438
+ {
1439
+ "FunctionName": "_ZNK3aie6detail11vector_baseI8bfloat16Lj16EE9to_nativeEvQleclL_ZNS0_11vector_base4bitsEvEELi1024E",
1440
+ "Var1": "this.addr",
1441
+ "ArgIndex1": "0",
1442
+ "Var2": "data",
1443
+ "ArgIndex2": "NotArgIndex"
1444
+ },
1445
+ {
1446
+ "FunctionName": "aie::vector_elem_ref<bfloat16, 32u>::get() const",
1447
+ "Var1": "this.addr",
1448
+ "ArgIndex1": "0",
1449
+ "Var2": "offset",
1450
+ "ArgIndex2": "NotArgIndex"
1451
+ },
1452
+ {
1453
+ "FunctionName": "aie::vector_elem_ref<bfloat16, 32u>::get() const",
1454
+ "Var1": "this.addr",
1455
+ "ArgIndex1": "0",
1456
+ "Var2": "parent",
1457
+ "ArgIndex2": "NotArgIndex"
1458
+ },
1459
+ {
1460
+ "FunctionName": "aie::detail::vector_base<bfloat16, 32u>::get(unsigned int) const",
1461
+ "Var1": "this.addr",
1462
+ "ArgIndex1": "0",
1463
+ "Var2": "data",
1464
+ "ArgIndex2": "NotArgIndex"
1465
+ },
1466
+ {
1467
+ "FunctionName": "aie::unary_op_common<aie::vector<bfloat16, 16u>, (aie::Operation)0>::parent1() const",
1468
+ "Var1": "this.addr",
1469
+ "ArgIndex1": "0",
1470
+ "Var2": "parent_",
1471
+ "ArgIndex2": "NotArgIndex"
1472
+ },
1473
+ {
1474
+ "FunctionName": "_ZN3aie6detail10accum_baseILNS0_10AccumClassE2ELj32ELj16EE6insertILj16ELj32EQleTL0__T1_EERS3_jRKNS1_ILS2_2EXT0_EXT_EEE",
1475
+ "Var1": "acc.addr",
1476
+ "ArgIndex1": "1",
1477
+ "Var2": "data",
1478
+ "ArgIndex2": "NotArgIndex"
1479
+ },
1480
+ {
1481
+ "FunctionName": "_ZN3aie6detail10accum_baseILNS0_10AccumClassE2ELj32ELj16EE6insertILj16ELj32EQleTL0__T1_EERS3_jRKNS1_ILS2_2EXT0_EXT_EEE",
1482
+ "Var1": "data",
1483
+ "ArgIndex1": "NotArgIndex",
1484
+ "Var2": "data2",
1485
+ "ArgIndex2": "NotArgIndex"
1486
+ },
1487
+ {
1488
+ "FunctionName": "aie::unary_op_common<aie::vector<bfloat16, 16u>, (aie::Operation)0>::unary_op_common(aie::vector<bfloat16, 16u>)",
1489
+ "Var1": "parent",
1490
+ "ArgIndex1": "NotArgIndex",
1491
+ "Var2": "parent_",
1492
+ "ArgIndex2": "NotArgIndex"
1493
+ },
1494
+ {
1495
+ "FunctionName": "aie::unary_op_common<aie::accum<accfloat, 16u>, (aie::Operation)0>::parent1() const",
1496
+ "Var1": "this.addr",
1497
+ "ArgIndex1": "0",
1498
+ "Var2": "parent_",
1499
+ "ArgIndex2": "NotArgIndex"
1500
+ },
1501
+ {
1502
+ "FunctionName": "aie::detail::add_sub_accum_bits_impl<accfloat, 16u, (aie::detail::AddSubOperation)0>::run(aie::accum<accfloat, 16u> const&, bool, aie::accum<accfloat, 16u> const&)",
1503
+ "Var1": "tmp1",
1504
+ "ArgIndex1": "NotArgIndex",
1505
+ "Var2": "tmp",
1506
+ "ArgIndex2": "NotArgIndex"
1507
+ },
1508
+ {
1509
+ "FunctionName": "aie::detail::accum_base<(aie::detail::AccumClass)2, 32u, 32u> aie::detail::accum_base<(aie::detail::AccumClass)2, 32u, 16u>::grow<32u>() const",
1510
+ "Var1": "tmp",
1511
+ "ArgIndex1": "NotArgIndex",
1512
+ "Var2": "data2",
1513
+ "ArgIndex2": "NotArgIndex"
1514
+ },
1515
+ {
1516
+ "FunctionName": "aie::unary_op_common<aie::accum<accfloat, 16u>, (aie::Operation)0>::unary_op_common(aie::accum<accfloat, 16u>)",
1517
+ "Var1": "parent",
1518
+ "ArgIndex1": "NotArgIndex",
1519
+ "Var2": "parent_",
1520
+ "ArgIndex2": "NotArgIndex"
1521
+ },
1522
+ {
1523
+ "FunctionName": "aie::detail::vector_base<bfloat16, 16u> aie::detail::vector_base<bfloat16, 16u>::extract_helper<16u>(unsigned int) const",
1524
+ "Var1": "this.addr",
1525
+ "ArgIndex1": "0",
1526
+ "Var2": "this1",
1527
+ "ArgIndex2": "0"
1528
+ },
1529
+ {
1530
+ "FunctionName": "_ZNK3aie6detail11vector_baseI8bfloat16Lj16EE5storeIL15aie_dm_resource0EU3AS5S2_Qsr3stdE9is_same_vIN22aie_dm_resource_removeITL0_0_E4typeET_EEEvPT0_",
1531
+ "Var1": "this.addr",
1532
+ "ArgIndex1": "0",
1533
+ "Var2": "data",
1534
+ "ArgIndex2": "NotArgIndex"
1535
+ },
1536
+ {
1537
+ "FunctionName": "_ZNK3aie6detail11vector_baseI8bfloat16Lj16EE15store_unalignedIL15aie_dm_resource0EU3AS5S2_Qsr3stdE9is_same_vIN22aie_dm_resource_removeITL0_0_E4typeET_EEEvPT0_j",
1538
+ "Var1": "native_ptr",
1539
+ "ArgIndex1": "0",
1540
+ "Var2": "arrayidx",
1541
+ "ArgIndex2": "NotArgIndex"
1542
+ },
1543
+ {
1544
+ "FunctionName": "_ZNK3aie6detail11vector_baseI8bfloat16Lj16EE15store_unalignedIL15aie_dm_resource0EU3AS5S2_Qsr3stdE9is_same_vIN22aie_dm_resource_removeITL0_0_E4typeET_EEEvPT0_j",
1545
+ "Var1": "native_ptr",
1546
+ "ArgIndex1": "0",
1547
+ "Var2": "arrayidx16",
1548
+ "ArgIndex2": "NotArgIndex"
1549
+ },
1550
+ {
1551
+ "FunctionName": "_ZNK3aie6detail11vector_baseI8bfloat16Lj16EE15store_unalignedIL15aie_dm_resource0EU3AS5S2_Qsr3stdE9is_same_vIN22aie_dm_resource_removeITL0_0_E4typeET_EEEvPT0_j",
1552
+ "Var1": "tmp",
1553
+ "ArgIndex1": "NotArgIndex",
1554
+ "Var2": "arrayidx28",
1555
+ "ArgIndex2": "NotArgIndex"
1556
+ },
1557
+ {
1558
+ "FunctionName": "_ZNK3aie6detail11vector_baseI8bfloat16Lj16EE15store_unalignedIL15aie_dm_resource0EU3AS5S2_Qsr3stdE9is_same_vIN22aie_dm_resource_removeITL0_0_E4typeET_EEEvPT0_j",
1559
+ "Var1": "tmp29",
1560
+ "ArgIndex1": "NotArgIndex",
1561
+ "Var2": "arrayidx33",
1562
+ "ArgIndex2": "NotArgIndex"
1563
+ },
1564
+ {
1565
+ "FunctionName": "aie::detail::vector_base<signed char, 64u>::vector_base(v64int8)",
1566
+ "Var1": "data",
1567
+ "ArgIndex1": "NotArgIndex",
1568
+ "Var2": "data2",
1569
+ "ArgIndex2": "NotArgIndex"
1570
+ },
1571
+ {
1572
+ "FunctionName": "aie::detail::vector_base<signed char, 32u>::vector_base(v32int8)",
1573
+ "Var1": "data",
1574
+ "ArgIndex1": "NotArgIndex",
1575
+ "Var2": "data2",
1576
+ "ArgIndex2": "NotArgIndex"
1577
+ },
1578
+ {
1579
+ "FunctionName": "v32int8::v32int8(v16bfloat16)",
1580
+ "Var1": "tmp",
1581
+ "ArgIndex1": "NotArgIndex",
1582
+ "Var2": "this1",
1583
+ "ArgIndex2": "0"
1584
+ },
1585
+ {
1586
+ "FunctionName": "v32int8::v32int8(chessllvmInternal, v64int4)",
1587
+ "Var1": "aw",
1588
+ "ArgIndex1": "NotArgIndex",
1589
+ "Var2": "mw",
1590
+ "ArgIndex2": "NotArgIndex"
1591
+ },
1592
+ {
1593
+ "FunctionName": "_ZNK3aie6detail11vector_baseIaLj32EE9to_nativeEvQleclL_ZNS0_11vector_base4bitsEvEELi1024E",
1594
+ "Var1": "this.addr",
1595
+ "ArgIndex1": "0",
1596
+ "Var2": "data",
1597
+ "ArgIndex2": "NotArgIndex"
1598
+ },
1599
+ {
1600
+ "FunctionName": "_ZNK3aie6detail11vector_baseIaLj64EE9to_nativeEvQleclL_ZNS0_11vector_base4bitsEvEELi1024E",
1601
+ "Var1": "this.addr",
1602
+ "ArgIndex1": "0",
1603
+ "Var2": "data",
1604
+ "ArgIndex2": "NotArgIndex"
1605
+ }
1606
+ ]
1607
+ }
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/ir/i802_wrap_resize_adf_wrapper_results.json ADDED
@@ -0,0 +1,640 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "ModulePath": "/app/vaiml_1.3_examples/camo/segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/ir/i802_wrap_resize_adf_wrapper.cpp",
3
+ "KernelSourcePath": "/usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/src/ml_adf/resize_adf_wrapper.cpp",
4
+ "UseCases": [
5
+ {
6
+ "Index": 0,
7
+ "KernelFunction": "mllib_graphs::resize_adf_wrapper<bfloat16, adf::io_buffer_config<adf::extents<>>, adf::io_buffer_config<adf::extents<>>, 1, 0, 0>",
8
+ "InitializationFunction": "",
9
+ "KernelClassCtor": "",
10
+ "Instances": [
11
+ "i802",
12
+ "i803",
13
+ "i804",
14
+ "i805",
15
+ "i807",
16
+ "i808",
17
+ "i809",
18
+ "i810",
19
+ "i812",
20
+ "i813",
21
+ "i814",
22
+ "i815",
23
+ "i817",
24
+ "i818",
25
+ "i819",
26
+ "i820",
27
+ "i829",
28
+ "i830",
29
+ "i831",
30
+ "i832",
31
+ "i834",
32
+ "i835",
33
+ "i836",
34
+ "i837",
35
+ "i839",
36
+ "i840",
37
+ "i841",
38
+ "i842",
39
+ "i844",
40
+ "i845",
41
+ "i846",
42
+ "i847"
43
+ ]
44
+ }
45
+ ],
46
+ "AccessRecords": [],
47
+ "ControlRegsUsage": {
48
+ "RndRecords": {},
49
+ "SatRecords": {},
50
+ "SymSatRecords": {}
51
+ },
52
+ "ParameterLoads": {
53
+ "::operator()<aie::accum<acc32, 64U>, aie::accum<acc32, 64U>, bool, int, int, int>": [
54
+ "may",
55
+ "sometimes",
56
+ "sometimes",
57
+ "sometimes",
58
+ "sometimes",
59
+ "sometimes",
60
+ "sometimes"
61
+ ],
62
+ "::operator()<aie::accum<acc64, 32U>, aie::accum<acc64, 32U>, bool, int, int, int>": [
63
+ "may",
64
+ "sometimes",
65
+ "sometimes",
66
+ "sometimes",
67
+ "sometimes",
68
+ "sometimes",
69
+ "sometimes"
70
+ ],
71
+ "::operator()<aie::accum<accfloat, 32U>, aie::accum<accfloat, 32U>, bool, int, int>": [
72
+ "may",
73
+ "sometimes",
74
+ "sometimes",
75
+ "sometimes",
76
+ "sometimes",
77
+ "sometimes"
78
+ ],
79
+ "::operator()<aie::detail::utils::iteration_dim<unsigned int, 0U, 1U, 0U> >": [
80
+ "sometimes"
81
+ ],
82
+ "__regcall3__chessintr___sint_extract_elem_v16int32___sint___sint": [
83
+ "may",
84
+ "may",
85
+ "may"
86
+ ],
87
+ "__regcall3__chessintr___sint_read_coreid_": [],
88
+ "__regcall3__chessintr___uint___uint_uint2_t": [
89
+ "may"
90
+ ],
91
+ "__regcall3__chessintr___uint___uint_uint4_t": [
92
+ "may"
93
+ ],
94
+ "__regcall3__chessintr___uint___uint_uint5_t": [
95
+ "may"
96
+ ],
97
+ "__regcall3__chessintr___uint_select_bool___uint___uint": [
98
+ "may",
99
+ "may",
100
+ "may"
101
+ ],
102
+ "__regcall3__chessintr_bfloat16_extract_elem_v32bfloat16___sint___sint": [
103
+ "may",
104
+ "may",
105
+ "may"
106
+ ],
107
+ "__regcall3__chessintr_mask64_mask64___ulonglong": [
108
+ "may"
109
+ ],
110
+ "__regcall3__chessintr_uint1_t_uint1_t___sint": [
111
+ "may"
112
+ ],
113
+ "__regcall3__chessintr_uint2_t_uint2_t___uint": [
114
+ "may"
115
+ ],
116
+ "__regcall3__chessintr_uint4_t_uint4_t___uint": [
117
+ "may"
118
+ ],
119
+ "__regcall3__chessintr_uint5_t_uint5_t___sint": [
120
+ "may"
121
+ ],
122
+ "__regcall3__chessintr_uint5_t_uint5_t___uint": [
123
+ "may"
124
+ ],
125
+ "__regcall3__chessintr_uint6_t_uint6_t___sint": [
126
+ "may"
127
+ ],
128
+ "__regcall3__chessintr_v16acc64_ext_dh_v32acc64": [
129
+ "may"
130
+ ],
131
+ "__regcall3__chessintr_v16acc64_ext_dl_v32acc64": [
132
+ "may"
133
+ ],
134
+ "__regcall3__chessintr_v16acc64_undef_v16acc64": [],
135
+ "__regcall3__chessintr_v16accfloat_ext_ch_v32accfloat": [
136
+ "may"
137
+ ],
138
+ "__regcall3__chessintr_v16accfloat_ext_cl_v32accfloat": [
139
+ "may"
140
+ ],
141
+ "__regcall3__chessintr_v16accfloat_undef_v16accfloat": [],
142
+ "__regcall3__chessintr_v16accfloat_v16accfloat_v16float": [
143
+ "may"
144
+ ],
145
+ "__regcall3__chessintr_v16bfloat16_ext_xh_v32bfloat16": [
146
+ "may"
147
+ ],
148
+ "__regcall3__chessintr_v16bfloat16_ext_xl_v32bfloat16": [
149
+ "may"
150
+ ],
151
+ "__regcall3__chessintr_v16bfloat16_srs_v16accfloat_uint4_t_uint5_t": [
152
+ "may",
153
+ "may",
154
+ "may"
155
+ ],
156
+ "__regcall3__chessintr_v16bfloat16_undef_v16bfloat16": [],
157
+ "__regcall3__chessintr_v16float_ext_yh_v32float": [
158
+ "may"
159
+ ],
160
+ "__regcall3__chessintr_v16float_ext_yl_v32float": [
161
+ "may"
162
+ ],
163
+ "__regcall3__chessintr_v16float_undef_v16float": [],
164
+ "__regcall3__chessintr_v16int32_broadcast_s32___sint": [
165
+ "may"
166
+ ],
167
+ "__regcall3__chessintr_v16int32_broadcast_to_v16int32___sint": [
168
+ "may"
169
+ ],
170
+ "__regcall3__chessintr_v16int32_insert_v16int32___sint___sint": [
171
+ "may",
172
+ "may",
173
+ "may"
174
+ ],
175
+ "__regcall3__chessintr_v16int32_lsrs_v16acc64_uint6_t_uint1_t_uint1_t_uint2_t_uint4_t_bool": [
176
+ "may",
177
+ "may",
178
+ "may",
179
+ "may",
180
+ "may",
181
+ "may"
182
+ ],
183
+ "__regcall3__chessintr_v16int32_shiftx_v16int32_v16int32_uint6_t___uint": [
184
+ "may",
185
+ "may",
186
+ "may",
187
+ "may"
188
+ ],
189
+ "__regcall3__chessintr_v16int32_shuffle_v16int32_v16int32___uint": [
190
+ "may",
191
+ "may",
192
+ "may"
193
+ ],
194
+ "__regcall3__chessintr_v16int32_undef_v16int32": [],
195
+ "__regcall3__chessintr_v16int32_vadd32_v16int32_v16int32_uint1_t_uint5_t___uint___uint": [
196
+ "may",
197
+ "may",
198
+ "may",
199
+ "may",
200
+ "may"
201
+ ],
202
+ "__regcall3__chessintr_v32acc32_ext_dh_v64acc32": [
203
+ "may"
204
+ ],
205
+ "__regcall3__chessintr_v32acc32_ext_dl_v64acc32": [
206
+ "may"
207
+ ],
208
+ "__regcall3__chessintr_v32acc32_undef_v32acc32": [],
209
+ "__regcall3__chessintr_v32acc32_ups_x2c_v32int16_uint6_t_uint1_t_uint1_t_uint2_t_bool": [
210
+ "may",
211
+ "may",
212
+ "may",
213
+ "may",
214
+ "may"
215
+ ],
216
+ "__regcall3__chessintr_v32acc32_ups_x2c_v32uint16_uint6_t_uint1_t_uint1_t_uint2_t_bool": [
217
+ "may",
218
+ "may",
219
+ "may",
220
+ "may",
221
+ "may"
222
+ ],
223
+ "__regcall3__chessintr_v32acc64_add32_conf_v32acc64_v32acc64___sint_uint1_t_uint1_t": [
224
+ "may",
225
+ "may",
226
+ "may",
227
+ "may",
228
+ "may"
229
+ ],
230
+ "__regcall3__chessintr_v32acc64_mac32_conf_v32int16_v32uint16_v32acc64___sint_uint1_t_uint1_t": [
231
+ "may",
232
+ "may",
233
+ "may",
234
+ "may",
235
+ "may",
236
+ "may"
237
+ ],
238
+ "__regcall3__chessintr_v32acc64_mac32_conf_v32uint16_v32int16_v32acc64___sint_uint1_t_uint1_t": [
239
+ "may",
240
+ "may",
241
+ "may",
242
+ "may",
243
+ "may",
244
+ "may"
245
+ ],
246
+ "__regcall3__chessintr_v32acc64_mac32_conf_v32uint16_v32uint16_v32acc64___sint_uint1_t_uint1_t": [
247
+ "may",
248
+ "may",
249
+ "may",
250
+ "may",
251
+ "may",
252
+ "may"
253
+ ],
254
+ "__regcall3__chessintr_v32acc64_mul32_conf_v32int16_v32int16___sint_uint1_t": [
255
+ "may",
256
+ "may",
257
+ "may",
258
+ "may"
259
+ ],
260
+ "__regcall3__chessintr_v32acc64_undef_v32acc64": [],
261
+ "__regcall3__chessintr_v32acc64_ups_x2d_v32int16_uint6_t_uint1_t_uint1_t_uint2_t_bool": [
262
+ "may",
263
+ "may",
264
+ "may",
265
+ "may",
266
+ "may"
267
+ ],
268
+ "__regcall3__chessintr_v32acc64_ups_x2d_v32uint16_uint6_t_uint1_t_uint1_t_uint2_t_bool": [
269
+ "may",
270
+ "may",
271
+ "may",
272
+ "may",
273
+ "may"
274
+ ],
275
+ "__regcall3__chessintr_v32accfloat_add32_conf_v32accfloat_v32accfloat___sint_uint1_t_uint1_t_uint5_t": [
276
+ "may",
277
+ "may",
278
+ "may",
279
+ "may",
280
+ "may",
281
+ "may"
282
+ ],
283
+ "__regcall3__chessintr_v32accfloat_concat_cm_bm_v16accfloat_v16accfloat": [
284
+ "may",
285
+ "may"
286
+ ],
287
+ "__regcall3__chessintr_v32accfloat_ext_dh_v64accfloat": [
288
+ "may"
289
+ ],
290
+ "__regcall3__chessintr_v32accfloat_ext_dl_v64accfloat": [
291
+ "may"
292
+ ],
293
+ "__regcall3__chessintr_v32accfloat_mac32_conf_v32bfloat16_v32bfloat16_v32accfloat___sint_uint1_t_uint5_t": [
294
+ "may",
295
+ "may",
296
+ "may",
297
+ "may",
298
+ "may",
299
+ "may"
300
+ ],
301
+ "__regcall3__chessintr_v32accfloat_mul32_conf_v32bfloat16_v32bfloat16___sint_uint1_t_uint5_t": [
302
+ "may",
303
+ "may",
304
+ "may",
305
+ "may",
306
+ "may"
307
+ ],
308
+ "__regcall3__chessintr_v32accfloat_set_ch_v16accfloat": [
309
+ "may"
310
+ ],
311
+ "__regcall3__chessintr_v32accfloat_set_cl_v16accfloat": [
312
+ "may"
313
+ ],
314
+ "__regcall3__chessintr_v32accfloat_undef_v32accfloat": [],
315
+ "__regcall3__chessintr_v32accfloat_ups_to_v32accfloat_v32bfloat16": [
316
+ "may"
317
+ ],
318
+ "__regcall3__chessintr_v32accfloat_v32accfloat_v32float": [
319
+ "may"
320
+ ],
321
+ "__regcall3__chessintr_v32bfloat16_set_xh_v16bfloat16": [
322
+ "may"
323
+ ],
324
+ "__regcall3__chessintr_v32bfloat16_set_xl_v16bfloat16": [
325
+ "may"
326
+ ],
327
+ "__regcall3__chessintr_v32bfloat16_shiftx_v32bfloat16_v32bfloat16_uint6_t___uint": [
328
+ "may",
329
+ "may",
330
+ "may",
331
+ "may"
332
+ ],
333
+ "__regcall3__chessintr_v32bfloat16_srs_v32accfloat_uint4_t_uint5_t": [
334
+ "may",
335
+ "may",
336
+ "may"
337
+ ],
338
+ "__regcall3__chessintr_v32bfloat16_undef_v32bfloat16": [],
339
+ "__regcall3__chessintr_v32bfloat16_upd_xh_v32bfloat16_v16bfloat16": [
340
+ "may",
341
+ "may"
342
+ ],
343
+ "__regcall3__chessintr_v32bfloat16_upd_xl_v32bfloat16_v16bfloat16": [
344
+ "may",
345
+ "may"
346
+ ],
347
+ "__regcall3__chessintr_v32bfloat16_vadd16_v32bfloat16_v32bfloat16_uint1_t_uint1_t_uint5_t___uint___uint": [
348
+ "may",
349
+ "may",
350
+ "may",
351
+ "may",
352
+ "may",
353
+ "may"
354
+ ],
355
+ "__regcall3__chessintr_v32float_concat_y_x_v16float_v16float": [
356
+ "may",
357
+ "may"
358
+ ],
359
+ "__regcall3__chessintr_v32float_v32float_v32accfloat": [
360
+ "may"
361
+ ],
362
+ "__regcall3__chessintr_v32int16_broadcast_to_v32int16___sint": [
363
+ "may"
364
+ ],
365
+ "__regcall3__chessintr_v32int16_lsrs_v32acc32_uint6_t_uint1_t_uint1_t_uint2_t_uint4_t_bool": [
366
+ "may",
367
+ "may",
368
+ "may",
369
+ "may",
370
+ "may",
371
+ "may"
372
+ ],
373
+ "__regcall3__chessintr_v32int16_undef_v32int16": [],
374
+ "__regcall3__chessintr_v32int8_ext_xh_v64int8": [
375
+ "may"
376
+ ],
377
+ "__regcall3__chessintr_v32int8_ext_xl_v64int8": [
378
+ "may"
379
+ ],
380
+ "__regcall3__chessintr_v32uint16_broadcast_u16___uint": [
381
+ "may"
382
+ ],
383
+ "__regcall3__chessintr_v32uint16_shuffle_v32uint16_v32uint16___uint": [
384
+ "may",
385
+ "may",
386
+ "may"
387
+ ],
388
+ "__regcall3__chessintr_v32uint16_ulsrs_v32acc32_uint6_t_uint1_t_uint1_t_uint2_t_uint4_t_bool": [
389
+ "may",
390
+ "may",
391
+ "may",
392
+ "may",
393
+ "may",
394
+ "may"
395
+ ],
396
+ "__regcall3__chessintr_v32uint16_undef_v32uint16": [],
397
+ "__regcall3__chessintr_v64acc32_add64_conf_v64acc32_v64acc32___sint_uint1_t_uint1_t": [
398
+ "may",
399
+ "may",
400
+ "may",
401
+ "may",
402
+ "may"
403
+ ],
404
+ "__regcall3__chessintr_v64acc32_neg64_conf_v64acc32___sint": [
405
+ "may",
406
+ "may"
407
+ ],
408
+ "__regcall3__chessintr_v64acc32_set_dh_v32acc32": [
409
+ "may"
410
+ ],
411
+ "__regcall3__chessintr_v64acc32_set_dl_v32acc32": [
412
+ "may"
413
+ ],
414
+ "__regcall3__chessintr_v64acc32_undef_v64acc32": [],
415
+ "__regcall3__chessintr_v64accfloat_add64_conf_v64accfloat_v64accfloat___sint_uint1_t_uint1_t_uint5_t": [
416
+ "may",
417
+ "may",
418
+ "may",
419
+ "may",
420
+ "may",
421
+ "may"
422
+ ],
423
+ "__regcall3__chessintr_v64accfloat_set_dh_v32accfloat": [
424
+ "may"
425
+ ],
426
+ "__regcall3__chessintr_v64accfloat_set_dl_v32accfloat": [
427
+ "may"
428
+ ],
429
+ "__regcall3__chessintr_v64accfloat_undef_v64accfloat": [],
430
+ "__regcall3__chessintr_v64int8_set_xh_v32int8": [
431
+ "may"
432
+ ],
433
+ "__regcall3__chessintr_v64int8_set_xl_v32int8": [
434
+ "may"
435
+ ],
436
+ "__regcall3__chessintr_v64int8_shiftx_v64int8_v64int8_uint6_t___uint": [
437
+ "may",
438
+ "may",
439
+ "may",
440
+ "may"
441
+ ],
442
+ "__regcall3__chessintr_v64int8_undef_v64int8": [],
443
+ "__regcall3__chessintr_v64int8_upd_xh_v64int8_v32int8": [
444
+ "may",
445
+ "may"
446
+ ],
447
+ "__regcall3__chessintr_v64int8_upd_xl_v64int8_v32int8": [
448
+ "may",
449
+ "may"
450
+ ],
451
+ "__regcall3__chessintr_v64int8_vadd8_v64int8_v64int8_uint1_t_uint5_t_mask64_mask64": [
452
+ "may",
453
+ "may",
454
+ "may",
455
+ "may",
456
+ "may"
457
+ ],
458
+ "llvm.assume": [
459
+ "may"
460
+ ],
461
+ "llvm.chess.convert.customint.i32.s_struct.ipd.custom_type.uint2_ts.p1": [
462
+ "may",
463
+ "may",
464
+ "may",
465
+ "may",
466
+ "may",
467
+ "may",
468
+ "may"
469
+ ],
470
+ "llvm.chess.convert.customint.i32.s_struct.ipd.custom_type.uint4_ts.p1": [
471
+ "may",
472
+ "may",
473
+ "may",
474
+ "may",
475
+ "may",
476
+ "may",
477
+ "may"
478
+ ],
479
+ "llvm.chess.convert.customint.i32.s_struct.ipd.custom_type.uint5_ts.p1": [
480
+ "may",
481
+ "may",
482
+ "may",
483
+ "may",
484
+ "may",
485
+ "may",
486
+ "may"
487
+ ],
488
+ "llvm.chess.copy.p0": [
489
+ "may"
490
+ ],
491
+ "llvm.chess.init.customint.s_struct.ipd.custom_type.uint1_ts.i32.p1": [
492
+ "may",
493
+ "may",
494
+ "may",
495
+ "may",
496
+ "may",
497
+ "may",
498
+ "may"
499
+ ],
500
+ "llvm.chess.init.customint.s_struct.ipd.custom_type.uint2_ts.i32.p1": [
501
+ "may",
502
+ "may",
503
+ "may",
504
+ "may",
505
+ "may",
506
+ "may",
507
+ "may"
508
+ ],
509
+ "llvm.chess.init.customint.s_struct.ipd.custom_type.uint4_ts.i32.p1": [
510
+ "may",
511
+ "may",
512
+ "may",
513
+ "may",
514
+ "may",
515
+ "may",
516
+ "may"
517
+ ],
518
+ "llvm.chess.init.customint.s_struct.ipd.custom_type.uint5_ts.i32.p1": [
519
+ "may",
520
+ "may",
521
+ "may",
522
+ "may",
523
+ "may",
524
+ "may",
525
+ "may"
526
+ ],
527
+ "llvm.chess.init.customint.s_struct.ipd.custom_type.uint6_ts.i32.p1": [
528
+ "may",
529
+ "may",
530
+ "may",
531
+ "may",
532
+ "may",
533
+ "may",
534
+ "may"
535
+ ],
536
+ "llvm.chess.init.customint.s_struct.mask64s.i64.p1": [
537
+ "may",
538
+ "may",
539
+ "may",
540
+ "may",
541
+ "may",
542
+ "may",
543
+ "may"
544
+ ],
545
+ "llvm.chess_error": [
546
+ "may"
547
+ ],
548
+ "llvm.chess_manifest": [
549
+ "may"
550
+ ],
551
+ "llvm.ctlz.i32": [
552
+ "may",
553
+ "may"
554
+ ],
555
+ "llvm.dbg.declare": [
556
+ "may",
557
+ "may",
558
+ "may"
559
+ ],
560
+ "llvm.dbg.value": [
561
+ "may",
562
+ "may",
563
+ "may"
564
+ ],
565
+ "llvm.experimental.noalias.scope.decl": [
566
+ "may"
567
+ ],
568
+ "llvm.is.constant.i1": [
569
+ "may"
570
+ ],
571
+ "llvm.lifetime.end.p0": [
572
+ "may",
573
+ "may"
574
+ ],
575
+ "llvm.lifetime.start.p0": [
576
+ "may",
577
+ "may"
578
+ ],
579
+ "llvm.memcpy.p0.p0.i32": [
580
+ "may",
581
+ "may",
582
+ "may",
583
+ "may"
584
+ ],
585
+ "llvm.memset.p0.i32": [
586
+ "may",
587
+ "may",
588
+ "may",
589
+ "may"
590
+ ],
591
+ "llvm.noalias.decl.p0.p0.i32": [
592
+ "may",
593
+ "may",
594
+ "may"
595
+ ],
596
+ "llvm.noalias.p0.p0.p0.i32": [
597
+ "may",
598
+ "may",
599
+ "may",
600
+ "may",
601
+ "may"
602
+ ],
603
+ "llvm.write_register.s_struct.ipd.custom_type.v32acc32s": [
604
+ "may",
605
+ "may"
606
+ ],
607
+ "operator()<aie::accum<accfloat, 64U>, aie::accum<accfloat, 64U> >": [
608
+ "no",
609
+ "may",
610
+ "may"
611
+ ],
612
+ "operator()<aie::vector<int, 16U>, aie::vector<int, 16U> >": [
613
+ "no",
614
+ "may",
615
+ "may"
616
+ ],
617
+ "resize_adf_wrapper<bfloat16, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0U> >, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0U> >, 1, 0, 0>": [
618
+ "sometimes",
619
+ "sometimes",
620
+ "sometimes"
621
+ ],
622
+ "resize_bilinear<bfloat16>": [
623
+ "sometimes",
624
+ "may",
625
+ "sometimes"
626
+ ],
627
+ "run": [
628
+ "may",
629
+ "sometimes"
630
+ ],
631
+ "undef": [],
632
+ "vector_elem_ref<int, 32U>::get": [
633
+ "sometimes"
634
+ ],
635
+ "vector_elem_ref<int, 32U>::operator=": [
636
+ "sometimes",
637
+ "sometimes"
638
+ ]
639
+ }
640
+ }
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/ir/i802_wrap_resize_adf_wrapper_spec.json ADDED
@@ -0,0 +1,50 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "KernelAnalysisSpec": {
3
+ "ModulePath": "/app/vaiml_1.3_examples/camo/segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/ir/i802_wrap_resize_adf_wrapper.cpp",
4
+ "KernelSourcePath": "/usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/src/ml_adf/resize_adf_wrapper.cpp",
5
+ "SpecFile": "i802_wrap_resize_adf_wrapper_spec.json",
6
+ "ResultFile": "i802_wrap_resize_adf_wrapper_results.json",
7
+ "UseCases": [
8
+ {
9
+ "Index": 0,
10
+ "KernelFunction": "mllib_graphs::resize_adf_wrapper<bfloat16, adf::io_buffer_config<adf::extents<>>, adf::io_buffer_config<adf::extents<>>, 1, 0, 0>",
11
+ "InitializationFunction": "",
12
+ "KernelClassCtor": "",
13
+ "Instances": [
14
+ "i802",
15
+ "i803",
16
+ "i804",
17
+ "i805",
18
+ "i807",
19
+ "i808",
20
+ "i809",
21
+ "i810",
22
+ "i812",
23
+ "i813",
24
+ "i814",
25
+ "i815",
26
+ "i817",
27
+ "i818",
28
+ "i819",
29
+ "i820",
30
+ "i829",
31
+ "i830",
32
+ "i831",
33
+ "i832",
34
+ "i834",
35
+ "i835",
36
+ "i836",
37
+ "i837",
38
+ "i839",
39
+ "i840",
40
+ "i841",
41
+ "i842",
42
+ "i844",
43
+ "i845",
44
+ "i846",
45
+ "i847"
46
+ ]
47
+ }
48
+ ]
49
+ }
50
+ }
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/ir/i852_wrap_slice_adf_wrapper.cpp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ #include "/usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/src/ml_adf/slice_adf_wrapper.cpp"
2
+ template void mllib_graphs::slice_adf_wrapper<1, bfloat16, adf::io_buffer_config<adf::extents<>>, adf::io_buffer_config<adf::extents<>>>(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict,adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>>> &__restrict,const unsigned int (&)[7]);
3
+
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/ir/i852_wrap_slice_adf_wrapper_analysis.json ADDED
@@ -0,0 +1,435 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "ModuleName": "i852_wrap_slice_adf_wrapper",
3
+ "SourceFileName": "/app/vaiml_1.3_examples/camo/segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/ir/i852_wrap_slice_adf_wrapper.cpp",
4
+ "StructTypes": [
5
+ {
6
+ "Name": "struct.aie::detail::add_op",
7
+ "Size": 1
8
+ },
9
+ {
10
+ "Name": "struct.slice_hcwc8_params",
11
+ "Size": 128
12
+ },
13
+ {
14
+ "Name": "struct.ipd.custom_type.bfloat16",
15
+ "Size": 2
16
+ },
17
+ {
18
+ "Name": "struct.ipd.custom_type.addr_t",
19
+ "Size": 4
20
+ },
21
+ {
22
+ "Name": "class.aie::mask",
23
+ "Size": 8
24
+ },
25
+ {
26
+ "Name": "struct.std::__2::array",
27
+ "Size": 8
28
+ },
29
+ {
30
+ "Name": "class.aie::vector",
31
+ "Size": 64
32
+ },
33
+ {
34
+ "Name": "class.aie::detail::vector_base",
35
+ "Size": 64
36
+ },
37
+ {
38
+ "Name": "struct.v64int8",
39
+ "Size": 64
40
+ },
41
+ {
42
+ "Name": "struct.ipd.custom_type.v128int4",
43
+ "Size": 64
44
+ },
45
+ {
46
+ "Name": "struct.adf::detail::io_buffer_base",
47
+ "Size": 4
48
+ },
49
+ {
50
+ "Name": "struct.chessout___Pvoid_add_2d_byte_int___Pvoid___sint___sint_addr_t_addr_t_addr_t",
51
+ "Size": 8
52
+ },
53
+ {
54
+ "Name": "struct.ipd.custom_type.uint6_t",
55
+ "Size": 1
56
+ },
57
+ {
58
+ "Name": "struct.mask64",
59
+ "Size": 8
60
+ },
61
+ {
62
+ "Name": "struct.ipd.custom_type.v16int4",
63
+ "Size": 8
64
+ },
65
+ {
66
+ "Name": "struct.ipd.custom_type.uint1_t",
67
+ "Size": 1
68
+ },
69
+ {
70
+ "Name": "struct.ipd.custom_type.uint5_t",
71
+ "Size": 1
72
+ },
73
+ {
74
+ "Name": "struct.std::__2::array.1",
75
+ "Size": 8
76
+ },
77
+ {
78
+ "Name": "struct.me_primitive::chessout_v64int8_vadd8_v64int8_v64int8_uint1_t_uint5_t_mask64_mask64",
79
+ "Size": 72
80
+ },
81
+ {
82
+ "Name": "struct.chessout___Pvoid_add_3d_byte_int___Pvoid___sint___sint___sint_addr_t_addr_t_addr_t_addr_t_addr_t_addr_t",
83
+ "Size": 12
84
+ },
85
+ {
86
+ "Name": "struct.ipd.custom_type.tm_byte_t",
87
+ "Size": 1
88
+ },
89
+ {
90
+ "Name": "vector_base<signed char, 64U>",
91
+ "Size": 64
92
+ },
93
+ {
94
+ "Name": "mask<64U>",
95
+ "Size": 8
96
+ },
97
+ {
98
+ "Name": "vector<signed char, 64U>",
99
+ "Size": 64
100
+ },
101
+ {
102
+ "Name": "io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0U> > >",
103
+ "Size": 0
104
+ },
105
+ {
106
+ "Name": "io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0U> > >",
107
+ "Size": 0
108
+ }
109
+ ],
110
+ "Globals": [
111
+ {
112
+ "Name": "__const._ZN3aie6detail24add_sub_bits_impl_commonILj8EaLj64ELNS0_15AddSubOperationE0EE3runERKNS_6vectorIaLj64EEES7_.op",
113
+ "Size": 1,
114
+ "SoftFloat": false
115
+ }
116
+ ],
117
+ "UsesCmathStaticVars": false,
118
+ "Functions": [
119
+ {
120
+ "FunctionName": "void mllib_graphs::slice_adf_wrapper<1, bfloat16, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> >, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> > >(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> > >&, adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> > >&, unsigned int const (&) [7])",
121
+ "StackSize": 2612,
122
+ "SoftFloat": false
123
+ },
124
+ {
125
+ "FunctionName": "void setup_slice_hcwc8_params<bfloat16>(slice_hcwc8_params&, unsigned int const (&) [7])",
126
+ "StackSize": 80,
127
+ "SoftFloat": false
128
+ },
129
+ {
130
+ "FunctionName": "get_coreid()",
131
+ "StackSize": 0,
132
+ "SoftFloat": false
133
+ },
134
+ {
135
+ "FunctionName": "void slice_hcwc8<bfloat16>(bfloat16*, bfloat16*, slice_hcwc8_params&)",
136
+ "StackSize": 2462,
137
+ "SoftFloat": false
138
+ },
139
+ {
140
+ "FunctionName": "me_primitive::read_coreid_()",
141
+ "StackSize": 0,
142
+ "SoftFloat": false
143
+ },
144
+ {
145
+ "FunctionName": "bfloat16* byte_incr<bfloat16>(bfloat16*, int)",
146
+ "StackSize": 8,
147
+ "SoftFloat": false
148
+ },
149
+ {
150
+ "FunctionName": "uint64* byte_incr<uint64>(uint64*, int)",
151
+ "StackSize": 8,
152
+ "SoftFloat": false
153
+ },
154
+ {
155
+ "FunctionName": "aie::mask<64u> aie_mask_gen<64u, uint64>(uint64)",
156
+ "StackSize": 60,
157
+ "SoftFloat": false
158
+ },
159
+ {
160
+ "FunctionName": "aie::vector<signed char, 64u>::vector()",
161
+ "StackSize": 136,
162
+ "SoftFloat": false
163
+ },
164
+ {
165
+ "FunctionName": "adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> > >::data() const",
166
+ "StackSize": 4,
167
+ "SoftFloat": false
168
+ },
169
+ {
170
+ "FunctionName": "adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> > >::data() const",
171
+ "StackSize": 4,
172
+ "SoftFloat": false
173
+ },
174
+ {
175
+ "FunctionName": "uint64 maskgen<uint64, 16u>(unsigned int, unsigned int)",
176
+ "StackSize": 40,
177
+ "SoftFloat": false
178
+ },
179
+ {
180
+ "FunctionName": "auto aie::detail::add_op::operator()<aie::vector<signed char, 64u>, aie::vector<signed char, 64u> >(aie::vector<signed char, 64u>, aie::vector<signed char, 64u>) const",
181
+ "StackSize": 748,
182
+ "SoftFloat": false
183
+ },
184
+ {
185
+ "FunctionName": "add(v64int8, v64int8)",
186
+ "StackSize": 424,
187
+ "SoftFloat": false
188
+ },
189
+ {
190
+ "FunctionName": "chessEnableIf<chessIsCompatible<chessRemoveQual<addr_t>::type, addr_t>::value&&chessIsCompatible<chessRemoveQual<addr_t>::type, addr_t>::value, uint64*>::type add_3d_byte_int<uint64, addr_t, addr_t>(uint64*, int, int, int, addr_t, addr_t, addr_t&, addr_t, addr_t, addr_t&)",
191
+ "StackSize": 52,
192
+ "SoftFloat": false
193
+ },
194
+ {
195
+ "FunctionName": "signed char AS5* add_2d_byte<signed char AS5>(signed char AS5*, int, int, addr_t&, int)",
196
+ "StackSize": 64,
197
+ "SoftFloat": false
198
+ },
199
+ {
200
+ "FunctionName": "uint64* add_3d_byte<uint64>(uint64*, int, int, addr_t&, int, int, addr_t&, int)",
201
+ "StackSize": 104,
202
+ "SoftFloat": false
203
+ },
204
+ {
205
+ "FunctionName": "signed char AS6* byte_incr<signed char AS6>(signed char AS6*, int)",
206
+ "StackSize": 8,
207
+ "SoftFloat": false
208
+ },
209
+ {
210
+ "FunctionName": "aie::mask<64u> aie::mask<64u>::from_uint64<>(uint64)",
211
+ "StackSize": 44,
212
+ "SoftFloat": false
213
+ },
214
+ {
215
+ "FunctionName": "aie::mask<64u>::mask(bool)",
216
+ "StackSize": 21,
217
+ "SoftFloat": false
218
+ },
219
+ {
220
+ "FunctionName": "void aie::mask<64u>::init_from_words64<0u>(uint64)",
221
+ "StackSize": 28,
222
+ "SoftFloat": false
223
+ },
224
+ {
225
+ "FunctionName": "std::__2::array<unsigned int, 2u>::operator[](unsigned int)",
226
+ "StackSize": 8,
227
+ "SoftFloat": false
228
+ },
229
+ {
230
+ "FunctionName": "std::__2::array<unsigned int, 2u>::operator[](unsigned int) const",
231
+ "StackSize": 8,
232
+ "SoftFloat": false
233
+ },
234
+ {
235
+ "FunctionName": "aie::detail::vector_base<signed char, 64u>::vector_base()",
236
+ "StackSize": 132,
237
+ "SoftFloat": false
238
+ },
239
+ {
240
+ "FunctionName": "aie::detail::vector_storage<signed char, 64u>::undef()",
241
+ "StackSize": 128,
242
+ "SoftFloat": false
243
+ },
244
+ {
245
+ "FunctionName": "undef_v64int8()",
246
+ "StackSize": 64,
247
+ "SoftFloat": false
248
+ },
249
+ {
250
+ "FunctionName": "auto aie::detail::load_vector<64u, (aie_dm_resource)0, signed char AS5>(signed char AS5 const*)",
251
+ "StackSize": 272,
252
+ "SoftFloat": false
253
+ },
254
+ {
255
+ "FunctionName": "aie::detail::load_vector_helper<signed char AS5, 64u, (aie_dm_resource)0>::run(signed char const AS5*)",
256
+ "StackSize": 204,
257
+ "SoftFloat": false
258
+ },
259
+ {
260
+ "FunctionName": "chessEnableIf<chessIsCompatible<chessRemoveQual<addr_t>::type, addr_t>::value, signed char AS5*>::type add_2d_byte_int<signed char AS5, addr_t>(signed char AS5*, int, int, addr_t, addr_t, addr_t&)",
261
+ "StackSize": 32,
262
+ "SoftFloat": false
263
+ },
264
+ {
265
+ "FunctionName": "addr_t::addr_t(int)",
266
+ "StackSize": 8,
267
+ "SoftFloat": false
268
+ },
269
+ {
270
+ "FunctionName": "aie::detail::shuffle_down_bits<8u, signed char, 64u>::run(aie::vector<signed char, 64u> const&, unsigned int)",
271
+ "StackSize": 1062,
272
+ "SoftFloat": false
273
+ },
274
+ {
275
+ "FunctionName": "aie::detail::shuffle_down_bits_impl<8u, signed char, 64u>::run(aie::vector<signed char, 64u> const&, unsigned int)",
276
+ "StackSize": 990,
277
+ "SoftFloat": false
278
+ },
279
+ {
280
+ "FunctionName": "shift_bytes(v64int8, v64int8, unsigned int)",
281
+ "StackSize": 594,
282
+ "SoftFloat": false
283
+ },
284
+ {
285
+ "FunctionName": "aie::vector<signed char, 64u>::operator v64int8() const",
286
+ "StackSize": 140,
287
+ "SoftFloat": false
288
+ },
289
+ {
290
+ "FunctionName": "aie::vector<signed char, 64u>::vector(v64int8)",
291
+ "StackSize": 136,
292
+ "SoftFloat": false
293
+ },
294
+ {
295
+ "FunctionName": "shiftx(v64int8, v64int8, int, unsigned int)",
296
+ "StackSize": 398,
297
+ "SoftFloat": false
298
+ },
299
+ {
300
+ "FunctionName": "me_primitive::shiftx(v64int8, v64int8, uint6_t, unsigned int)",
301
+ "StackSize": 197,
302
+ "SoftFloat": false
303
+ },
304
+ {
305
+ "FunctionName": "uint6_t::uint6_t(int)",
306
+ "StackSize": 8,
307
+ "SoftFloat": false
308
+ },
309
+ {
310
+ "FunctionName": "aie::vector<signed char, 64u>::to_native() const",
311
+ "StackSize": 72,
312
+ "SoftFloat": false
313
+ },
314
+ {
315
+ "FunctionName": "aie::detail::vector_base<signed char, 64u>::vector_base(v64int8)",
316
+ "StackSize": 68,
317
+ "SoftFloat": false
318
+ },
319
+ {
320
+ "FunctionName": "aie::detail::shuffle_up_bits<8u, signed char, 64u>::run(aie::vector<signed char, 64u> const&, unsigned int)",
321
+ "StackSize": 1278,
322
+ "SoftFloat": false
323
+ },
324
+ {
325
+ "FunctionName": "aie::detail::shuffle_up_bits_impl<8u, signed char, 64u>::run(aie::vector<signed char, 64u> const&, unsigned int)",
326
+ "StackSize": 1206,
327
+ "SoftFloat": false
328
+ },
329
+ {
330
+ "FunctionName": "aie::detail::shuffle_up_fill_bits_impl<8u, signed char, 64u>::run(aie::vector<signed char, 64u> const&, aie::vector<signed char, 64u> const&, unsigned int)",
331
+ "StackSize": 1070,
332
+ "SoftFloat": false
333
+ },
334
+ {
335
+ "FunctionName": "aie::detail::shuffle_down_fill_bits_impl<8u, signed char, 64u>::run(aie::vector<signed char, 64u> const&, aie::vector<signed char, 64u> const&, unsigned int)",
336
+ "StackSize": 994,
337
+ "SoftFloat": false
338
+ },
339
+ {
340
+ "FunctionName": "aie::mask<64u>::operator==(aie::mask<64u> const&) const",
341
+ "StackSize": 21,
342
+ "SoftFloat": false
343
+ },
344
+ {
345
+ "FunctionName": "aie::detail::select_bits<8u, signed char, 64u>::run(signed char const&, aie::vector<signed char, 64u> const&, aie::mask<64u> const&)",
346
+ "StackSize": 916,
347
+ "SoftFloat": false
348
+ },
349
+ {
350
+ "FunctionName": "aie::detail::select_bits_impl<8u, signed char, 64u>::run(signed char const&, aie::vector<signed char, 64u> const&, aie::mask<64u> const&)",
351
+ "StackSize": 840,
352
+ "SoftFloat": false
353
+ },
354
+ {
355
+ "FunctionName": "aie::detail::select_bits_impl<8u, signed char, 64u>::run(aie::vector<signed char, 64u> const&, aie::vector<signed char, 64u> const&, aie::mask<64u> const&)",
356
+ "StackSize": 700,
357
+ "SoftFloat": false
358
+ },
359
+ {
360
+ "FunctionName": "aie::detail::broadcast_bits<8u, signed char, 64u>::run(signed char const&)",
361
+ "StackSize": 404,
362
+ "SoftFloat": false
363
+ },
364
+ {
365
+ "FunctionName": "sel(v64int8, v64int8, uint64)",
366
+ "StackSize": 432,
367
+ "SoftFloat": false
368
+ },
369
+ {
370
+ "FunctionName": "aie::mask<64u>::to_uint64(unsigned int) const",
371
+ "StackSize": 24,
372
+ "SoftFloat": false
373
+ },
374
+ {
375
+ "FunctionName": "chessEnableIf<chessIsCompatible<chessRemoveQual<mask64>::type, mask64>::value, v64int8>::type me_primitive::vadd8<mask64>(v64int8, v64int8, uint1_t, uint5_t, mask64, mask64&)",
376
+ "StackSize": 214,
377
+ "SoftFloat": false
378
+ },
379
+ {
380
+ "FunctionName": "uint1_t::uint1_t(int)",
381
+ "StackSize": 8,
382
+ "SoftFloat": false
383
+ },
384
+ {
385
+ "FunctionName": "uint5_t::uint5_t(int)",
386
+ "StackSize": 8,
387
+ "SoftFloat": false
388
+ },
389
+ {
390
+ "FunctionName": "mask64::mask64(uint64)",
391
+ "StackSize": 12,
392
+ "SoftFloat": false
393
+ },
394
+ {
395
+ "FunctionName": "std::__2::array<uint64, 1u>::operator[](unsigned int) const",
396
+ "StackSize": 8,
397
+ "SoftFloat": false
398
+ },
399
+ {
400
+ "FunctionName": "aie::detail::broadcast_bits_common_impl<8u, signed char, 64u>::run(signed char const&)",
401
+ "StackSize": 336,
402
+ "SoftFloat": false
403
+ },
404
+ {
405
+ "FunctionName": "aie::detail::(anonymous namespace)::native_broadcast<8u, signed char, 64u>::run(signed char)",
406
+ "StackSize": 133,
407
+ "SoftFloat": false
408
+ },
409
+ {
410
+ "FunctionName": "broadcast_to_v64int8(int)",
411
+ "StackSize": 68,
412
+ "SoftFloat": false
413
+ },
414
+ {
415
+ "FunctionName": "aie::detail::add_sub_bits<8u, signed char, 64u, (aie::detail::AddSubOperation)0>::run(aie::vector<signed char, 64u> const&, aie::vector<signed char, 64u> const&)",
416
+ "StackSize": 1021,
417
+ "SoftFloat": false
418
+ },
419
+ {
420
+ "FunctionName": "aie::detail::add_sub_bits_impl_common<8u, signed char, 64u, (aie::detail::AddSubOperation)0>::run(aie::vector<signed char, 64u> const&, aie::vector<signed char, 64u> const&)",
421
+ "StackSize": 949,
422
+ "SoftFloat": false
423
+ },
424
+ {
425
+ "FunctionName": "signed char AS6* aie::detail::store_vector<64u, (aie_dm_resource)0, signed char AS6, signed char>(signed char AS6*, aie::vector<signed char, 64u> const&)",
426
+ "StackSize": 32,
427
+ "SoftFloat": false
428
+ },
429
+ {
430
+ "FunctionName": "aie::detail::store_vector_helper<signed char AS6, 64u, (aie_dm_resource)0>::run(signed char AS6*, aie::vector<signed char, 64u> const&)",
431
+ "StackSize": 24,
432
+ "SoftFloat": false
433
+ }
434
+ ]
435
+ }
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/ir/i852_wrap_slice_adf_wrapper_dependence_guidance.json ADDED
@@ -0,0 +1,403 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "DependenceAnalysisHints": [
3
+ {
4
+ "FunctionName": "void mllib_graphs::slice_adf_wrapper<1, bfloat16, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> >, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> > >(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> > >&, adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> > >&, unsigned int const (&) [7])",
5
+ "Var1": "lp.addr",
6
+ "ArgIndex1": "1",
7
+ "Var2": "arrayidx",
8
+ "ArgIndex2": "NotArgIndex"
9
+ },
10
+ {
11
+ "FunctionName": "void mllib_graphs::slice_adf_wrapper<1, bfloat16, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> >, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> > >(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> > >&, adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> > >&, unsigned int const (&) [7])",
12
+ "Var1": "lp.addr",
13
+ "ArgIndex1": "1",
14
+ "Var2": "arrayidx1",
15
+ "ArgIndex2": "NotArgIndex"
16
+ },
17
+ {
18
+ "FunctionName": "void setup_slice_hcwc8_params<bfloat16>(slice_hcwc8_params&, unsigned int const (&) [7])",
19
+ "Var1": "lp.addr",
20
+ "ArgIndex1": "0",
21
+ "Var2": "arrayidx",
22
+ "ArgIndex2": "NotArgIndex"
23
+ },
24
+ {
25
+ "FunctionName": "void setup_slice_hcwc8_params<bfloat16>(slice_hcwc8_params&, unsigned int const (&) [7])",
26
+ "Var1": "lp.addr",
27
+ "ArgIndex1": "0",
28
+ "Var2": "arrayidx1",
29
+ "ArgIndex2": "NotArgIndex"
30
+ },
31
+ {
32
+ "FunctionName": "void setup_slice_hcwc8_params<bfloat16>(slice_hcwc8_params&, unsigned int const (&) [7])",
33
+ "Var1": "lp.addr",
34
+ "ArgIndex1": "0",
35
+ "Var2": "arrayidx2",
36
+ "ArgIndex2": "NotArgIndex"
37
+ },
38
+ {
39
+ "FunctionName": "void setup_slice_hcwc8_params<bfloat16>(slice_hcwc8_params&, unsigned int const (&) [7])",
40
+ "Var1": "lp.addr",
41
+ "ArgIndex1": "0",
42
+ "Var2": "arrayidx3",
43
+ "ArgIndex2": "NotArgIndex"
44
+ },
45
+ {
46
+ "FunctionName": "void setup_slice_hcwc8_params<bfloat16>(slice_hcwc8_params&, unsigned int const (&) [7])",
47
+ "Var1": "lp.addr",
48
+ "ArgIndex1": "0",
49
+ "Var2": "arrayidx4",
50
+ "ArgIndex2": "NotArgIndex"
51
+ },
52
+ {
53
+ "FunctionName": "void setup_slice_hcwc8_params<bfloat16>(slice_hcwc8_params&, unsigned int const (&) [7])",
54
+ "Var1": "params.addr",
55
+ "ArgIndex1": "0",
56
+ "Var2": "dim_sv_c7",
57
+ "ArgIndex2": "NotArgIndex"
58
+ },
59
+ {
60
+ "FunctionName": "void setup_slice_hcwc8_params<bfloat16>(slice_hcwc8_params&, unsigned int const (&) [7])",
61
+ "Var1": "params.addr",
62
+ "ArgIndex1": "0",
63
+ "Var2": "dim_sv_c8",
64
+ "ArgIndex2": "NotArgIndex"
65
+ },
66
+ {
67
+ "FunctionName": "void setup_slice_hcwc8_params<bfloat16>(slice_hcwc8_params&, unsigned int const (&) [7])",
68
+ "Var1": "params.addr",
69
+ "ArgIndex1": "0",
70
+ "Var2": "dim_sv_c9",
71
+ "ArgIndex2": "NotArgIndex"
72
+ },
73
+ {
74
+ "FunctionName": "void setup_slice_hcwc8_params<bfloat16>(slice_hcwc8_params&, unsigned int const (&) [7])",
75
+ "Var1": "params.addr",
76
+ "ArgIndex1": "0",
77
+ "Var2": "sz_p025",
78
+ "ArgIndex2": "NotArgIndex"
79
+ },
80
+ {
81
+ "FunctionName": "void setup_slice_hcwc8_params<bfloat16>(slice_hcwc8_params&, unsigned int const (&) [7])",
82
+ "Var1": "params.addr",
83
+ "ArgIndex1": "0",
84
+ "Var2": "inc_p035",
85
+ "ArgIndex2": "NotArgIndex"
86
+ },
87
+ {
88
+ "FunctionName": "void setup_slice_hcwc8_params<bfloat16>(slice_hcwc8_params&, unsigned int const (&) [7])",
89
+ "Var1": "params.addr",
90
+ "ArgIndex1": "0",
91
+ "Var2": "sz_p036",
92
+ "ArgIndex2": "NotArgIndex"
93
+ },
94
+ {
95
+ "FunctionName": "void setup_slice_hcwc8_params<bfloat16>(slice_hcwc8_params&, unsigned int const (&) [7])",
96
+ "Var1": "params.addr",
97
+ "ArgIndex1": "0",
98
+ "Var2": "off_p037",
99
+ "ArgIndex2": "NotArgIndex"
100
+ },
101
+ {
102
+ "FunctionName": "void setup_slice_hcwc8_params<bfloat16>(slice_hcwc8_params&, unsigned int const (&) [7])",
103
+ "Var1": "params.addr",
104
+ "ArgIndex1": "0",
105
+ "Var2": "ini_p038",
106
+ "ArgIndex2": "NotArgIndex"
107
+ },
108
+ {
109
+ "FunctionName": "void setup_slice_hcwc8_params<bfloat16>(slice_hcwc8_params&, unsigned int const (&) [7])",
110
+ "Var1": "params.addr",
111
+ "ArgIndex1": "0",
112
+ "Var2": "sz2_p_m_final64",
113
+ "ArgIndex2": "NotArgIndex"
114
+ },
115
+ {
116
+ "FunctionName": "void setup_slice_hcwc8_params<bfloat16>(slice_hcwc8_params&, unsigned int const (&) [7])",
117
+ "Var1": "params.addr",
118
+ "ArgIndex1": "0",
119
+ "Var2": "inc2_p_m_final66",
120
+ "ArgIndex2": "NotArgIndex"
121
+ },
122
+ {
123
+ "FunctionName": "void setup_slice_hcwc8_params<bfloat16>(slice_hcwc8_params&, unsigned int const (&) [7])",
124
+ "Var1": "params.addr",
125
+ "ArgIndex1": "0",
126
+ "Var2": "ofm_offset68",
127
+ "ArgIndex2": "NotArgIndex"
128
+ },
129
+ {
130
+ "FunctionName": "void slice_hcwc8<bfloat16>(bfloat16*, bfloat16*, slice_hcwc8_params&)",
131
+ "Var1": "params.addr",
132
+ "ArgIndex1": "1",
133
+ "Var2": "ofm_offset",
134
+ "ArgIndex2": "0"
135
+ },
136
+ {
137
+ "FunctionName": "void slice_hcwc8<bfloat16>(bfloat16*, bfloat16*, slice_hcwc8_params&)",
138
+ "Var1": "params.addr",
139
+ "ArgIndex1": "1",
140
+ "Var2": "cd8_advance",
141
+ "ArgIndex2": "NotArgIndex"
142
+ },
143
+ {
144
+ "FunctionName": "void slice_hcwc8<bfloat16>(bfloat16*, bfloat16*, slice_hcwc8_params&)",
145
+ "Var1": "params.addr",
146
+ "ArgIndex1": "1",
147
+ "Var2": "m_final0",
148
+ "ArgIndex2": "NotArgIndex"
149
+ },
150
+ {
151
+ "FunctionName": "void slice_hcwc8<bfloat16>(bfloat16*, bfloat16*, slice_hcwc8_params&)",
152
+ "Var1": "params.addr",
153
+ "ArgIndex1": "1",
154
+ "Var2": "m_final1",
155
+ "ArgIndex2": "NotArgIndex"
156
+ },
157
+ {
158
+ "FunctionName": "void slice_hcwc8<bfloat16>(bfloat16*, bfloat16*, slice_hcwc8_params&)",
159
+ "Var1": "params.addr",
160
+ "ArgIndex1": "1",
161
+ "Var2": "ofm_offset2",
162
+ "ArgIndex2": "0"
163
+ },
164
+ {
165
+ "FunctionName": "void slice_hcwc8<bfloat16>(bfloat16*, bfloat16*, slice_hcwc8_params&)",
166
+ "Var1": "params.addr",
167
+ "ArgIndex1": "1",
168
+ "Var2": "ini_p0",
169
+ "ArgIndex2": "NotArgIndex"
170
+ },
171
+ {
172
+ "FunctionName": "void slice_hcwc8<bfloat16>(bfloat16*, bfloat16*, slice_hcwc8_params&)",
173
+ "Var1": "params.addr",
174
+ "ArgIndex1": "1",
175
+ "Var2": "ini_p1",
176
+ "ArgIndex2": "NotArgIndex"
177
+ },
178
+ {
179
+ "FunctionName": "void slice_hcwc8<bfloat16>(bfloat16*, bfloat16*, slice_hcwc8_params&)",
180
+ "Var1": "params.addr",
181
+ "ArgIndex1": "1",
182
+ "Var2": "m06",
183
+ "ArgIndex2": "NotArgIndex"
184
+ },
185
+ {
186
+ "FunctionName": "void slice_hcwc8<bfloat16>(bfloat16*, bfloat16*, slice_hcwc8_params&)",
187
+ "Var1": "params.addr",
188
+ "ArgIndex1": "1",
189
+ "Var2": "m18",
190
+ "ArgIndex2": "NotArgIndex"
191
+ },
192
+ {
193
+ "FunctionName": "void slice_hcwc8<bfloat16>(bfloat16*, bfloat16*, slice_hcwc8_params&)",
194
+ "Var1": "params.addr",
195
+ "ArgIndex1": "1",
196
+ "Var2": "main_loop_cnt",
197
+ "ArgIndex2": "NotArgIndex"
198
+ },
199
+ {
200
+ "FunctionName": "void slice_hcwc8<bfloat16>(bfloat16*, bfloat16*, slice_hcwc8_params&)",
201
+ "Var1": "tmp",
202
+ "ArgIndex1": "NotArgIndex",
203
+ "Var2": "v0",
204
+ "ArgIndex2": "NotArgIndex"
205
+ },
206
+ {
207
+ "FunctionName": "void slice_hcwc8<bfloat16>(bfloat16*, bfloat16*, slice_hcwc8_params&)",
208
+ "Var1": "params.addr",
209
+ "ArgIndex1": "1",
210
+ "Var2": "off_p0",
211
+ "ArgIndex2": "NotArgIndex"
212
+ },
213
+ {
214
+ "FunctionName": "void slice_hcwc8<bfloat16>(bfloat16*, bfloat16*, slice_hcwc8_params&)",
215
+ "Var1": "params.addr",
216
+ "ArgIndex1": "1",
217
+ "Var2": "sz_p0",
218
+ "ArgIndex2": "NotArgIndex"
219
+ },
220
+ {
221
+ "FunctionName": "void slice_hcwc8<bfloat16>(bfloat16*, bfloat16*, slice_hcwc8_params&)",
222
+ "Var1": "params.addr",
223
+ "ArgIndex1": "1",
224
+ "Var2": "inc_p0",
225
+ "ArgIndex2": "NotArgIndex"
226
+ },
227
+ {
228
+ "FunctionName": "void slice_hcwc8<bfloat16>(bfloat16*, bfloat16*, slice_hcwc8_params&)",
229
+ "Var1": "tmp17",
230
+ "ArgIndex1": "NotArgIndex",
231
+ "Var2": "v1",
232
+ "ArgIndex2": "NotArgIndex"
233
+ },
234
+ {
235
+ "FunctionName": "void slice_hcwc8<bfloat16>(bfloat16*, bfloat16*, slice_hcwc8_params&)",
236
+ "Var1": "params.addr",
237
+ "ArgIndex1": "1",
238
+ "Var2": "off_p1",
239
+ "ArgIndex2": "NotArgIndex"
240
+ },
241
+ {
242
+ "FunctionName": "void slice_hcwc8<bfloat16>(bfloat16*, bfloat16*, slice_hcwc8_params&)",
243
+ "Var1": "params.addr",
244
+ "ArgIndex1": "1",
245
+ "Var2": "sz_p1",
246
+ "ArgIndex2": "NotArgIndex"
247
+ },
248
+ {
249
+ "FunctionName": "void slice_hcwc8<bfloat16>(bfloat16*, bfloat16*, slice_hcwc8_params&)",
250
+ "Var1": "params.addr",
251
+ "ArgIndex1": "1",
252
+ "Var2": "inc_p1",
253
+ "ArgIndex2": "NotArgIndex"
254
+ },
255
+ {
256
+ "FunctionName": "void slice_hcwc8<bfloat16>(bfloat16*, bfloat16*, slice_hcwc8_params&)",
257
+ "Var1": "params.addr",
258
+ "ArgIndex1": "1",
259
+ "Var2": "p0_down_shuffle",
260
+ "ArgIndex2": "NotArgIndex"
261
+ },
262
+ {
263
+ "FunctionName": "void slice_hcwc8<bfloat16>(bfloat16*, bfloat16*, slice_hcwc8_params&)",
264
+ "Var1": "tmp20",
265
+ "ArgIndex1": "NotArgIndex",
266
+ "Var2": "v0_s",
267
+ "ArgIndex2": "NotArgIndex"
268
+ },
269
+ {
270
+ "FunctionName": "void slice_hcwc8<bfloat16>(bfloat16*, bfloat16*, slice_hcwc8_params&)",
271
+ "Var1": "params.addr",
272
+ "ArgIndex1": "1",
273
+ "Var2": "p1_up_shuffle",
274
+ "ArgIndex2": "NotArgIndex"
275
+ },
276
+ {
277
+ "FunctionName": "void slice_hcwc8<bfloat16>(bfloat16*, bfloat16*, slice_hcwc8_params&)",
278
+ "Var1": "tmp22",
279
+ "ArgIndex1": "NotArgIndex",
280
+ "Var2": "v1_s",
281
+ "ArgIndex2": "NotArgIndex"
282
+ },
283
+ {
284
+ "FunctionName": "void slice_hcwc8<bfloat16>(bfloat16*, bfloat16*, slice_hcwc8_params&)",
285
+ "Var1": "tmp24",
286
+ "ArgIndex1": "NotArgIndex",
287
+ "Var2": "v0_m",
288
+ "ArgIndex2": "NotArgIndex"
289
+ },
290
+ {
291
+ "FunctionName": "void slice_hcwc8<bfloat16>(bfloat16*, bfloat16*, slice_hcwc8_params&)",
292
+ "Var1": "tmp26",
293
+ "ArgIndex1": "NotArgIndex",
294
+ "Var2": "v1_m",
295
+ "ArgIndex2": "NotArgIndex"
296
+ },
297
+ {
298
+ "FunctionName": "void slice_hcwc8<bfloat16>(bfloat16*, bfloat16*, slice_hcwc8_params&)",
299
+ "Var1": "tmp28",
300
+ "ArgIndex1": "NotArgIndex",
301
+ "Var2": "vadd",
302
+ "ArgIndex2": "NotArgIndex"
303
+ },
304
+ {
305
+ "FunctionName": "void slice_hcwc8<bfloat16>(bfloat16*, bfloat16*, slice_hcwc8_params&)",
306
+ "Var1": "params.addr",
307
+ "ArgIndex1": "1",
308
+ "Var2": "off_p_m_final",
309
+ "ArgIndex2": "NotArgIndex"
310
+ },
311
+ {
312
+ "FunctionName": "void slice_hcwc8<bfloat16>(bfloat16*, bfloat16*, slice_hcwc8_params&)",
313
+ "Var1": "params.addr",
314
+ "ArgIndex1": "1",
315
+ "Var2": "sz1_p_m_final",
316
+ "ArgIndex2": "NotArgIndex"
317
+ },
318
+ {
319
+ "FunctionName": "void slice_hcwc8<bfloat16>(bfloat16*, bfloat16*, slice_hcwc8_params&)",
320
+ "Var1": "params.addr",
321
+ "ArgIndex1": "1",
322
+ "Var2": "inc1_p_m_final",
323
+ "ArgIndex2": "NotArgIndex"
324
+ },
325
+ {
326
+ "FunctionName": "void slice_hcwc8<bfloat16>(bfloat16*, bfloat16*, slice_hcwc8_params&)",
327
+ "Var1": "params.addr",
328
+ "ArgIndex1": "1",
329
+ "Var2": "sz2_p_m_final",
330
+ "ArgIndex2": "NotArgIndex"
331
+ },
332
+ {
333
+ "FunctionName": "void slice_hcwc8<bfloat16>(bfloat16*, bfloat16*, slice_hcwc8_params&)",
334
+ "Var1": "params.addr",
335
+ "ArgIndex1": "1",
336
+ "Var2": "inc2_p_m_final",
337
+ "ArgIndex2": "NotArgIndex"
338
+ },
339
+ {
340
+ "FunctionName": "void slice_hcwc8<bfloat16>(bfloat16*, bfloat16*, slice_hcwc8_params&)",
341
+ "Var1": "tmp32",
342
+ "ArgIndex1": "NotArgIndex",
343
+ "Var2": "vadd_m",
344
+ "ArgIndex2": "NotArgIndex"
345
+ },
346
+ {
347
+ "FunctionName": "uint64* add_3d_byte<uint64>(uint64*, int, int, addr_t&, int, int, addr_t&, int)",
348
+ "Var1": "c2",
349
+ "ArgIndex1": "NotArgIndex",
350
+ "Var2": "c",
351
+ "ArgIndex2": "NotArgIndex"
352
+ },
353
+ {
354
+ "FunctionName": "aie::detail::shuffle_down_bits_impl<8u, signed char, 64u>::run(aie::vector<signed char, 64u> const&, unsigned int)",
355
+ "Var1": "tmp",
356
+ "ArgIndex1": "NotArgIndex",
357
+ "Var2": "ret",
358
+ "ArgIndex2": "NotArgIndex"
359
+ },
360
+ {
361
+ "FunctionName": "aie::detail::shuffle_down_bits_impl<8u, signed char, 64u>::run(aie::vector<signed char, 64u> const&, unsigned int)",
362
+ "Var1": "ret",
363
+ "ArgIndex1": "NotArgIndex",
364
+ "Var2": "retval",
365
+ "ArgIndex2": "0"
366
+ },
367
+ {
368
+ "FunctionName": "_ZNK3aie6detail11vector_baseIaLj64EE9to_nativeEvQleclL_ZNS0_11vector_base4bitsEvEELi1024E",
369
+ "Var1": "this.addr",
370
+ "ArgIndex1": "0",
371
+ "Var2": "data",
372
+ "ArgIndex2": "NotArgIndex"
373
+ },
374
+ {
375
+ "FunctionName": "aie::detail::vector_base<signed char, 64u>::vector_base(v64int8)",
376
+ "Var1": "data",
377
+ "ArgIndex1": "NotArgIndex",
378
+ "Var2": "data2",
379
+ "ArgIndex2": "NotArgIndex"
380
+ },
381
+ {
382
+ "FunctionName": "aie::detail::shuffle_down_fill_bits_impl<8u, signed char, 64u>::run(aie::vector<signed char, 64u> const&, aie::vector<signed char, 64u> const&, unsigned int)",
383
+ "Var1": "tmp",
384
+ "ArgIndex1": "NotArgIndex",
385
+ "Var2": "ret",
386
+ "ArgIndex2": "NotArgIndex"
387
+ },
388
+ {
389
+ "FunctionName": "aie::detail::shuffle_down_fill_bits_impl<8u, signed char, 64u>::run(aie::vector<signed char, 64u> const&, aie::vector<signed char, 64u> const&, unsigned int)",
390
+ "Var1": "ret",
391
+ "ArgIndex1": "NotArgIndex",
392
+ "Var2": "retval",
393
+ "ArgIndex2": "0"
394
+ },
395
+ {
396
+ "FunctionName": "_ZNK3aie6detail11vector_baseIaLj64EE5storeIL15aie_dm_resource0EU3AS6aQsr3stdE9is_same_vIN22aie_dm_resource_removeITL0_0_E4typeET_EEEvPT0_",
397
+ "Var1": "this.addr",
398
+ "ArgIndex1": "0",
399
+ "Var2": "data",
400
+ "ArgIndex2": "NotArgIndex"
401
+ }
402
+ ]
403
+ }
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/ir/i852_wrap_slice_adf_wrapper_results.json ADDED
@@ -0,0 +1,331 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "ModulePath": "/app/vaiml_1.3_examples/camo/segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/ir/i852_wrap_slice_adf_wrapper.cpp",
3
+ "KernelSourcePath": "/usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/src/ml_adf/slice_adf_wrapper.cpp",
4
+ "UseCases": [
5
+ {
6
+ "Index": 0,
7
+ "KernelFunction": "mllib_graphs::slice_adf_wrapper<1, bfloat16, adf::io_buffer_config<adf::extents<>>, adf::io_buffer_config<adf::extents<>>>",
8
+ "InitializationFunction": "",
9
+ "KernelClassCtor": "",
10
+ "Instances": [
11
+ "i852",
12
+ "i853",
13
+ "i854",
14
+ "i855",
15
+ "i857",
16
+ "i858",
17
+ "i859",
18
+ "i860",
19
+ "i862",
20
+ "i863",
21
+ "i864",
22
+ "i865",
23
+ "i867",
24
+ "i868",
25
+ "i869",
26
+ "i870",
27
+ "i874",
28
+ "i875",
29
+ "i876",
30
+ "i877",
31
+ "i879",
32
+ "i880",
33
+ "i881",
34
+ "i882",
35
+ "i884",
36
+ "i885",
37
+ "i886",
38
+ "i887",
39
+ "i889",
40
+ "i890",
41
+ "i891",
42
+ "i892",
43
+ "i919",
44
+ "i920",
45
+ "i921",
46
+ "i922",
47
+ "i924",
48
+ "i925",
49
+ "i926",
50
+ "i927",
51
+ "i929",
52
+ "i930",
53
+ "i931",
54
+ "i932",
55
+ "i934",
56
+ "i935",
57
+ "i936",
58
+ "i937",
59
+ "i941",
60
+ "i942",
61
+ "i943",
62
+ "i944",
63
+ "i946",
64
+ "i947",
65
+ "i948",
66
+ "i949",
67
+ "i951",
68
+ "i952",
69
+ "i953",
70
+ "i954",
71
+ "i956",
72
+ "i957",
73
+ "i958",
74
+ "i959",
75
+ "i1057",
76
+ "i1058",
77
+ "i1059",
78
+ "i1060",
79
+ "i1062",
80
+ "i1063",
81
+ "i1064",
82
+ "i1065",
83
+ "i1067",
84
+ "i1068",
85
+ "i1069",
86
+ "i1070",
87
+ "i1072",
88
+ "i1073",
89
+ "i1074",
90
+ "i1075",
91
+ "i1079",
92
+ "i1080",
93
+ "i1081",
94
+ "i1082",
95
+ "i1084",
96
+ "i1085",
97
+ "i1086",
98
+ "i1087",
99
+ "i1089",
100
+ "i1090",
101
+ "i1091",
102
+ "i1092",
103
+ "i1094",
104
+ "i1095",
105
+ "i1096",
106
+ "i1097"
107
+ ]
108
+ }
109
+ ],
110
+ "AccessRecords": [],
111
+ "ControlRegsUsage": {
112
+ "RndRecords": {},
113
+ "SatRecords": {},
114
+ "SymSatRecords": {}
115
+ },
116
+ "ParameterLoads": {
117
+ "__regcall3__chessintr___Pvoid_add_2d_byte_int___Pvoid___sint___sint_addr_t_addr_t_addr_t": [
118
+ "may",
119
+ "may",
120
+ "may",
121
+ "may",
122
+ "may",
123
+ "may"
124
+ ],
125
+ "__regcall3__chessintr___Pvoid_add_3d_byte_int___Pvoid___sint___sint___sint_addr_t_addr_t_addr_t_addr_t_addr_t_addr_t": [
126
+ "may",
127
+ "may",
128
+ "may",
129
+ "may",
130
+ "may",
131
+ "may",
132
+ "may",
133
+ "may",
134
+ "may",
135
+ "may"
136
+ ],
137
+ "__regcall3__chessintr___Pvoid_byte_incr___Pvoid___sint": [
138
+ "may",
139
+ "may"
140
+ ],
141
+ "__regcall3__chessintr___sint_read_coreid_": [],
142
+ "__regcall3__chessintr_addr_t_addr_t___sint": [
143
+ "may"
144
+ ],
145
+ "__regcall3__chessintr_mask64_mask64___ulonglong": [
146
+ "may"
147
+ ],
148
+ "__regcall3__chessintr_uint1_t_uint1_t___sint": [
149
+ "may"
150
+ ],
151
+ "__regcall3__chessintr_uint5_t_uint5_t___sint": [
152
+ "may"
153
+ ],
154
+ "__regcall3__chessintr_uint6_t_uint6_t___sint": [
155
+ "may"
156
+ ],
157
+ "__regcall3__chessintr_v64int8_broadcast_to_v64int8___sint": [
158
+ "may"
159
+ ],
160
+ "__regcall3__chessintr_v64int8_shiftx_v64int8_v64int8_uint6_t___uint": [
161
+ "may",
162
+ "may",
163
+ "may",
164
+ "may"
165
+ ],
166
+ "__regcall3__chessintr_v64int8_undef_v64int8": [],
167
+ "__regcall3__chessintr_v64int8_vadd8_v64int8_v64int8_uint1_t_uint5_t_mask64_mask64": [
168
+ "may",
169
+ "may",
170
+ "may",
171
+ "may",
172
+ "may"
173
+ ],
174
+ "add_3d_byte<uint64>": [
175
+ "may",
176
+ "may",
177
+ "may",
178
+ "sometimes",
179
+ "may",
180
+ "may",
181
+ "sometimes",
182
+ "may"
183
+ ],
184
+ "aie_mask_gen<64U, uint64>": [
185
+ "may"
186
+ ],
187
+ "llvm.assume": [
188
+ "may"
189
+ ],
190
+ "llvm.chess.copy.p5": [
191
+ "may"
192
+ ],
193
+ "llvm.chess.copy.p6": [
194
+ "may"
195
+ ],
196
+ "llvm.chess.init.customint.s_struct.ipd.custom_type.addr_ts.i32.p1": [
197
+ "may",
198
+ "may",
199
+ "may",
200
+ "may",
201
+ "may",
202
+ "may",
203
+ "may"
204
+ ],
205
+ "llvm.chess.init.customint.s_struct.ipd.custom_type.uint1_ts.i32.p1": [
206
+ "may",
207
+ "may",
208
+ "may",
209
+ "may",
210
+ "may",
211
+ "may",
212
+ "may"
213
+ ],
214
+ "llvm.chess.init.customint.s_struct.ipd.custom_type.uint5_ts.i32.p1": [
215
+ "may",
216
+ "may",
217
+ "may",
218
+ "may",
219
+ "may",
220
+ "may",
221
+ "may"
222
+ ],
223
+ "llvm.chess.init.customint.s_struct.ipd.custom_type.uint6_ts.i32.p1": [
224
+ "may",
225
+ "may",
226
+ "may",
227
+ "may",
228
+ "may",
229
+ "may",
230
+ "may"
231
+ ],
232
+ "llvm.chess.init.customint.s_struct.mask64s.i64.p1": [
233
+ "may",
234
+ "may",
235
+ "may",
236
+ "may",
237
+ "may",
238
+ "may",
239
+ "may"
240
+ ],
241
+ "llvm.chess_error": [
242
+ "may"
243
+ ],
244
+ "llvm.chess_manifest": [
245
+ "may"
246
+ ],
247
+ "llvm.dbg.declare": [
248
+ "may",
249
+ "may",
250
+ "may"
251
+ ],
252
+ "llvm.dbg.value": [
253
+ "may",
254
+ "may",
255
+ "may"
256
+ ],
257
+ "llvm.is.constant.i1": [
258
+ "may"
259
+ ],
260
+ "llvm.lifetime.end.p0": [
261
+ "may",
262
+ "may"
263
+ ],
264
+ "llvm.lifetime.start.p0": [
265
+ "may",
266
+ "may"
267
+ ],
268
+ "llvm.memcpy.p0.p0.i32": [
269
+ "may",
270
+ "may",
271
+ "may",
272
+ "may"
273
+ ],
274
+ "llvm.memset.p0.i32": [
275
+ "may",
276
+ "may",
277
+ "may",
278
+ "may"
279
+ ],
280
+ "llvm.noalias.decl.p0.p0.i32": [
281
+ "may",
282
+ "may",
283
+ "may"
284
+ ],
285
+ "llvm.noalias.p0.p0.p0.i32": [
286
+ "may",
287
+ "may",
288
+ "may",
289
+ "may",
290
+ "may"
291
+ ],
292
+ "llvm.noalias.p5.p0.p0.i32": [
293
+ "may",
294
+ "may",
295
+ "may",
296
+ "may",
297
+ "may"
298
+ ],
299
+ "llvm.noalias.p6.p0.p0.i32": [
300
+ "may",
301
+ "may",
302
+ "may",
303
+ "may",
304
+ "may"
305
+ ],
306
+ "operator()<aie::vector<signed char, 64U>, aie::vector<signed char, 64U> >": [
307
+ "no",
308
+ "may",
309
+ "may"
310
+ ],
311
+ "run": [
312
+ "sometimes",
313
+ "sometimes",
314
+ "may"
315
+ ],
316
+ "setup_slice_hcwc8_params<bfloat16>": [
317
+ "sometimes",
318
+ "sometimes"
319
+ ],
320
+ "slice_adf_wrapper<1, bfloat16, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0U> >, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0U> > >": [
321
+ "sometimes",
322
+ "sometimes",
323
+ "sometimes"
324
+ ],
325
+ "slice_hcwc8<bfloat16>": [
326
+ "may",
327
+ "may",
328
+ "sometimes"
329
+ ]
330
+ }
331
+ }
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/ir/i852_wrap_slice_adf_wrapper_spec.json ADDED
@@ -0,0 +1,114 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "KernelAnalysisSpec": {
3
+ "ModulePath": "/app/vaiml_1.3_examples/camo/segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/ir/i852_wrap_slice_adf_wrapper.cpp",
4
+ "KernelSourcePath": "/usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/src/ml_adf/slice_adf_wrapper.cpp",
5
+ "SpecFile": "i852_wrap_slice_adf_wrapper_spec.json",
6
+ "ResultFile": "i852_wrap_slice_adf_wrapper_results.json",
7
+ "UseCases": [
8
+ {
9
+ "Index": 0,
10
+ "KernelFunction": "mllib_graphs::slice_adf_wrapper<1, bfloat16, adf::io_buffer_config<adf::extents<>>, adf::io_buffer_config<adf::extents<>>>",
11
+ "InitializationFunction": "",
12
+ "KernelClassCtor": "",
13
+ "Instances": [
14
+ "i852",
15
+ "i853",
16
+ "i854",
17
+ "i855",
18
+ "i857",
19
+ "i858",
20
+ "i859",
21
+ "i860",
22
+ "i862",
23
+ "i863",
24
+ "i864",
25
+ "i865",
26
+ "i867",
27
+ "i868",
28
+ "i869",
29
+ "i870",
30
+ "i874",
31
+ "i875",
32
+ "i876",
33
+ "i877",
34
+ "i879",
35
+ "i880",
36
+ "i881",
37
+ "i882",
38
+ "i884",
39
+ "i885",
40
+ "i886",
41
+ "i887",
42
+ "i889",
43
+ "i890",
44
+ "i891",
45
+ "i892",
46
+ "i919",
47
+ "i920",
48
+ "i921",
49
+ "i922",
50
+ "i924",
51
+ "i925",
52
+ "i926",
53
+ "i927",
54
+ "i929",
55
+ "i930",
56
+ "i931",
57
+ "i932",
58
+ "i934",
59
+ "i935",
60
+ "i936",
61
+ "i937",
62
+ "i941",
63
+ "i942",
64
+ "i943",
65
+ "i944",
66
+ "i946",
67
+ "i947",
68
+ "i948",
69
+ "i949",
70
+ "i951",
71
+ "i952",
72
+ "i953",
73
+ "i954",
74
+ "i956",
75
+ "i957",
76
+ "i958",
77
+ "i959",
78
+ "i1057",
79
+ "i1058",
80
+ "i1059",
81
+ "i1060",
82
+ "i1062",
83
+ "i1063",
84
+ "i1064",
85
+ "i1065",
86
+ "i1067",
87
+ "i1068",
88
+ "i1069",
89
+ "i1070",
90
+ "i1072",
91
+ "i1073",
92
+ "i1074",
93
+ "i1075",
94
+ "i1079",
95
+ "i1080",
96
+ "i1081",
97
+ "i1082",
98
+ "i1084",
99
+ "i1085",
100
+ "i1086",
101
+ "i1087",
102
+ "i1089",
103
+ "i1090",
104
+ "i1091",
105
+ "i1092",
106
+ "i1094",
107
+ "i1095",
108
+ "i1096",
109
+ "i1097"
110
+ ]
111
+ }
112
+ ]
113
+ }
114
+ }
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/ir/i897_wrap_concat_adf_wrapper.cpp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ #include "/usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/src/ml_adf/concat_adf_wrapper.cpp"
2
+ template void mllib_graphs::concat_adf_wrapper<bfloat16, adf::io_buffer_config<adf::extents<>>, adf::io_buffer_config<adf::extents<>>, adf::io_buffer_config<adf::extents<>>>(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict,adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict,adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>>> &__restrict,const unsigned int (&)[8]);
3
+
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/ir/i897_wrap_concat_adf_wrapper_analysis.json ADDED
@@ -0,0 +1,278 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "ModuleName": "i897_wrap_concat_adf_wrapper",
3
+ "SourceFileName": "/app/vaiml_1.3_examples/camo/segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/ir/i897_wrap_concat_adf_wrapper.cpp",
4
+ "StructTypes": [
5
+ {
6
+ "Name": "struct.ipd.custom_type.bfloat16",
7
+ "Size": 2
8
+ },
9
+ {
10
+ "Name": "struct.ipd.custom_type.uint2_t",
11
+ "Size": 1
12
+ },
13
+ {
14
+ "Name": "struct.ipd.custom_type.uint4_t",
15
+ "Size": 1
16
+ },
17
+ {
18
+ "Name": "class.aie::tile",
19
+ "Size": 1
20
+ },
21
+ {
22
+ "Name": "class.aie::detail::tile",
23
+ "Size": 1
24
+ },
25
+ {
26
+ "Name": "class.aie::vector",
27
+ "Size": 64
28
+ },
29
+ {
30
+ "Name": "class.aie::detail::vector_base",
31
+ "Size": 64
32
+ },
33
+ {
34
+ "Name": "struct.v32bfloat16",
35
+ "Size": 64
36
+ },
37
+ {
38
+ "Name": "struct.ipd.custom_type.v128int4",
39
+ "Size": 64
40
+ },
41
+ {
42
+ "Name": "struct.adf::detail::io_buffer_base",
43
+ "Size": 4
44
+ },
45
+ {
46
+ "Name": "struct.v32int16",
47
+ "Size": 64
48
+ },
49
+ {
50
+ "Name": "struct.ipd.custom_type.tm_byte_t",
51
+ "Size": 1
52
+ },
53
+ {
54
+ "Name": "vector_base<bfloat16, 32U>",
55
+ "Size": 64
56
+ },
57
+ {
58
+ "Name": "io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0U> > >",
59
+ "Size": 0
60
+ },
61
+ {
62
+ "Name": "io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0U> > >",
63
+ "Size": 0
64
+ },
65
+ {
66
+ "Name": "vector<bfloat16, 32U>",
67
+ "Size": 64
68
+ },
69
+ {
70
+ "Name": "tile",
71
+ "Size": 0
72
+ }
73
+ ],
74
+ "Globals": [
75
+ {
76
+ "Name": "ns_concat::kernel_iter",
77
+ "MangledName": "_ZN9ns_concatL11kernel_iterE",
78
+ "Size": 4,
79
+ "SoftFloat": false
80
+ },
81
+ {
82
+ "Name": "ns_concat::core_id",
83
+ "MangledName": "_ZN9ns_concatL7core_idE",
84
+ "Size": 4,
85
+ "SoftFloat": false
86
+ },
87
+ {
88
+ "Name": "ns_concat::core_col",
89
+ "MangledName": "_ZN9ns_concatL8core_colE",
90
+ "Size": 4,
91
+ "SoftFloat": false
92
+ },
93
+ {
94
+ "Name": "ns_concat::core_row",
95
+ "MangledName": "_ZN9ns_concatL8core_rowE",
96
+ "Size": 4,
97
+ "SoftFloat": false
98
+ }
99
+ ],
100
+ "UsesCmathStaticVars": false,
101
+ "Functions": [
102
+ {
103
+ "FunctionName": "aie::tile::current()",
104
+ "StackSize": 11,
105
+ "SoftFloat": false
106
+ },
107
+ {
108
+ "FunctionName": "aie::tile::set_saturation(aie::saturation_mode)",
109
+ "StackSize": 29,
110
+ "SoftFloat": false
111
+ },
112
+ {
113
+ "FunctionName": "aie::tile::set_rounding(aie::rounding_mode)",
114
+ "StackSize": 29,
115
+ "SoftFloat": false
116
+ },
117
+ {
118
+ "FunctionName": "void mllib_graphs::concat_adf_wrapper<bfloat16, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> >, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> >, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> > >(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> > >&, adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> > >&, adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> > >&, unsigned int const (&) [8])",
119
+ "StackSize": 812,
120
+ "SoftFloat": false
121
+ },
122
+ {
123
+ "FunctionName": "concat_adf_init()",
124
+ "StackSize": 33,
125
+ "SoftFloat": false
126
+ },
127
+ {
128
+ "FunctionName": "bfloat16 AS6* byte_incr<bfloat16 AS6>(bfloat16 AS6*, int)",
129
+ "StackSize": 8,
130
+ "SoftFloat": false
131
+ },
132
+ {
133
+ "FunctionName": "get_coreid()",
134
+ "StackSize": 0,
135
+ "SoftFloat": false
136
+ },
137
+ {
138
+ "FunctionName": "adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> > >::data() const",
139
+ "StackSize": 4,
140
+ "SoftFloat": false
141
+ },
142
+ {
143
+ "FunctionName": "adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> > >::data() const",
144
+ "StackSize": 4,
145
+ "SoftFloat": false
146
+ },
147
+ {
148
+ "FunctionName": "bfloat16 AS5* byte_incr<bfloat16 AS5>(bfloat16 AS5*, int)",
149
+ "StackSize": 8,
150
+ "SoftFloat": false
151
+ },
152
+ {
153
+ "FunctionName": "aie::detail::tile::current()",
154
+ "StackSize": 5,
155
+ "SoftFloat": false
156
+ },
157
+ {
158
+ "FunctionName": "aie::tile::tile(aie::detail::tile const&)",
159
+ "StackSize": 8,
160
+ "SoftFloat": false
161
+ },
162
+ {
163
+ "FunctionName": "aie::detail::tile::tile()",
164
+ "StackSize": 4,
165
+ "SoftFloat": false
166
+ },
167
+ {
168
+ "FunctionName": "aie::detail::tile::set_saturation(aie::saturation_mode)",
169
+ "StackSize": 21,
170
+ "SoftFloat": false
171
+ },
172
+ {
173
+ "FunctionName": "set_satmode(unsigned int)",
174
+ "StackSize": 13,
175
+ "SoftFloat": false
176
+ },
177
+ {
178
+ "FunctionName": "uint2_t::uint2_t(unsigned int)",
179
+ "StackSize": 8,
180
+ "SoftFloat": false
181
+ },
182
+ {
183
+ "FunctionName": "aie::detail::tile::set_rounding(aie::rounding_mode)",
184
+ "StackSize": 21,
185
+ "SoftFloat": false
186
+ },
187
+ {
188
+ "FunctionName": "set_rnd(unsigned int)",
189
+ "StackSize": 13,
190
+ "SoftFloat": false
191
+ },
192
+ {
193
+ "FunctionName": "uint4_t::uint4_t(unsigned int)",
194
+ "StackSize": 8,
195
+ "SoftFloat": false
196
+ },
197
+ {
198
+ "FunctionName": "me_primitive::read_coreid_()",
199
+ "StackSize": 0,
200
+ "SoftFloat": false
201
+ },
202
+ {
203
+ "FunctionName": "aie::detail::zeros_bits<16u, bfloat16, 32u>::run()",
204
+ "StackSize": 592,
205
+ "SoftFloat": false
206
+ },
207
+ {
208
+ "FunctionName": "aie::detail::zeros_bits_common_impl<16u, bfloat16, 32u>::run()",
209
+ "StackSize": 528,
210
+ "SoftFloat": false
211
+ },
212
+ {
213
+ "FunctionName": "aie::vector<bfloat16, 32u>::vector()",
214
+ "StackSize": 136,
215
+ "SoftFloat": false
216
+ },
217
+ {
218
+ "FunctionName": "aie::detail::(anonymous namespace)::native_broadcast<16u, bfloat16, 32u>::run_zeros()",
219
+ "StackSize": 332,
220
+ "SoftFloat": false
221
+ },
222
+ {
223
+ "FunctionName": "aie::vector<bfloat16, 32u>::vector(v32bfloat16)",
224
+ "StackSize": 136,
225
+ "SoftFloat": false
226
+ },
227
+ {
228
+ "FunctionName": "aie::detail::vector_base<bfloat16, 32u>::vector_base()",
229
+ "StackSize": 132,
230
+ "SoftFloat": false
231
+ },
232
+ {
233
+ "FunctionName": "aie::detail::vector_storage<bfloat16, 32u>::undef()",
234
+ "StackSize": 128,
235
+ "SoftFloat": false
236
+ },
237
+ {
238
+ "FunctionName": "undef_v32bfloat16()",
239
+ "StackSize": 64,
240
+ "SoftFloat": false
241
+ },
242
+ {
243
+ "FunctionName": "broadcast_zero_to_v32int16()",
244
+ "StackSize": 132,
245
+ "SoftFloat": false
246
+ },
247
+ {
248
+ "FunctionName": "v32bfloat16::v32bfloat16(v32int16)",
249
+ "StackSize": 204,
250
+ "SoftFloat": false
251
+ },
252
+ {
253
+ "FunctionName": "broadcast_s16(int)",
254
+ "StackSize": 68,
255
+ "SoftFloat": false
256
+ },
257
+ {
258
+ "FunctionName": "v32bfloat16::v32bfloat16(chessllvmInternal, v128int4)",
259
+ "StackSize": 72,
260
+ "SoftFloat": false
261
+ },
262
+ {
263
+ "FunctionName": "aie::detail::vector_base<bfloat16, 32u>::vector_base(v32bfloat16)",
264
+ "StackSize": 68,
265
+ "SoftFloat": false
266
+ },
267
+ {
268
+ "FunctionName": "bfloat16 AS7* aie::detail::store_vector<32u, (aie_dm_resource)0, bfloat16 AS7, bfloat16>(bfloat16 AS7*, aie::vector<bfloat16, 32u> const&)",
269
+ "StackSize": 32,
270
+ "SoftFloat": false
271
+ },
272
+ {
273
+ "FunctionName": "aie::detail::store_vector_helper<bfloat16 AS7, 32u, (aie_dm_resource)0>::run(bfloat16 AS7*, aie::vector<bfloat16, 32u> const&)",
274
+ "StackSize": 24,
275
+ "SoftFloat": false
276
+ }
277
+ ]
278
+ }
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/ir/i897_wrap_concat_adf_wrapper_dependence_guidance.json ADDED
@@ -0,0 +1,158 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "DependenceAnalysisHints": [
3
+ {
4
+ "FunctionName": "void mllib_graphs::concat_adf_wrapper<bfloat16, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> >, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> >, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> > >(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> > >&, adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> > >&, adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> > >&, unsigned int const (&) [8])",
5
+ "Var1": "layer_params.addr",
6
+ "ArgIndex1": "2",
7
+ "Var2": "arrayidx",
8
+ "ArgIndex2": "NotArgIndex"
9
+ },
10
+ {
11
+ "FunctionName": "void mllib_graphs::concat_adf_wrapper<bfloat16, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> >, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> >, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> > >(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> > >&, adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> > >&, adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> > >&, unsigned int const (&) [8])",
12
+ "Var1": "layer_params.addr",
13
+ "ArgIndex1": "2",
14
+ "Var2": "arrayidx5",
15
+ "ArgIndex2": "NotArgIndex"
16
+ },
17
+ {
18
+ "FunctionName": "void mllib_graphs::concat_adf_wrapper<bfloat16, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> >, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> >, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> > >(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> > >&, adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> > >&, adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> > >&, unsigned int const (&) [8])",
19
+ "Var1": "layer_params.addr",
20
+ "ArgIndex1": "2",
21
+ "Var2": "arrayidx6",
22
+ "ArgIndex2": "NotArgIndex"
23
+ },
24
+ {
25
+ "FunctionName": "void mllib_graphs::concat_adf_wrapper<bfloat16, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> >, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> >, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> > >(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> > >&, adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> > >&, adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> > >&, unsigned int const (&) [8])",
26
+ "Var1": "layer_params.addr",
27
+ "ArgIndex1": "2",
28
+ "Var2": "arrayidx7",
29
+ "ArgIndex2": "NotArgIndex"
30
+ },
31
+ {
32
+ "FunctionName": "void mllib_graphs::concat_adf_wrapper<bfloat16, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> >, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> >, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> > >(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> > >&, adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> > >&, adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> > >&, unsigned int const (&) [8])",
33
+ "Var1": "layer_params.addr",
34
+ "ArgIndex1": "2",
35
+ "Var2": "arrayidx8",
36
+ "ArgIndex2": "NotArgIndex"
37
+ },
38
+ {
39
+ "FunctionName": "void mllib_graphs::concat_adf_wrapper<bfloat16, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> >, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> >, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> > >(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> > >&, adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> > >&, adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> > >&, unsigned int const (&) [8])",
40
+ "Var1": "layer_params.addr",
41
+ "ArgIndex1": "2",
42
+ "Var2": "arrayidx9",
43
+ "ArgIndex2": "NotArgIndex"
44
+ },
45
+ {
46
+ "FunctionName": "void mllib_graphs::concat_adf_wrapper<bfloat16, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> >, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> >, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> > >(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> > >&, adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> > >&, adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> > >&, unsigned int const (&) [8])",
47
+ "Var1": "layer_params.addr",
48
+ "ArgIndex1": "2",
49
+ "Var2": "arrayidx10",
50
+ "ArgIndex2": "NotArgIndex"
51
+ },
52
+ {
53
+ "FunctionName": "void mllib_graphs::concat_adf_wrapper<bfloat16, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> >, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> >, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> > >(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> > >&, adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> > >&, adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> > >&, unsigned int const (&) [8])",
54
+ "Var1": "layer_params.addr",
55
+ "ArgIndex1": "2",
56
+ "Var2": "arrayidx11",
57
+ "ArgIndex2": "NotArgIndex"
58
+ },
59
+ {
60
+ "FunctionName": "void mllib_graphs::concat_adf_wrapper<bfloat16, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> >, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> >, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> > >(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> > >&, adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> > >&, adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> > >&, unsigned int const (&) [8])",
61
+ "Var1": "i31",
62
+ "ArgIndex1": "NotArgIndex",
63
+ "Var2": "arrayidx42",
64
+ "ArgIndex2": "NotArgIndex"
65
+ },
66
+ {
67
+ "FunctionName": "void mllib_graphs::concat_adf_wrapper<bfloat16, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> >, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> >, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> > >(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> > >&, adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> > >&, adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> > >&, unsigned int const (&) [8])",
68
+ "Var1": "in1_dim_3",
69
+ "ArgIndex1": "NotArgIndex",
70
+ "Var2": "arrayidx42",
71
+ "ArgIndex2": "NotArgIndex"
72
+ },
73
+ {
74
+ "FunctionName": "void mllib_graphs::concat_adf_wrapper<bfloat16, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> >, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> >, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> > >(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> > >&, adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> > >&, adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> > >&, unsigned int const (&) [8])",
75
+ "Var1": "j",
76
+ "ArgIndex1": "NotArgIndex",
77
+ "Var2": "arrayidx42",
78
+ "ArgIndex2": "NotArgIndex"
79
+ },
80
+ {
81
+ "FunctionName": "void mllib_graphs::concat_adf_wrapper<bfloat16, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> >, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> >, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> > >(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> > >&, adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> > >&, adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> > >&, unsigned int const (&) [8])",
82
+ "Var1": "arrayidx42",
83
+ "ArgIndex1": "NotArgIndex",
84
+ "Var2": "arrayidx45",
85
+ "ArgIndex2": "NotArgIndex"
86
+ },
87
+ {
88
+ "FunctionName": "void mllib_graphs::concat_adf_wrapper<bfloat16, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> >, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> >, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> > >(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> > >&, adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> > >&, adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> > >&, unsigned int const (&) [8])",
89
+ "Var1": "i31",
90
+ "ArgIndex1": "NotArgIndex",
91
+ "Var2": "arrayidx55",
92
+ "ArgIndex2": "NotArgIndex"
93
+ },
94
+ {
95
+ "FunctionName": "void mllib_graphs::concat_adf_wrapper<bfloat16, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> >, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> >, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> > >(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> > >&, adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> > >&, adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> > >&, unsigned int const (&) [8])",
96
+ "Var1": "in2_dim_3",
97
+ "ArgIndex1": "NotArgIndex",
98
+ "Var2": "arrayidx55",
99
+ "ArgIndex2": "NotArgIndex"
100
+ },
101
+ {
102
+ "FunctionName": "void mllib_graphs::concat_adf_wrapper<bfloat16, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> >, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> >, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> > >(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> > >&, adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> > >&, adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> > >&, unsigned int const (&) [8])",
103
+ "Var1": "n",
104
+ "ArgIndex1": "NotArgIndex",
105
+ "Var2": "arrayidx55",
106
+ "ArgIndex2": "NotArgIndex"
107
+ },
108
+ {
109
+ "FunctionName": "void mllib_graphs::concat_adf_wrapper<bfloat16, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> >, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> >, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> > >(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> > >&, adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> > >&, adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0u> > >&, unsigned int const (&) [8])",
110
+ "Var1": "arrayidx55",
111
+ "ArgIndex1": "NotArgIndex",
112
+ "Var2": "arrayidx59",
113
+ "ArgIndex2": "NotArgIndex"
114
+ },
115
+ {
116
+ "FunctionName": "set_satmode(unsigned int)",
117
+ "Var1": "tmp",
118
+ "ArgIndex1": "NotArgIndex",
119
+ "Var2": "_ZN12me_primitive11control_satE",
120
+ "ArgIndex2": "NotArgIndex"
121
+ },
122
+ {
123
+ "FunctionName": "set_rnd(unsigned int)",
124
+ "Var1": "tmp",
125
+ "ArgIndex1": "NotArgIndex",
126
+ "Var2": "_ZN12me_primitive11control_rndE",
127
+ "ArgIndex2": "NotArgIndex"
128
+ },
129
+ {
130
+ "FunctionName": "v32bfloat16::v32bfloat16(v32int16)",
131
+ "Var1": "tmp",
132
+ "ArgIndex1": "NotArgIndex",
133
+ "Var2": "this1",
134
+ "ArgIndex2": "0"
135
+ },
136
+ {
137
+ "FunctionName": "v32bfloat16::v32bfloat16(chessllvmInternal, v128int4)",
138
+ "Var1": "aw",
139
+ "ArgIndex1": "NotArgIndex",
140
+ "Var2": "mw",
141
+ "ArgIndex2": "NotArgIndex"
142
+ },
143
+ {
144
+ "FunctionName": "aie::detail::vector_base<bfloat16, 32u>::vector_base(v32bfloat16)",
145
+ "Var1": "data",
146
+ "ArgIndex1": "NotArgIndex",
147
+ "Var2": "data2",
148
+ "ArgIndex2": "NotArgIndex"
149
+ },
150
+ {
151
+ "FunctionName": "_ZNK3aie6detail11vector_baseI8bfloat16Lj32EE5storeIL15aie_dm_resource0EU3AS7S2_Qsr3stdE9is_same_vIN22aie_dm_resource_removeITL0_0_E4typeET_EEEvPT0_",
152
+ "Var1": "this.addr",
153
+ "ArgIndex1": "0",
154
+ "Var2": "data",
155
+ "ArgIndex2": "NotArgIndex"
156
+ }
157
+ ]
158
+ }
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/ir/i897_wrap_concat_adf_wrapper_results.json ADDED
@@ -0,0 +1,176 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "ModulePath": "/app/vaiml_1.3_examples/camo/segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/ir/i897_wrap_concat_adf_wrapper.cpp",
3
+ "KernelSourcePath": "/usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/src/ml_adf/concat_adf_wrapper.cpp",
4
+ "UseCases": [
5
+ {
6
+ "Index": 0,
7
+ "KernelFunction": "mllib_graphs::concat_adf_wrapper<bfloat16, adf::io_buffer_config<adf::extents<>>, adf::io_buffer_config<adf::extents<>>, adf::io_buffer_config<adf::extents<>>>",
8
+ "InitializationFunction": "",
9
+ "KernelClassCtor": "",
10
+ "Instances": [
11
+ "i897",
12
+ "i898",
13
+ "i899",
14
+ "i900",
15
+ "i902",
16
+ "i903",
17
+ "i904",
18
+ "i905",
19
+ "i907",
20
+ "i908",
21
+ "i909",
22
+ "i910",
23
+ "i912",
24
+ "i913",
25
+ "i914",
26
+ "i915",
27
+ "i964",
28
+ "i965",
29
+ "i966",
30
+ "i967",
31
+ "i969",
32
+ "i970",
33
+ "i971",
34
+ "i972",
35
+ "i974",
36
+ "i975",
37
+ "i976",
38
+ "i977",
39
+ "i979",
40
+ "i980",
41
+ "i981",
42
+ "i982",
43
+ "i987",
44
+ "i988",
45
+ "i989",
46
+ "i990",
47
+ "i992",
48
+ "i993",
49
+ "i994",
50
+ "i995",
51
+ "i997",
52
+ "i998",
53
+ "i999",
54
+ "i1000",
55
+ "i1002",
56
+ "i1003",
57
+ "i1004",
58
+ "i1005"
59
+ ]
60
+ }
61
+ ],
62
+ "AccessRecords": [],
63
+ "ControlRegsUsage": {
64
+ "RndRecords": {},
65
+ "SatRecords": {},
66
+ "SymSatRecords": {}
67
+ },
68
+ "ParameterLoads": {
69
+ "__regcall3__chessintr___Pvoid_byte_incr___Pvoid___sint": [
70
+ "may",
71
+ "may"
72
+ ],
73
+ "__regcall3__chessintr___sint_read_coreid_": [],
74
+ "__regcall3__chessintr_uint2_t_uint2_t___uint": [
75
+ "may"
76
+ ],
77
+ "__regcall3__chessintr_uint4_t_uint4_t___uint": [
78
+ "may"
79
+ ],
80
+ "__regcall3__chessintr_v32bfloat16_undef_v32bfloat16": [],
81
+ "__regcall3__chessintr_v32int16_broadcast_s16___sint": [
82
+ "may"
83
+ ],
84
+ "concat_adf_init": [],
85
+ "concat_adf_wrapper<bfloat16, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0U> >, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0U> >, adf::io_buffer_config<adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0U> > >": [
86
+ "sometimes",
87
+ "sometimes",
88
+ "sometimes",
89
+ "sometimes"
90
+ ],
91
+ "llvm.chess.copy.p5": [
92
+ "may"
93
+ ],
94
+ "llvm.chess.copy.p6": [
95
+ "may"
96
+ ],
97
+ "llvm.chess.copy.p7": [
98
+ "may"
99
+ ],
100
+ "llvm.chess.init.customint.s_struct.ipd.custom_type.uint2_ts.i32.p1": [
101
+ "may",
102
+ "may",
103
+ "may",
104
+ "may",
105
+ "may",
106
+ "may",
107
+ "may"
108
+ ],
109
+ "llvm.chess.init.customint.s_struct.ipd.custom_type.uint4_ts.i32.p1": [
110
+ "may",
111
+ "may",
112
+ "may",
113
+ "may",
114
+ "may",
115
+ "may",
116
+ "may"
117
+ ],
118
+ "llvm.dbg.declare": [
119
+ "may",
120
+ "may",
121
+ "may"
122
+ ],
123
+ "llvm.dbg.value": [
124
+ "may",
125
+ "may",
126
+ "may"
127
+ ],
128
+ "llvm.lifetime.end.p0": [
129
+ "may",
130
+ "may"
131
+ ],
132
+ "llvm.lifetime.start.p0": [
133
+ "may",
134
+ "may"
135
+ ],
136
+ "llvm.memset.p0.i32": [
137
+ "may",
138
+ "may",
139
+ "may",
140
+ "may"
141
+ ],
142
+ "llvm.noalias.decl.p0.p0.i32": [
143
+ "may",
144
+ "may",
145
+ "may"
146
+ ],
147
+ "llvm.noalias.p0.p0.p0.i32": [
148
+ "may",
149
+ "may",
150
+ "may",
151
+ "may",
152
+ "may"
153
+ ],
154
+ "llvm.noalias.p5.p0.p0.i32": [
155
+ "may",
156
+ "may",
157
+ "may",
158
+ "may",
159
+ "may"
160
+ ],
161
+ "llvm.noalias.p6.p0.p0.i32": [
162
+ "may",
163
+ "may",
164
+ "may",
165
+ "may",
166
+ "may"
167
+ ],
168
+ "llvm.noalias.p7.p0.p0.i32": [
169
+ "may",
170
+ "may",
171
+ "may",
172
+ "may",
173
+ "may"
174
+ ]
175
+ }
176
+ }
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/ir/i897_wrap_concat_adf_wrapper_spec.json ADDED
@@ -0,0 +1,66 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "KernelAnalysisSpec": {
3
+ "ModulePath": "/app/vaiml_1.3_examples/camo/segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/ir/i897_wrap_concat_adf_wrapper.cpp",
4
+ "KernelSourcePath": "/usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/src/ml_adf/concat_adf_wrapper.cpp",
5
+ "SpecFile": "i897_wrap_concat_adf_wrapper_spec.json",
6
+ "ResultFile": "i897_wrap_concat_adf_wrapper_results.json",
7
+ "UseCases": [
8
+ {
9
+ "Index": 0,
10
+ "KernelFunction": "mllib_graphs::concat_adf_wrapper<bfloat16, adf::io_buffer_config<adf::extents<>>, adf::io_buffer_config<adf::extents<>>, adf::io_buffer_config<adf::extents<>>>",
11
+ "InitializationFunction": "",
12
+ "KernelClassCtor": "",
13
+ "Instances": [
14
+ "i897",
15
+ "i898",
16
+ "i899",
17
+ "i900",
18
+ "i902",
19
+ "i903",
20
+ "i904",
21
+ "i905",
22
+ "i907",
23
+ "i908",
24
+ "i909",
25
+ "i910",
26
+ "i912",
27
+ "i913",
28
+ "i914",
29
+ "i915",
30
+ "i964",
31
+ "i965",
32
+ "i966",
33
+ "i967",
34
+ "i969",
35
+ "i970",
36
+ "i971",
37
+ "i972",
38
+ "i974",
39
+ "i975",
40
+ "i976",
41
+ "i977",
42
+ "i979",
43
+ "i980",
44
+ "i981",
45
+ "i982",
46
+ "i987",
47
+ "i988",
48
+ "i989",
49
+ "i990",
50
+ "i992",
51
+ "i993",
52
+ "i994",
53
+ "i995",
54
+ "i997",
55
+ "i998",
56
+ "i999",
57
+ "i1000",
58
+ "i1002",
59
+ "i1003",
60
+ "i1004",
61
+ "i1005"
62
+ ]
63
+ }
64
+ ]
65
+ }
66
+ }
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/ir/pm_reload_analysis0_guidance.json ADDED
@@ -0,0 +1,90 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "Alignment Hints": [
3
+ "Alignment of global array constinit is 4 bytes; automatically aligning it to 64 bytes.",
4
+ "Alignment of global array constinit.1 is 4 bytes; automatically aligning it to 64 bytes.",
5
+ "Alignment of global array constinit.7 is 4 bytes; automatically aligning it to 64 bytes.",
6
+ "Alignment of global array constinit.9 is 4 bytes; automatically aligning it to 64 bytes.",
7
+ "Alignment of global array constinit.10 is 4 bytes; automatically aligning it to 64 bytes.",
8
+ "Alignment of global array constinit.14 is 4 bytes; automatically aligning it to 64 bytes.",
9
+ "Alignment of global array constinit.15 is 4 bytes; automatically aligning it to 64 bytes.",
10
+ "Alignment of global array constinit.16 is 4 bytes; automatically aligning it to 64 bytes.",
11
+ "Alignment of global array constinit.17 is 4 bytes; automatically aligning it to 64 bytes.",
12
+ "Alignment of global array __const._Z23resize_bilinear_scale_2I8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_S0_EEvPS1_PfS2_jjjj.coeffs is 2 bytes; automatically aligning it to 64 bytes.",
13
+ "Alignment of global array __const._Z23resize_bilinear_scale_2I8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_S0_EEvPS1_PfS2_jjjj.coeffs_asymmetric is 2 bytes; automatically aligning it to 64 bytes."
14
+ ],
15
+ "Size Hints": [
16
+ "Global array sigmoid_lut<0u, 256u>::data_ab is 1024 bytes. Consider making it mapper-managed LUT or memory buffer.",
17
+ "Global array sigmoid_lut<0u, 256u>::data_cd is 1024 bytes. Consider making it mapper-managed LUT or memory buffer.",
18
+ "Global array gelu_lut_32<0u, 512u>::data_ab is 2048 bytes. Consider making it mapper-managed LUT or memory buffer.",
19
+ "Global array gelu_lut_32<0u, 512u>::data_cd is 2048 bytes. Consider making it mapper-managed LUT or memory buffer.",
20
+ "Global array tanh_lut<0u, 512u>::data_ab is 2048 bytes. Consider making it mapper-managed LUT or memory buffer.",
21
+ "Global array tanh_lut<0u, 512u>::data_cd is 2048 bytes. Consider making it mapper-managed LUT or memory buffer.",
22
+ "Global array log_f32_lut<256u>::fraction_table_ab_f32 is 1024 bytes. Consider making it mapper-managed LUT or memory buffer.",
23
+ "Global array log_f32_lut<256u>::fraction_table_cd_f32 is 1024 bytes. Consider making it mapper-managed LUT or memory buffer.",
24
+ "Global array exp2_lut<512u>::exp2_table_ab is 1024 bytes. Consider making it mapper-managed LUT or memory buffer.",
25
+ "Global array exp2_lut<512u>::exp2_table_cd is 1024 bytes. Consider making it mapper-managed LUT or memory buffer."
26
+ ],
27
+ "Name Mangling Hints": [],
28
+ "Global Var Read-Before-Write Hints": [],
29
+ "Global Var Conflict Hints": [],
30
+ "Operator Hints": [
31
+ "Operator srem at line -1 in file unknown will degrade performance",
32
+ "Operator srem at line -1 in file unknown will degrade performance",
33
+ "Operator srem at line -1 in file unknown will degrade performance",
34
+ "Operator srem at line -1 in file unknown will degrade performance",
35
+ "Operator srem at line 505 in file backend/superkernels.cpp will degrade performance",
36
+ "Operator srem at line 508 in file backend/superkernels.cpp will degrade performance",
37
+ "Operator srem at line 511 in file backend/superkernels.cpp will degrade performance",
38
+ "Operator srem at line 554 in file backend/superkernels.cpp will degrade performance",
39
+ "Operator srem at line 558 in file backend/superkernels.cpp will degrade performance",
40
+ "Operator srem at line 562 in file backend/superkernels.cpp will degrade performance",
41
+ "Operator srem at line 353 in file /usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/common/reduce_base_c8.h will degrade performance",
42
+ "Operator urem at line 213 in file /usr/local/lib/python3.10/dist-packages/include/aie_api/detail/../detail/aie2/../ld_st.hpp will degrade performance",
43
+ "Operator srem at line -1 in file unknown will degrade performance",
44
+ "Operator srem at line -1 in file unknown will degrade performance",
45
+ "Operator srem at line -1 in file unknown will degrade performance",
46
+ "Operator srem at line -1 in file unknown will degrade performance",
47
+ "Operator srem at line -1 in file unknown will degrade performance",
48
+ "Operator srem at line -1 in file unknown will degrade performance",
49
+ "Operator srem at line -1 in file unknown will degrade performance",
50
+ "Operator urem at line 151 in file /usr/local/lib/python3.10/dist-packages/include/aie_api/detail/aie2/../../detail/aie2p/accum.hpp will degrade performance",
51
+ "Operator srem at line -1 in file unknown will degrade performance",
52
+ "Operator srem at line -1 in file unknown will degrade performance",
53
+ "Operator srem at line -1 in file unknown will degrade performance",
54
+ "Operator srem at line -1 in file unknown will degrade performance",
55
+ "Operator srem at line -1 in file unknown will degrade performance",
56
+ "Operator srem at line -1 in file unknown will degrade performance",
57
+ "Operator srem at line -1 in file unknown will degrade performance",
58
+ "Operator srem at line -1 in file unknown will degrade performance",
59
+ "Operator srem at line -1 in file unknown will degrade performance",
60
+ "Operator srem at line -1 in file unknown will degrade performance",
61
+ "Operator srem at line -1 in file unknown will degrade performance",
62
+ "Operator urem at line 213 in file /usr/local/lib/python3.10/dist-packages/include/aie_api/detail/../detail/aie2/../ld_st.hpp will degrade performance",
63
+ "Operator srem at line 93 in file /usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/src/ml_adf/resize_adf_wrapper.cpp will degrade performance",
64
+ "Operator srem at line 94 in file /usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/src/ml_adf/resize_adf_wrapper.cpp will degrade performance",
65
+ "Operator srem at line 96 in file /usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/src/ml_adf/resize_adf_wrapper.cpp will degrade performance",
66
+ "Operator srem at line 125 in file /usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/src/ml_adf/resize_adf_wrapper.cpp will degrade performance",
67
+ "Operator srem at line 93 in file /usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/src/ml_adf/resize_adf_wrapper.cpp will degrade performance",
68
+ "Operator srem at line 94 in file /usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/src/ml_adf/resize_adf_wrapper.cpp will degrade performance",
69
+ "Operator srem at line 96 in file /usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/src/ml_adf/resize_adf_wrapper.cpp will degrade performance",
70
+ "Operator srem at line 123 in file /usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/src/ml_adf/resize_adf_wrapper.cpp will degrade performance",
71
+ "Operator urem at line 213 in file /usr/local/lib/python3.10/dist-packages/include/aie_api/detail/../detail/aie2/../ld_st.hpp will degrade performance",
72
+ "Operator srem at line -1 in file unknown will degrade performance",
73
+ "Operator srem at line -1 in file unknown will degrade performance",
74
+ "Operator srem at line -1 in file unknown will degrade performance",
75
+ "Operator urem at line 533 in file /usr/local/lib/python3.10/dist-packages/include/aie_api/detail/aie2/../../mask.hpp will degrade performance",
76
+ "Operator srem at line -1 in file unknown will degrade performance",
77
+ "Operator srem at line -1 in file unknown will degrade performance",
78
+ "Operator srem at line -1 in file unknown will degrade performance",
79
+ "Operator urem at line 860 in file /usr/local/lib/python3.10/dist-packages/include/aie_api/detail/../detail/aie2/vector.hpp will degrade performance",
80
+ "Operator urem at line 81 in file /usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/misc/slice_hcwc8_params.h will degrade performance",
81
+ "Operator urem at line 82 in file /usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/misc/slice_hcwc8_params.h will degrade performance",
82
+ "Operator urem at line 97 in file /usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/misc/slice_hcwc8_params.h will degrade performance",
83
+ "Operator urem at line 98 in file /usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/misc/slice_hcwc8_params.h will degrade performance",
84
+ "Operator urem at line 109 in file /usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/misc/slice_hcwc8_params.h will degrade performance",
85
+ "Operator urem at line 110 in file /usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/misc/slice_hcwc8_params.h will degrade performance",
86
+ "Operator srem at line -1 in file unknown will degrade performance"
87
+ ],
88
+ "Bank Conflict Hints": [],
89
+ "RestrictAliasAnalysisHints": []
90
+ }
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/pm_reload_analysis0/Release/pm_reload_analysis0.# ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ da125a439e60b7ff8e916687519e80f6ec21fffa
2
+ 1a735f496f1284ab86135ede88939a8aeeb375a3
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/pm_reload_analysis0/Release/pm_reload_analysis0.## ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ 9b95382854d1fe348e1592cb9aa1e420dfe33947
2
+ 92e103875c6a39bc8cdbe4a21c02c5a94ba3cc96
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/pm_reload_analysis0/Release/pm_reload_analysis0.calltree ADDED
@@ -0,0 +1,186 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+
2
+ // File generated by bridge version V-2024.06#84922c0d9f#241219, Fri Mar 21 03:37:40 2025
3
+ // Copyright 2014-2024 Synopsys, Inc. All rights reserved.
4
+ // bridge -o../Release/pm_reload_analysis0 ../Release/pm_reload_analysis0.o -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/isg -g -I/usr/local/lib/python3.10/dist-packages/include -I/app/vaiml_1.3_examples/camo/./segmentation_1_4_0_fp32_combined/vaiml_par_0/0/backend -I/usr/local/lib/python3.10/site-packages/include/aie_api -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/common -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/include/common -I/usr/local/lib/python3.10/dist-packages/vitis_mllib -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/misc -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/src/ml_adf -I/app/vaiml_1.3_examples/camo/segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/. -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libcxx-lite/include -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libs/libcxx-9.0.0/include-lite -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime/include -D__AIENGINE__ -D__AIE_ARCH__=21 -DDEPLOYMENT_ELF=1 -D__LOCK_FENCE_MODE__=0 -D__IO_BUFFER_FORCE_LIGHT_WEIGHT__ -DAIE_API_EMULATE_BFLOAT16_MMUL_WITH_BFP16=1 -DAIE_OPTION_SCALAR_FLOAT_ON_VECTOR -D__tct_tgt__=241219 -cpm_reload_analysis0.bcf -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/softfloat/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libcxx-lite/lib/Release_LLVM -lme -lc -lm -lc++lite -lsoftfloat -S -export-locals -iconfig extra_memories.bcf -yTM -m -fC -fS -fH +m -T +work ../Release/chesswork495 -pme
5
+
6
+
7
+ // Release: ipp V-2024.06-TGT-241219
8
+
9
+ _Z18pm_reload_analysisv
10
+ _ZN12mllib_graphs18resize_adf_wrapperI8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_Li1ELi0ELi2EEEvRNS2_9io_bufferIT_NS2_9direction2inET0_EERNSD_ISE_NSF_3outET1_EERA16_Kj
11
+ _Z23resize_bilinear_scale_2I8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_S0_EEvPS1_PfS2_jjjj
12
+ _ZN12mllib_graphs17slice_adf_wrapperILi1E8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_EEvRNS2_9io_bufferIT0_NS2_9direction2inET1_EERNSD_ISE_NSF_3outET2_EERA7_Kj
13
+ _Z11slice_hcwc8I8bfloat16EvPT_S2_R18slice_hcwc8_params
14
+ _Z40superkernel_mul1d_attribute_broadcastingRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE
15
+ _ZN25elementwise_binary_sharedI8bfloat1626mul_impl_broadcasting_attrIS0_E15shared_params_tIS0_EL5act_t0EE5setupER27elementwise_binary_params_tIS4_EPKv
16
+ _ZN25elementwise_binary_sharedI8bfloat1626mul_impl_broadcasting_attrIS0_E15shared_params_tIS0_EL5act_t0EE21shared_setup_backboneER27elementwise_binary_params_tIS4_EPKv
17
+ _ZN25elementwise_binary_sharedI8bfloat1626mul_impl_broadcasting_attrIS0_E15shared_params_tIS0_EL5act_t0EE3runEPS0_S7_R27elementwise_binary_params_tIS4_E
18
+ _ZL19shared_run_backboneI8bfloat16L5act_t0EEKvPT_S4_S4_R27elementwise_binary_params_tI15shared_params_tIS3_EE
19
+ _Z17superkernel_add1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERNS0_IS1_NS2_3outESK_EE
20
+ _ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE5setupER27elementwise_binary_params_tIS5_EPKv
21
+ _ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE21shared_setup_backboneER27elementwise_binary_params_tIS5_EPKv
22
+ _ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE3runEPS0_S7_S7_R27elementwise_binary_params_tIS5_E
23
+ _ZL19shared_run_backboneI8bfloat16L5act_t0EEKvPT_S4_S4_R27elementwise_binary_params_tI15shared_params_tIS3_EE (*)
24
+ _Z17superkernel_mul1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERNS0_IS1_NS2_3outESK_EE
25
+ _ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS4_EPKv
26
+ _ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS4_E
27
+ _ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE3runEPS0_S6_S6_R27elementwise_binary_params_tIS4_E
28
+ _Z14conv2d_maxpoolRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEESF_RA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE
29
+ _Z24setup_conv2d_bf16_paramsILb1ELb0EEvPKjR18conv2d_bf16_paramshh
30
+ _Z11conv2d_bf16ILh1EL5act_t0E8bfloat16S1_S1_N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_NS3_IS5_NS6_5asyncES9_SB_EELb0ELb0ELb1ELb0EEvRNS2_9io_bufferIT1_NS2_9direction2inET4_EERNSF_IT2_SI_T5_EERNSF_IT3_NSH_3outET6_EER18conv2d_bf16_params
31
+ _Z21convert_bf16_to_bfp16I8bfloat16Lb0EEvPT_PS0_RK13BfToBfpParams
32
+ _Z40superkernel_add1d_attribute_broadcastingRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE
33
+ _ZN31elementwise_binary_broadcastingI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_EE5setupER27elementwise_binary_params_tIS5_EPKv
34
+ _ZN18elementwise_binaryIJ8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS5_EPKv
35
+ _ZN18elementwise_binaryIJ8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS5_E
36
+ _ZN31elementwise_binary_broadcastingI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_EE5setupER27elementwise_binary_params_tIS5_E
37
+ _ZN41elementwise_binary_attribute_broadcastingI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_EE3runEPS0_S7_R27elementwise_binary_params_tIS5_E
38
+ _ZN31elementwise_binary_broadcastingI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_EE3runEPS0_S7_S7_R27elementwise_binary_params_tIS5_E
39
+ _Z18superkernel_clip1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE
40
+ _ZN17elementwise_unaryI8bfloat1616elementwise_clipIS0_E20clip_internal_paramsIS0_EE5setupER26elementwise_unary_params_tIS4_EPKv
41
+ _ZN17elementwise_unaryI8bfloat1616elementwise_clipIS0_E20clip_internal_paramsIS0_EE3runEPS0_S6_R26elementwise_unary_params_tIS4_E
42
+ _Z22superkernel_conv2d_dwcRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEESF_RA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE
43
+ _ZL27setup_conv2d_dw_params_bf16PKjR21conv2d_dw_bf16_paramsh
44
+ _ZN12me_primitive10udiv_dstepEjjRjS0_
45
+ _Z9conv2d_dwILh1E8bfloat16S0_S0_N3adf16io_buffer_configINS1_7extentsIJEEENS1_7locking4syncENS1_10addressing6linearENS1_6marginILj0EEEEESB_NS2_IS4_NS5_5asyncES8_SA_EEQsr3stdE9is_same_vIT0_S0_EEvRNS1_9io_bufferISE_NS1_9direction2inET3_EERNSF_IT1_SH_T4_EERNSF_IT2_NSG_3outET5_EER21conv2d_dw_bf16_params
46
+ _Z26superkernel_conv_eltbinaryRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEESF_RNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERA17_KjRNS0_IS1_NS2_3outESH_EE
47
+ _Z24setup_conv2d_bf16_paramsILb1ELb0EEvPKjR18conv2d_bf16_paramshh (*)
48
+ _ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS4_EPKv (*)
49
+ _ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE5setupER27elementwise_binary_params_tIS5_EPKv (*)
50
+ _Z11conv2d_bf16ILh1EL5act_t0E8bfloat16S1_S1_N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_NS3_IS5_NS6_5asyncES9_SB_EELb0ELb0ELb1ELb0EEvRNS2_9io_bufferIT1_NS2_9direction2inET4_EERNSF_IT2_SI_T5_EERNSF_IT3_NSH_3outET6_EER18conv2d_bf16_params (*)
51
+ _ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE3runEPS0_S6_S6_R27elementwise_binary_params_tIS4_E (*)
52
+ _ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE3runEPS0_S7_S7_R27elementwise_binary_params_tIS5_E (*)
53
+ _Z26superkernel_reduce_mean_c8RN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE
54
+ _ZN18reduce_skeleton_c8I8bfloat1619reduce_mean_c8_implIS0_E23reduce_mean_c8_params_tIS0_EE5setupER18reduce_c8_params_tIS4_EPKv
55
+ _Z6pad_3dIL11pad_3d_mode0E8bfloat16Li1EEvPT0_S3_R15pad_3d_params_t
56
+ _ZN18reduce_skeleton_c8I8bfloat1619reduce_mean_c8_implIS0_E23reduce_mean_c8_params_tIS0_EE3runEPS0_S6_R18reduce_c8_params_tIS4_E
57
+ _ZN12me_primitive10udiv_dstepEjjRjS0_ (*)
58
+ _ZN12me_primitive10udiv_dstepEjjRjS0_ (*)
59
+ int32_to_float32
60
+ _ZL28normalizeRoundAndPackFloat32iij
61
+ _ZL19roundAndPackFloat32iij
62
+ float32_add
63
+ _ZL14addFloat32Sigsjji
64
+ _ZL19propagateFloat32NaNjj
65
+ _ZL19roundAndPackFloat32iij (*)
66
+ _ZL14subFloat32Sigsjji
67
+ _ZL19propagateFloat32NaNjj (*)
68
+ _ZL28normalizeRoundAndPackFloat32iij (*)
69
+ _Z21superkernel_sigmoid1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE
70
+ _ZN17elementwise_unaryI8bfloat1619elementwise_sigmoidIS0_E26sigmoid_templated_params_tIS0_EE5setupER26elementwise_unary_params_tIS4_EPKv
71
+ _ZN17elementwise_unaryI8bfloat1619elementwise_sigmoidIS0_E26sigmoid_templated_params_tIS0_EE3runEPS0_S6_R26elementwise_unary_params_tIS4_E
72
+ _Z17superkernel_sub1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERNS0_IS1_NS2_3outESK_EE
73
+ _ZN25elementwise_binary_sharedI8bfloat168sub_implIS0_E15shared_params_tIS0_EL5act_t0EE5setupER27elementwise_binary_params_tIS4_EPKv
74
+ _ZN25elementwise_binary_sharedI8bfloat168sub_implIS0_E15shared_params_tIS0_EL5act_t0EE21shared_setup_backboneER27elementwise_binary_params_tIS4_EPKv
75
+ _ZN25elementwise_binary_sharedI8bfloat168sub_implIS0_E15shared_params_tIS0_EL5act_t0EE3runEPS0_S7_S7_R27elementwise_binary_params_tIS4_E
76
+ _ZL19shared_run_backboneI8bfloat16L5act_t0EEKvPT_S4_S4_R27elementwise_binary_params_tI15shared_params_tIS3_EE (*)
77
+ _Z18superkernel_tanh1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE
78
+ _ZN17elementwise_unaryI8bfloat1616elementwise_tanhIS0_E23tanh_templated_params_tIS0_EE5setupER26elementwise_unary_params_tIS4_EPKv
79
+ _ZN17elementwise_unaryI8bfloat1616elementwise_tanhIS0_E23tanh_templated_params_tIS0_EE3runEPS0_S6_R26elementwise_unary_params_tIS4_E
80
+ _Z19superkernel_avgpoolRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE
81
+ _Z22setup_avgpool2d_paramsI8bfloat16EvPT_R25avgpool2d_internal_paramsIS1_Eh
82
+ _Z9avgpool2dILh1E8bfloat16Qsr5mllib5utilsE11is_one_of_vIT0_ahS0_EEvPS1_S2_R25avgpool2d_internal_paramsIS1_E
83
+ int32_to_float32 (*)
84
+ _ZN12mllib_graphs23transpose4d_adf_wrapperI8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_EEvRNS2_9io_bufferIT_NS2_9direction2inET0_EERNSD_ISE_NSF_3outET1_EERA5_Kj
85
+ _Z29setup_transposeshuffle_paramsI8bfloat16EvR23transposeshuffle_paramsRA5_Kj
86
+ _Z16transposeshuffleI8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_aS0_EEvPS1_S2_R23transposeshuffle_params
87
+ _ZN12mllib_graphs18resize_adf_wrapperI8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_Li1ELi0ELi0EEEvRNS2_9io_bufferIT_NS2_9direction2inET0_EERNSD_ISE_NSF_3outET1_EERA16_Kj
88
+ _Z15resize_bilinearI8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_aS0_EEvPS1_S2_R29resize_common_internal_params
89
+ int32_to_float32 (*)
90
+ _ZN12me_primitive10udiv_dstepEjjRjS0_ (*)
91
+ _ZN12mllib_graphs18concat_adf_wrapperI8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_SC_EEvRNS2_9io_bufferIT_NS2_9direction2inET0_EERNSD_ISE_SG_T1_EERNSD_ISE_NSF_3outET2_EERA8_Kj
92
+
93
+
94
+ Call tree stack and functions sizes:
95
+
96
+ stack stack stack call func func function name
97
+ desc level level desc
98
+ ----- ----- ----- ----- ----- ----- --------------------------------------------------------------
99
+ 768 2624 0 0 3030 41432 _Z18pm_reload_analysisv
100
+ 0 0 1 1 470 2054 _ZN12mllib_graphs18resize_adf_wrapperI8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_Li1ELi0ELi2EEEvRNS2_9io_bufferIT_NS2_9direction2inET0_EERNSD_ISE_NSF_3outET1_EERA16_Kj
101
+ 0 0 1 2 1584 1584 _Z23resize_bilinear_scale_2I8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_S0_EEvPS1_PfS2_jjjj <tail call>
102
+ 192 192 1 1 674 1456 _ZN12mllib_graphs17slice_adf_wrapperILi1E8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_EEvRNS2_9io_bufferIT0_NS2_9direction2inET1_EERNSD_ISE_NSF_3outET2_EERA7_Kj
103
+ 0 0 2 2 782 782 _Z11slice_hcwc8I8bfloat16EvPT_S2_R18slice_hcwc8_params
104
+ 64 256 1 1 488 1362 _Z40superkernel_mul1d_attribute_broadcastingRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE
105
+ 64 64 2 2 74 190 _ZN25elementwise_binary_sharedI8bfloat1626mul_impl_broadcasting_attrIS0_E15shared_params_tIS0_EL5act_t0EE5setupER27elementwise_binary_params_tIS4_EPKv
106
+ 0 0 3 3 116 116 _ZN25elementwise_binary_sharedI8bfloat1626mul_impl_broadcasting_attrIS0_E15shared_params_tIS0_EL5act_t0EE21shared_setup_backboneER27elementwise_binary_params_tIS4_EPKv
107
+ 64 192 2 2 150 684 _ZN25elementwise_binary_sharedI8bfloat1626mul_impl_broadcasting_attrIS0_E15shared_params_tIS0_EL5act_t0EE3runEPS0_S7_R27elementwise_binary_params_tIS4_E
108
+ 128 128 3 3 534 534 _ZL19shared_run_backboneI8bfloat16L5act_t0EEKvPT_S4_S4_R27elementwise_binary_params_tI15shared_params_tIS3_EE
109
+ 64 192 1 1 602 1366 _Z17superkernel_add1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERNS0_IS1_NS2_3outESK_EE
110
+ 64 64 2 2 98 214 _ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE5setupER27elementwise_binary_params_tIS5_EPKv
111
+ 0 0 3 3 116 116 _ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE21shared_setup_backboneER27elementwise_binary_params_tIS5_EPKv
112
+ 0 128 2 2 16 550 _ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE3runEPS0_S7_S7_R27elementwise_binary_params_tIS5_E
113
+ 128 128 2 3 534 534 _ZL19shared_run_backboneI8bfloat16L5act_t0EEKvPT_S4_S4_R27elementwise_binary_params_tI15shared_params_tIS3_EE <tail call>
114
+ 64 128 1 1 602 1056 _Z17superkernel_mul1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERNS0_IS1_NS2_3outESK_EE
115
+ 64 64 2 2 138 162 _ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS4_EPKv
116
+ 0 0 3 3 24 24 _ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS4_E
117
+ 0 0 2 2 292 292 _ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE3runEPS0_S6_S6_R27elementwise_binary_params_tIS4_E
118
+ 64 192 1 1 568 4678 _Z14conv2d_maxpoolRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEESF_RA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE
119
+ 64 64 2 2 1430 1430 _Z24setup_conv2d_bf16_paramsILb1ELb0EEvPKjR18conv2d_bf16_paramshh
120
+ 128 128 2 2 2410 2680 _Z11conv2d_bf16ILh1EL5act_t0E8bfloat16S1_S1_N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_NS3_IS5_NS6_5asyncES9_SB_EELb0ELb0ELb1ELb0EEvRNS2_9io_bufferIT1_NS2_9direction2inET4_EERNSF_IT2_SI_T5_EERNSF_IT3_NSH_3outET6_EER18conv2d_bf16_params
121
+ 0 0 3 3 270 270 _Z21convert_bf16_to_bfp16I8bfloat16Lb0EEvPT_PS0_RK13BfToBfpParams
122
+ 64 192 1 1 488 1220 _Z40superkernel_add1d_attribute_broadcastingRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE
123
+ 64 128 2 2 62 304 _ZN31elementwise_binary_broadcastingI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_EE5setupER27elementwise_binary_params_tIS5_EPKv
124
+ 64 64 3 3 162 186 _ZN18elementwise_binaryIJ8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS5_EPKv
125
+ 0 0 4 4 24 24 _ZN18elementwise_binaryIJ8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS5_E
126
+ 0 0 2 3 56 56 _ZN31elementwise_binary_broadcastingI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_EE5setupER27elementwise_binary_params_tIS5_E <tail call>
127
+ 128 128 2 2 114 428 _ZN41elementwise_binary_attribute_broadcastingI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_EE3runEPS0_S7_R27elementwise_binary_params_tIS5_E
128
+ 0 0 3 3 314 314 _ZN31elementwise_binary_broadcastingI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_EE3runEPS0_S7_S7_R27elementwise_binary_params_tIS5_E
129
+ 64 64 1 1 488 830 _Z18superkernel_clip1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE
130
+ 0 0 2 2 100 100 _ZN17elementwise_unaryI8bfloat1616elementwise_clipIS0_E20clip_internal_paramsIS0_EE5setupER26elementwise_unary_params_tIS4_EPKv
131
+ 0 0 2 2 242 242 _ZN17elementwise_unaryI8bfloat1616elementwise_clipIS0_E20clip_internal_paramsIS0_EE3runEPS0_S6_R26elementwise_unary_params_tIS4_E
132
+ 128 192 1 1 478 2014 _Z22superkernel_conv2d_dwcRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEESF_RA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE
133
+ 64 64 2 2 672 814 _ZL27setup_conv2d_dw_params_bf16PKjR21conv2d_dw_bf16_paramsh
134
+ 0 0 3 3 142 142 _ZN12me_primitive10udiv_dstepEjjRjS0_
135
+ 0 0 2 2 722 722 _Z9conv2d_dwILh1E8bfloat16S0_S0_N3adf16io_buffer_configINS1_7extentsIJEEENS1_7locking4syncENS1_10addressing6linearENS1_6marginILj0EEEEESB_NS2_IS4_NS5_5asyncES8_SA_EEQsr3stdE9is_same_vIT0_S0_EEvRNS1_9io_bufferISE_NS1_9direction2inET3_EERNSF_IT1_SH_T4_EERNSF_IT2_NSG_3outET5_EER21conv2d_dw_bf16_params
136
+ 64 192 1 1 1126 6454 _Z26superkernel_conv_eltbinaryRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEESF_RNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERA17_KjRNS0_IS1_NS2_3outESH_EE
137
+ 64 64 2 2 1430 1430 _Z24setup_conv2d_bf16_paramsILb1ELb0EEvPKjR18conv2d_bf16_paramshh
138
+ 64 64 2 2 138 162 _ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS4_EPKv (*)
139
+ 64 64 2 2 98 214 _ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE5setupER27elementwise_binary_params_tIS5_EPKv (*)
140
+ 128 128 2 2 2410 2680 _Z11conv2d_bf16ILh1EL5act_t0E8bfloat16S1_S1_N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_NS3_IS5_NS6_5asyncES9_SB_EELb0ELb0ELb1ELb0EEvRNS2_9io_bufferIT1_NS2_9direction2inET4_EERNSF_IT2_SI_T5_EERNSF_IT3_NSH_3outET6_EER18conv2d_bf16_params (*)
141
+ 0 0 2 2 292 292 _ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE3runEPS0_S6_S6_R27elementwise_binary_params_tIS4_E
142
+ 0 128 2 2 16 550 _ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE3runEPS0_S7_S7_R27elementwise_binary_params_tIS5_E (*)
143
+ 128 384 1 1 2676 9838 _Z26superkernel_reduce_mean_c8RN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE
144
+ 64 64 2 2 1588 1588 _ZN18reduce_skeleton_c8I8bfloat1619reduce_mean_c8_implIS0_E23reduce_mean_c8_params_tIS0_EE5setupER18reduce_c8_params_tIS4_EPKv
145
+ 0 0 2 2 670 670 _Z6pad_3dIL11pad_3d_mode0E8bfloat16Li1EEvPT0_S3_R15pad_3d_params_t
146
+ 256 256 2 2 2680 2822 _ZN18reduce_skeleton_c8I8bfloat1619reduce_mean_c8_implIS0_E23reduce_mean_c8_params_tIS0_EE3runEPS0_S6_R18reduce_c8_params_tIS4_E
147
+ 0 0 3 3 142 142 _ZN12me_primitive10udiv_dstepEjjRjS0_
148
+ 0 0 2 2 142 142 _ZN12me_primitive10udiv_dstepEjjRjS0_
149
+ 0 0 2 2 114 530 int32_to_float32
150
+ 0 0 2 3 24 416 _ZL28normalizeRoundAndPackFloat32iij <tail call>
151
+ 0 0 2 4 392 392 _ZL19roundAndPackFloat32iij <tail call>
152
+ 0 0 2 2 64 1968 float32_add
153
+ 0 0 3 3 624 1128 _ZL14addFloat32Sigsjji
154
+ 0 0 4 4 112 112 _ZL19propagateFloat32NaNjj
155
+ 0 0 3 4 392 392 _ZL19roundAndPackFloat32iij <tail call>
156
+ 0 0 2 3 752 1280 _ZL14subFloat32Sigsjji <tail call>
157
+ 0 0 3 4 112 112 _ZL19propagateFloat32NaNjj
158
+ 0 0 2 4 24 416 _ZL28normalizeRoundAndPackFloat32iij <tail call> (*)
159
+ 64 64 1 1 488 928 _Z21superkernel_sigmoid1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE
160
+ 0 0 2 2 62 62 _ZN17elementwise_unaryI8bfloat1619elementwise_sigmoidIS0_E26sigmoid_templated_params_tIS0_EE5setupER26elementwise_unary_params_tIS4_EPKv
161
+ 0 0 2 2 378 378 _ZN17elementwise_unaryI8bfloat1619elementwise_sigmoidIS0_E26sigmoid_templated_params_tIS0_EE3runEPS0_S6_R26elementwise_unary_params_tIS4_E
162
+ 64 192 1 1 602 1342 _Z17superkernel_sub1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERNS0_IS1_NS2_3outESK_EE
163
+ 64 64 2 2 74 190 _ZN25elementwise_binary_sharedI8bfloat168sub_implIS0_E15shared_params_tIS0_EL5act_t0EE5setupER27elementwise_binary_params_tIS4_EPKv
164
+ 0 0 3 3 116 116 _ZN25elementwise_binary_sharedI8bfloat168sub_implIS0_E15shared_params_tIS0_EL5act_t0EE21shared_setup_backboneER27elementwise_binary_params_tIS4_EPKv
165
+ 0 128 2 2 16 550 _ZN25elementwise_binary_sharedI8bfloat168sub_implIS0_E15shared_params_tIS0_EL5act_t0EE3runEPS0_S7_S7_R27elementwise_binary_params_tIS4_E
166
+ 128 128 2 3 534 534 _ZL19shared_run_backboneI8bfloat16L5act_t0EEKvPT_S4_S4_R27elementwise_binary_params_tI15shared_params_tIS3_EE <tail call>
167
+ 64 448 1 1 488 1512 _Z18superkernel_tanh1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE
168
+ 0 0 2 2 62 62 _ZN17elementwise_unaryI8bfloat1616elementwise_tanhIS0_E23tanh_templated_params_tIS0_EE5setupER26elementwise_unary_params_tIS4_EPKv
169
+ 384 384 2 2 962 962 _ZN17elementwise_unaryI8bfloat1616elementwise_tanhIS0_E23tanh_templated_params_tIS0_EE3runEPS0_S6_R26elementwise_unary_params_tIS4_E
170
+ 128 320 1 1 506 2736 _Z19superkernel_avgpoolRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE
171
+ 64 64 2 2 780 780 _Z22setup_avgpool2d_paramsI8bfloat16EvPT_R25avgpool2d_internal_paramsIS1_Eh
172
+ 192 192 2 2 920 1450 _Z9avgpool2dILh1E8bfloat16Qsr5mllib5utilsE11is_one_of_vIT0_ahS0_EEvPS1_S2_R25avgpool2d_internal_paramsIS1_E
173
+ 0 0 3 3 114 530 int32_to_float32 (*)
174
+ 64 64 1 1 114 650 _ZN12mllib_graphs23transpose4d_adf_wrapperI8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_EEvRNS2_9io_bufferIT_NS2_9direction2inET0_EERNSD_ISE_NSF_3outET1_EERA5_Kj
175
+ 0 0 2 2 74 74 _Z29setup_transposeshuffle_paramsI8bfloat16EvR23transposeshuffle_paramsRA5_Kj
176
+ 0 0 1 2 462 462 _Z16transposeshuffleI8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_aS0_EEvPS1_S2_R23transposeshuffle_params <tail call>
177
+ 64 1856 1 1 1374 5828 _ZN12mllib_graphs18resize_adf_wrapperI8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_Li1ELi0ELi0EEEvRNS2_9io_bufferIT_NS2_9direction2inET0_EERNSD_ISE_NSF_3outET1_EERA16_Kj
178
+ 1792 1792 2 2 3782 4312 _Z15resize_bilinearI8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_aS0_EEvPS1_S2_R29resize_common_internal_params
179
+ 0 0 3 3 114 530 int32_to_float32 (*)
180
+ 0 0 2 2 142 142 _ZN12me_primitive10udiv_dstepEjjRjS0_
181
+ 0 0 1 1 818 818 _ZN12mllib_graphs18concat_adf_wrapperI8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_SC_EEvRNS2_9io_bufferIT_NS2_9direction2inET0_EERNSD_ISE_SG_T1_EERNSD_ISE_NSF_3outET2_EERA8_Kj
182
+
183
+
184
+ Maximum call level : 4
185
+ Maximum stack level: 4
186
+ Maximum stack size : 2624
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/pm_reload_analysis0/Release/pm_reload_analysis0.cmic2 ADDED
The diff for this file is too large to render. See raw diff
 
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/pm_reload_analysis0/Release/pm_reload_analysis0.cmico ADDED
@@ -0,0 +1 @@
 
 
1
+ +Mdec
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/pm_reload_analysis0/Release/pm_reload_analysis0.lst ADDED
The diff for this file is too large to render. See raw diff
 
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/pm_reload_analysis0/Release/pm_reload_analysis0.map ADDED
@@ -0,0 +1,568 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+
2
+ // File generated by bridge version V-2024.06#84922c0d9f#241219, Fri Mar 21 03:37:44 2025
3
+ // Copyright 2014-2024 Synopsys, Inc. All rights reserved.
4
+ // bridge -o../Release/pm_reload_analysis0 ../Release/pm_reload_analysis0.o -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/isg -g -I/usr/local/lib/python3.10/dist-packages/include -I/app/vaiml_1.3_examples/camo/./segmentation_1_4_0_fp32_combined/vaiml_par_0/0/backend -I/usr/local/lib/python3.10/site-packages/include/aie_api -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/common -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/include/common -I/usr/local/lib/python3.10/dist-packages/vitis_mllib -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/misc -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/src/ml_adf -I/app/vaiml_1.3_examples/camo/segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/. -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libcxx-lite/include -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libs/libcxx-9.0.0/include-lite -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime/include -D__AIENGINE__ -D__AIE_ARCH__=21 -DDEPLOYMENT_ELF=1 -D__LOCK_FENCE_MODE__=0 -D__IO_BUFFER_FORCE_LIGHT_WEIGHT__ -DAIE_API_EMULATE_BFLOAT16_MMUL_WITH_BFP16=1 -DAIE_OPTION_SCALAR_FLOAT_ON_VECTOR -D__tct_tgt__=241219 -cpm_reload_analysis0.bcf -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/softfloat/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libcxx-lite/lib/Release_LLVM -lme -lc -lm -lc++lite -lsoftfloat -S -export-locals -iconfig extra_memories.bcf -yTM -m -fC -fS -fH +m -T +work ../Release/chesswork495 -pme
5
+
6
+ // Release: ipp V-2024.06-TGT-241219
7
+
8
+ Memory map for memory 'DM_stack':
9
+
10
+ Size = 1048576
11
+ Width = 8 bits
12
+ Offset = 0
13
+ Used = 32768
14
+
15
+ 0x00070000..0x00077fff ( 32768 items) : Stack
16
+
17
+ Memory map for memory 'DMb':
18
+
19
+ Size = 1048576
20
+ Width = 8 bits
21
+ Offset = 0
22
+ Used = 35613
23
+
24
+ 0x00000000..0x0006ffff ( 458752 items) : Reserved
25
+ 0x00070000..0x00077fff ( 32768 items) : Stack
26
+ 0x00078000..0x00078003 ( 4 items) : ../Release/pm_reload_analysis0.o::_ZL9curr_iter (Data, Local, .bss.DMb.4)
27
+ 0x00078004..0x00078007 ( 4 items) : ../Release/pm_reload_analysis0.o::_ZL14num_depth_iter (Data, Local, .bss.DMb.4)
28
+ 0x00078008..0x0007800b ( 4 items) : ../Release/pm_reload_analysis0.o::_ZL10depth_iter (Data, Local, .bss.DMb.4)
29
+ 0x0007800c..0x0007800f ( 4 items) : ../Release/pm_reload_analysis0.o::_ZL11total_iters (Data, Local, .bss.DMb.4)
30
+ 0x00078010..0x00078013 ( 4 items) : ../Release/pm_reload_analysis0.o::_ZL8core_row (Data, Local, .bss.DMb.4)
31
+ 0x00078014..0x00078017 ( 4 items) : ../Release/pm_reload_analysis0.o::_ZL11ifm1_offset (Data, Local, .bss.DMb.4)
32
+ 0x00078018..0x0007801b ( 4 items) : ../Release/pm_reload_analysis0.o::_ZL10ifmsv_size (Data, Local, .bss.DMb.4)
33
+ 0x0007801c..0x0007801f ( 4 items) : ../Release/pm_reload_analysis0.o::_ZL11ifm2_offset (Data, Local, .bss.DMb.4)
34
+ 0x00078020..0x00078023 ( 4 items) : ../Release/pm_reload_analysis0.o::_ZL11reduce_axis (Data, Local, .bss.DMb.4)
35
+ 0x00078024..0x00078027 ( 4 items) : ../Release/pm_reload_analysis0.o::_ZL8l3_width (Data, Local, .bss.DMb.4)
36
+ 0x00078028..0x0007802b ( 4 items) : ../Release/pm_reload_analysis0.o::_ZL9l3_height (Data, Local, .bss.DMb.4)
37
+ 0x0007802c..0x0007802f ( 4 items) : ../Release/pm_reload_analysis0.o::_ZL8l3_depth (Data, Local, .bss.DMb.4)
38
+ 0x00078030..0x00078033 ( 4 items) : ../Release/pm_reload_analysis0.o::_ZL10width_iter (Data, Local, .bss.DMb.4)
39
+ 0x00078034..0x00078037 ( 4 items) : ../Release/pm_reload_analysis0.o::_ZL11height_iter (Data, Local, .bss.DMb.4)
40
+ 0x00078038..0x0007803b ( 4 items) : ../Release/pm_reload_analysis0.o::_ZN9ns_concatL11kernel_iterE (Data, Local, .bss.DMb.4)
41
+ 0x0007803c..0x0007803f ( 4 items) : ../Release/pm_reload_analysis0.o::_ZN9ns_concatL8core_colE (Data, Local, .bss.DMb.4)
42
+ 0x00078040..0x00078043 ( 4 items) : ../Release/pm_reload_analysis0.o::_ZN9ns_concatL8core_rowE (Data, Local, .bss.DMb.4)
43
+ 0x00078044..0x00078047 ( 4 items) : ../Release/pm_reload_analysis0.o::_ZZN12mllib_graphs18resize_adf_wrapperI8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_Li1ELi0ELi2EEEvRNS2_9io_bufferIT_NS2_9direction2inET0_EERNSD_ISE_NSF_3outET1_EERA16_KjE8cur_iter (Data, Weak, .bss.DMb.4)
44
+ 0x00078048..0x0007804b ( 4 items) : ../Release/pm_reload_analysis0.o::_ZZN12mllib_graphs18resize_adf_wrapperI8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_Li1ELi0ELi0EEEvRNS2_9io_bufferIT_NS2_9direction2inET0_EERNSD_ISE_NSF_3outET1_EERA16_KjE8cur_iter (Data, Weak, .bss.DMb.4)
45
+ 0x0007804c..0x0007804f ( 4 items) : ../Release/pm_reload_analysis0.o::_ZL8num_iter (Data, Local, .data.DMb.4)
46
+ 0x00078050..0x00078053 ( 4 items) : me_defs.o(/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/Release/libme.a)::_ZN12me_primitive11control_satE (Data, Global, .bss.DMb.4)
47
+ 0x00078054..0x00078054 ( 1 items) : me_defs.o(/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/Release/libme.a)::_ZN12me_primitive11control_rndE (Data, Global, .bss.DMb.1)
48
+ 0x00078058..0x0007805b ( 4 items) : softfloat.o(/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/softfloat/lib/Release/libsoftfloat.a)::float_rounding_mode (Data, Global, .bss.DMb.4)
49
+ 0x00078080..0x000780ff ( 128 items) : ../Release/pm_reload_analysis0.o::reduce_mean_c8_params (Data, Global, .data.DMb.64)
50
+ 0x00078100..0x0007813f ( 64 items) : ../Release/pm_reload_analysis0.o::constinit (Data, Local, .rodata.DMb.64)
51
+ 0x00078140..0x0007817f ( 64 items) : ../Release/pm_reload_analysis0.o::constinit___7 (Data, Local, .rodata.DMb.64)
52
+ 0x00078180..0x000781c3 ( 68 items) : ../Release/pm_reload_analysis0.o::constinit___9 (Data, Local, .rodata.DMb.64)
53
+ 0x00078200..0x0007823f ( 64 items) : ../Release/pm_reload_analysis0.o::constinit___10 (Data, Local, .rodata.DMb.64)
54
+ 0x00078240..0x0007827f ( 64 items) : ../Release/pm_reload_analysis0.o::constinit___14 (Data, Local, .rodata.DMb.64)
55
+ 0x00078280..0x000782bf ( 64 items) : ../Release/pm_reload_analysis0.o::constinit___16 (Data, Local, .rodata.DMb.64)
56
+ 0x000782c0..0x000782df ( 32 items) : ../Release/pm_reload_analysis0.o::__const____Z23resize_bilinear_scale_2I8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_S0_EEvPS1_PfS2_jjjj___coeffs (Data, Local, .rodata.DMb.64)
57
+ 0x00078300..0x0007831f ( 32 items) : ../Release/pm_reload_analysis0.o::__const____Z23resize_bilinear_scale_2I8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_S0_EEvPS1_PfS2_jjjj___coeffs_asymmetric (Data, Local, .rodata.DMb.64)
58
+ 0x00078320..0x0007835f ( 64 items) : ../Release/pm_reload_analysis0.o::constinit___2 (Data, Local, .rodata.DMb.4)
59
+ 0x00078360..0x0007839f ( 64 items) : ../Release/pm_reload_analysis0.o::constinit___4 (Data, Local, .rodata.DMb.4)
60
+ 0x000783a0..0x000783df ( 64 items) : ../Release/pm_reload_analysis0.o::constinit___5 (Data, Local, .rodata.DMb.4)
61
+ 0x000783e0..0x0007841f ( 64 items) : ../Release/pm_reload_analysis0.o::constinit___6 (Data, Local, .rodata.DMb.4)
62
+ 0x00078420..0x0007845f ( 64 items) : ../Release/pm_reload_analysis0.o::constinit___8 (Data, Local, .rodata.DMb.4)
63
+ 0x00078460..0x0007849f ( 64 items) : ../Release/pm_reload_analysis0.o::constinit___11 (Data, Local, .rodata.DMb.4)
64
+ 0x000784a0..0x000784df ( 64 items) : ../Release/pm_reload_analysis0.o::constinit___12 (Data, Local, .rodata.DMb.4)
65
+ 0x000784e0..0x0007851f ( 64 items) : ../Release/pm_reload_analysis0.o::constinit___13 (Data, Local, .rodata.DMb.4)
66
+ 0x00078540..0x0007857f ( 64 items) : ../Release/pm_reload_analysis0.o::_ZZN12mllib_graphs23transpose4d_adf_wrapperI8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_EEvRNS2_9io_bufferIT_NS2_9direction2inET0_EERNSD_ISE_NSF_3outET1_EERA5_KjE6params (Data, Weak, .bss.DMb.64)
67
+ 0x00078580..0x000785bf ( 64 items) : ../Release/pm_reload_analysis0.o::add1d_attribute_broadcasting_params (Data, Global, .bss.DMb.64)
68
+ 0x000785c0..0x000785ff ( 64 items) : ../Release/pm_reload_analysis0.o::mul1d_attribute_broadcasting_params (Data, Global, .bss.DMb.64)
69
+ 0x00078600..0x0007863f ( 64 items) : ../Release/pm_reload_analysis0.o::add1d_params (Data, Global, .bss.DMb.64)
70
+ 0x00078640..0x0007867f ( 64 items) : ../Release/pm_reload_analysis0.o::mul1d_params (Data, Global, .bss.DMb.64)
71
+ 0x00078680..0x000786bf ( 64 items) : ../Release/pm_reload_analysis0.o::sub1d_params (Data, Global, .bss.DMb.64)
72
+ 0x000786c0..0x000786ff ( 64 items) : ../Release/pm_reload_analysis0.o::clip1d_params (Data, Global, .bss.DMb.64)
73
+ 0x00078700..0x0007873f ( 64 items) : ../Release/pm_reload_analysis0.o::sigmoid1d_params (Data, Global, .bss.DMb.64)
74
+ 0x00078740..0x0007877f ( 64 items) : ../Release/pm_reload_analysis0.o::tanh1d_params (Data, Global, .bss.DMb.64)
75
+ 0x00078780..0x0007893f ( 448 items) : ../Release/pm_reload_analysis0.o::conv2d_params (Data, Global, .bss.DMb.64)
76
+ 0x00078940..0x00078a3f ( 256 items) : ../Release/pm_reload_analysis0.o::conv2d_dw_params (Data, Global, .bss.DMb.64)
77
+ 0x00078a40..0x00078a7f ( 64 items) : ../Release/pm_reload_analysis0.o::avgpool2d_params (Data, Global, .bss.DMb.64)
78
+ 0x00078a80..0x00078abf ( 64 items) : ../Release/pm_reload_analysis0.o::pad_3d_params (Data, Global, .bss.DMb.64)
79
+ 0x00078ac0..0x00078b3f ( 128 items) : ../Release/pm_reload_analysis0.o::_ZZN12mllib_graphs18resize_adf_wrapperI8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_Li1ELi0ELi2EEEvRNS2_9io_bufferIT_NS2_9direction2inET0_EERNSD_ISE_NSF_3outET1_EERA16_KjE6params (Data, Weak, .bss.DMb.64)
80
+ 0x00078b40..0x00078bbf ( 128 items) : ../Release/pm_reload_analysis0.o::_ZZN12mllib_graphs18resize_adf_wrapperI8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_Li1ELi0ELi0EEEvRNS2_9io_bufferIT_NS2_9direction2inET0_EERNSD_ISE_NSF_3outET1_EERA16_KjE6params (Data, Weak, .bss.DMb.64)
81
+
82
+ Memory map for memory 'PM':
83
+
84
+ Size = 1048576
85
+ Width = 8 bits
86
+ Offset = 0
87
+ Used = 41432
88
+
89
+ 0x00000000..0x00000bd5 ( 3030 items) : ../Release/pm_reload_analysis0.o::_Z18pm_reload_analysisv (Function, Global, .text) (stack frame size = 768)
90
+
91
+ Called functions : _ZN12mllib_graphs18resize_adf_wrapperI8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_Li1ELi0ELi2EEEvRNS2_9io_bufferIT_NS2_9direction2inET0_EERNSD_ISE_NSF_3outET1_EERA16_Kj
92
+ _ZN12mllib_graphs17slice_adf_wrapperILi1E8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_EEvRNS2_9io_bufferIT0_NS2_9direction2inET1_EERNSD_ISE_NSF_3outET2_EERA7_Kj
93
+ _Z40superkernel_mul1d_attribute_broadcastingRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE
94
+ _Z17superkernel_add1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERNS0_IS1_NS2_3outESK_EE
95
+ _Z17superkernel_mul1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERNS0_IS1_NS2_3outESK_EE
96
+ _Z14conv2d_maxpoolRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEESF_RA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE
97
+ _Z40superkernel_add1d_attribute_broadcastingRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE
98
+ _Z18superkernel_clip1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE
99
+ _Z22superkernel_conv2d_dwcRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEESF_RA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE
100
+ _Z26superkernel_conv_eltbinaryRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEESF_RNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERA17_KjRNS0_IS1_NS2_3outESH_EE
101
+ _Z26superkernel_reduce_mean_c8RN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE
102
+ _Z21superkernel_sigmoid1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE
103
+ _Z17superkernel_sub1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERNS0_IS1_NS2_3outESK_EE
104
+ _Z18superkernel_tanh1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE
105
+ _Z19superkernel_avgpoolRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE
106
+ _ZN12mllib_graphs23transpose4d_adf_wrapperI8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_EEvRNS2_9io_bufferIT_NS2_9direction2inET0_EERNSD_ISE_NSF_3outET1_EERA5_Kj
107
+ _ZN12mllib_graphs18resize_adf_wrapperI8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_Li1ELi0ELi0EEEvRNS2_9io_bufferIT_NS2_9direction2inET0_EERNSD_ISE_NSF_3outET1_EERA16_Kj
108
+ _ZN12mllib_graphs18concat_adf_wrapperI8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_SC_EEvRNS2_9io_bufferIT_NS2_9direction2inET0_EERNSD_ISE_SG_T1_EERNSD_ISE_NSF_3outET2_EERA8_Kj
109
+
110
+ Referenced symbols: constinit
111
+ constinit___2
112
+ constinit___4
113
+ constinit___5
114
+ constinit___6
115
+ constinit___7
116
+ constinit___8
117
+ constinit___9
118
+ constinit___10
119
+ constinit___11
120
+ constinit___12
121
+ constinit___13
122
+ constinit___14
123
+ constinit___16
124
+
125
+ 0x00000be0..0x00001175 ( 1430 items) : ../Release/pm_reload_analysis0.o::_Z24setup_conv2d_bf16_paramsILb1ELb0EEvPKjR18conv2d_bf16_paramshh (Function, Weak, .text) (stack frame size = 64)
126
+ 0x00001180..0x0000128d ( 270 items) : ../Release/pm_reload_analysis0.o::_Z21convert_bf16_to_bfp16I8bfloat16Lb0EEvPT_PS0_RK13BfToBfpParams (Function, Weak, .text) (stack frame size = 0)
127
+
128
+ Referenced symbols: _ZN12me_primitive11control_rndE
129
+
130
+ 0x00001290..0x00001bf9 ( 2410 items) : ../Release/pm_reload_analysis0.o::_Z11conv2d_bf16ILh1EL5act_t0E8bfloat16S1_S1_N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_NS3_IS5_NS6_5asyncES9_SB_EELb0ELb0ELb1ELb0EEvRNS2_9io_bufferIT1_NS2_9direction2inET4_EERNSF_IT2_SI_T5_EERNSF_IT3_NSH_3outET6_EER18conv2d_bf16_params (Function, Weak, .text) (stack frame size = 128)
131
+
132
+ Called functions : _Z21convert_bf16_to_bfp16I8bfloat16Lb0EEvPT_PS0_RK13BfToBfpParams
133
+
134
+ Referenced symbols: _ZN12me_primitive11control_rndE
135
+
136
+ 0x00001c00..0x00001e37 ( 568 items) : ../Release/pm_reload_analysis0.o::_Z14conv2d_maxpoolRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEESF_RA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE (Function, Global, .text) (stack frame size = 64)
137
+
138
+ Called functions : _Z24setup_conv2d_bf16_paramsILb1ELb0EEvPKjR18conv2d_bf16_paramshh
139
+ _Z11conv2d_bf16ILh1EL5act_t0E8bfloat16S1_S1_N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_NS3_IS5_NS6_5asyncES9_SB_EELb0ELb0ELb1ELb0EEvRNS2_9io_bufferIT1_NS2_9direction2inET4_EERNSF_IT2_SI_T5_EERNSF_IT3_NSH_3outET6_EER18conv2d_bf16_params
140
+
141
+ Referenced symbols: _ZL9curr_iter
142
+ conv2d_params
143
+ _ZN12me_primitive11control_rndE
144
+ _ZN12me_primitive11control_satE
145
+ _ZL14num_depth_iter
146
+ _ZL8num_iter
147
+ _ZL10depth_iter
148
+ _ZL11total_iters
149
+
150
+ 0x00001e40..0x00001e57 ( 24 items) : ../Release/pm_reload_analysis0.o::_ZN18elementwise_binaryIJ8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS5_E (Function, Weak, .text) (stack frame size = 0)
151
+ 0x00001e60..0x00001f01 ( 162 items) : ../Release/pm_reload_analysis0.o::_ZN18elementwise_binaryIJ8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS5_EPKv (Function, Weak, .text) (stack frame size = 64)
152
+
153
+ Called functions : _ZN18elementwise_binaryIJ8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS5_E
154
+
155
+ 0x00001f10..0x00001f47 ( 56 items) : ../Release/pm_reload_analysis0.o::_ZN31elementwise_binary_broadcastingI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_EE5setupER27elementwise_binary_params_tIS5_E (Function, Weak, .text) (stack frame size = 0)
156
+ 0x00001f50..0x00001f8d ( 62 items) : ../Release/pm_reload_analysis0.o::_ZN31elementwise_binary_broadcastingI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_EE5setupER27elementwise_binary_params_tIS5_EPKv (Function, Weak, .text) (stack frame size = 64)
157
+
158
+ Called functions : _ZN18elementwise_binaryIJ8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS5_EPKv
159
+ _ZN31elementwise_binary_broadcastingI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_EE5setupER27elementwise_binary_params_tIS5_E
160
+
161
+ 0x00001f90..0x000020c9 ( 314 items) : ../Release/pm_reload_analysis0.o::_ZN31elementwise_binary_broadcastingI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_EE3runEPS0_S7_S7_R27elementwise_binary_params_tIS5_E (Function, Weak, .text) (stack frame size = 0)
162
+
163
+ Referenced symbols: _ZN12me_primitive11control_rndE
164
+
165
+ 0x000020d0..0x00002141 ( 114 items) : ../Release/pm_reload_analysis0.o::_ZN41elementwise_binary_attribute_broadcastingI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_EE3runEPS0_S7_R27elementwise_binary_params_tIS5_E (Function, Weak, .text) (stack frame size = 128)
166
+
167
+ Called functions : _ZN31elementwise_binary_broadcastingI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_EE3runEPS0_S7_S7_R27elementwise_binary_params_tIS5_E
168
+
169
+ 0x00002150..0x00002337 ( 488 items) : ../Release/pm_reload_analysis0.o::_Z40superkernel_add1d_attribute_broadcastingRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE (Function, Global, .text) (stack frame size = 64)
170
+
171
+ Called functions : _ZN31elementwise_binary_broadcastingI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_EE5setupER27elementwise_binary_params_tIS5_EPKv
172
+ _ZN41elementwise_binary_attribute_broadcastingI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_EE3runEPS0_S7_R27elementwise_binary_params_tIS5_E
173
+
174
+ Referenced symbols: _ZL9curr_iter
175
+ _ZL8core_row
176
+ add1d_attribute_broadcasting_params
177
+ _ZN12me_primitive11control_rndE
178
+ _ZN12me_primitive11control_satE
179
+ _ZL11ifm1_offset
180
+ _ZL8num_iter
181
+
182
+ 0x00002340..0x000023a3 ( 100 items) : ../Release/pm_reload_analysis0.o::_ZN17elementwise_unaryI8bfloat1616elementwise_clipIS0_E20clip_internal_paramsIS0_EE5setupER26elementwise_unary_params_tIS4_EPKv (Function, Weak, .text) (stack frame size = 0)
183
+ 0x000023b0..0x000024a1 ( 242 items) : ../Release/pm_reload_analysis0.o::_ZN17elementwise_unaryI8bfloat1616elementwise_clipIS0_E20clip_internal_paramsIS0_EE3runEPS0_S6_R26elementwise_unary_params_tIS4_E (Function, Weak, .text) (stack frame size = 0)
184
+ 0x000024b0..0x00002697 ( 488 items) : ../Release/pm_reload_analysis0.o::_Z18superkernel_clip1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE (Function, Global, .text) (stack frame size = 64)
185
+
186
+ Called functions : _ZN17elementwise_unaryI8bfloat1616elementwise_clipIS0_E20clip_internal_paramsIS0_EE5setupER26elementwise_unary_params_tIS4_EPKv
187
+ _ZN17elementwise_unaryI8bfloat1616elementwise_clipIS0_E20clip_internal_paramsIS0_EE3runEPS0_S6_R26elementwise_unary_params_tIS4_E
188
+
189
+ Referenced symbols: _ZL9curr_iter
190
+ _ZL8core_row
191
+ clip1d_params
192
+ _ZN12me_primitive11control_rndE
193
+ _ZN12me_primitive11control_satE
194
+ _ZL11ifm1_offset
195
+ _ZL8num_iter
196
+
197
+ 0x000026a0..0x00002713 ( 116 items) : ../Release/pm_reload_analysis0.o::_ZN25elementwise_binary_sharedI8bfloat1626mul_impl_broadcasting_attrIS0_E15shared_params_tIS0_EL5act_t0EE21shared_setup_backboneER27elementwise_binary_params_tIS4_EPKv (Function, Weak, .text) (stack frame size = 0)
198
+ 0x00002720..0x00002769 ( 74 items) : ../Release/pm_reload_analysis0.o::_ZN25elementwise_binary_sharedI8bfloat1626mul_impl_broadcasting_attrIS0_E15shared_params_tIS0_EL5act_t0EE5setupER27elementwise_binary_params_tIS4_EPKv (Function, Weak, .text) (stack frame size = 64)
199
+
200
+ Called functions : _ZN25elementwise_binary_sharedI8bfloat1626mul_impl_broadcasting_attrIS0_E15shared_params_tIS0_EL5act_t0EE21shared_setup_backboneER27elementwise_binary_params_tIS4_EPKv
201
+
202
+ 0x00002770..0x00002985 ( 534 items) : ../Release/pm_reload_analysis0.o::_ZL19shared_run_backboneI8bfloat16L5act_t0EEKvPT_S4_S4_R27elementwise_binary_params_tI15shared_params_tIS3_EE (Function, Local, .text) (stack frame size = 128)
203
+
204
+ Referenced symbols: _ZN12me_primitive11control_rndE
205
+
206
+ 0x00002990..0x00002a25 ( 150 items) : ../Release/pm_reload_analysis0.o::_ZN25elementwise_binary_sharedI8bfloat1626mul_impl_broadcasting_attrIS0_E15shared_params_tIS0_EL5act_t0EE3runEPS0_S7_R27elementwise_binary_params_tIS4_E (Function, Weak, .text) (stack frame size = 64)
207
+
208
+ Called functions : _ZL19shared_run_backboneI8bfloat16L5act_t0EEKvPT_S4_S4_R27elementwise_binary_params_tI15shared_params_tIS3_EE
209
+
210
+ 0x00002a30..0x00002c17 ( 488 items) : ../Release/pm_reload_analysis0.o::_Z40superkernel_mul1d_attribute_broadcastingRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE (Function, Global, .text) (stack frame size = 64)
211
+
212
+ Called functions : _ZN25elementwise_binary_sharedI8bfloat1626mul_impl_broadcasting_attrIS0_E15shared_params_tIS0_EL5act_t0EE5setupER27elementwise_binary_params_tIS4_EPKv
213
+ _ZN25elementwise_binary_sharedI8bfloat1626mul_impl_broadcasting_attrIS0_E15shared_params_tIS0_EL5act_t0EE3runEPS0_S7_R27elementwise_binary_params_tIS4_E
214
+
215
+ Referenced symbols: _ZL9curr_iter
216
+ _ZL8core_row
217
+ mul1d_attribute_broadcasting_params
218
+ _ZN12me_primitive11control_rndE
219
+ _ZN12me_primitive11control_satE
220
+ _ZL11ifm1_offset
221
+ _ZL8num_iter
222
+
223
+ 0x00002c20..0x00002c5d ( 62 items) : ../Release/pm_reload_analysis0.o::_ZN17elementwise_unaryI8bfloat1619elementwise_sigmoidIS0_E26sigmoid_templated_params_tIS0_EE5setupER26elementwise_unary_params_tIS4_EPKv (Function, Weak, .text) (stack frame size = 0)
224
+ 0x00002c60..0x00002dd9 ( 378 items) : ../Release/pm_reload_analysis0.o::_ZN17elementwise_unaryI8bfloat1619elementwise_sigmoidIS0_E26sigmoid_templated_params_tIS0_EE3runEPS0_S6_R26elementwise_unary_params_tIS4_E (Function, Weak, .text) (stack frame size = 0)
225
+
226
+ Referenced symbols: _ZN12me_primitive11control_rndE
227
+
228
+ 0x00002de0..0x00002fc7 ( 488 items) : ../Release/pm_reload_analysis0.o::_Z21superkernel_sigmoid1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE (Function, Global, .text) (stack frame size = 64)
229
+
230
+ Called functions : _ZN17elementwise_unaryI8bfloat1619elementwise_sigmoidIS0_E26sigmoid_templated_params_tIS0_EE5setupER26elementwise_unary_params_tIS4_EPKv
231
+ _ZN17elementwise_unaryI8bfloat1619elementwise_sigmoidIS0_E26sigmoid_templated_params_tIS0_EE3runEPS0_S6_R26elementwise_unary_params_tIS4_E
232
+
233
+ Referenced symbols: _ZL9curr_iter
234
+ _ZL8core_row
235
+ sigmoid1d_params
236
+ _ZN12me_primitive11control_rndE
237
+ _ZN12me_primitive11control_satE
238
+ _ZL11ifm1_offset
239
+ _ZL8num_iter
240
+
241
+ 0x00002fd0..0x0000300d ( 62 items) : ../Release/pm_reload_analysis0.o::_ZN17elementwise_unaryI8bfloat1616elementwise_tanhIS0_E23tanh_templated_params_tIS0_EE5setupER26elementwise_unary_params_tIS4_EPKv (Function, Weak, .text) (stack frame size = 0)
242
+ 0x00003010..0x000033d1 ( 962 items) : ../Release/pm_reload_analysis0.o::_ZN17elementwise_unaryI8bfloat1616elementwise_tanhIS0_E23tanh_templated_params_tIS0_EE3runEPS0_S6_R26elementwise_unary_params_tIS4_E (Function, Weak, .text) (stack frame size = 384)
243
+
244
+ Referenced symbols: _ZN12me_primitive11control_rndE
245
+
246
+ 0x000033e0..0x000035c7 ( 488 items) : ../Release/pm_reload_analysis0.o::_Z18superkernel_tanh1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE (Function, Global, .text) (stack frame size = 64)
247
+
248
+ Called functions : _ZN17elementwise_unaryI8bfloat1616elementwise_tanhIS0_E23tanh_templated_params_tIS0_EE5setupER26elementwise_unary_params_tIS4_EPKv
249
+ _ZN17elementwise_unaryI8bfloat1616elementwise_tanhIS0_E23tanh_templated_params_tIS0_EE3runEPS0_S6_R26elementwise_unary_params_tIS4_E
250
+
251
+ Referenced symbols: _ZL9curr_iter
252
+ _ZL8core_row
253
+ tanh1d_params
254
+ _ZN12me_primitive11control_rndE
255
+ _ZN12me_primitive11control_satE
256
+ _ZL11ifm1_offset
257
+ _ZL8num_iter
258
+
259
+ 0x000035d0..0x000038db ( 780 items) : ../Release/pm_reload_analysis0.o::_Z22setup_avgpool2d_paramsI8bfloat16EvPT_R25avgpool2d_internal_paramsIS1_Eh (Function, Weak, .text) (stack frame size = 64)
260
+ 0x000038e0..0x00003c77 ( 920 items) : ../Release/pm_reload_analysis0.o::_Z9avgpool2dILh1E8bfloat16Qsr5mllib5utilsE11is_one_of_vIT0_ahS0_EEvPS1_S2_R25avgpool2d_internal_paramsIS1_E (Function, Weak, .text) (stack frame size = 192)
261
+
262
+ Called functions : int32_to_float32
263
+
264
+ Referenced symbols: _ZN12me_primitive11control_rndE
265
+
266
+ 0x00003c80..0x00003e79 ( 506 items) : ../Release/pm_reload_analysis0.o::_Z19superkernel_avgpoolRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE (Function, Global, .text) (stack frame size = 128)
267
+
268
+ Called functions : _Z22setup_avgpool2d_paramsI8bfloat16EvPT_R25avgpool2d_internal_paramsIS1_Eh
269
+ _Z9avgpool2dILh1E8bfloat16Qsr5mllib5utilsE11is_one_of_vIT0_ahS0_EEvPS1_S2_R25avgpool2d_internal_paramsIS1_E
270
+
271
+ Referenced symbols: _ZL9curr_iter
272
+ _ZL8core_row
273
+ _ZN12me_primitive11control_rndE
274
+ _ZN12me_primitive11control_satE
275
+ avgpool2d_params
276
+ _ZL10ifmsv_size
277
+ _ZL8num_iter
278
+
279
+ 0x00003e80..0x00003ef3 ( 116 items) : ../Release/pm_reload_analysis0.o::_ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE21shared_setup_backboneER27elementwise_binary_params_tIS5_EPKv (Function, Weak, .text) (stack frame size = 0)
280
+ 0x00003f00..0x00003f61 ( 98 items) : ../Release/pm_reload_analysis0.o::_ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE5setupER27elementwise_binary_params_tIS5_EPKv (Function, Weak, .text) (stack frame size = 64)
281
+
282
+ Called functions : _ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE21shared_setup_backboneER27elementwise_binary_params_tIS5_EPKv
283
+
284
+ 0x00003f70..0x00003f7f ( 16 items) : ../Release/pm_reload_analysis0.o::_ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE3runEPS0_S7_S7_R27elementwise_binary_params_tIS5_E (Function, Weak, .text) (stack frame size = 0)
285
+
286
+ Called functions : _ZL19shared_run_backboneI8bfloat16L5act_t0EEKvPT_S4_S4_R27elementwise_binary_params_tI15shared_params_tIS3_EE
287
+
288
+ 0x00003f80..0x000041d9 ( 602 items) : ../Release/pm_reload_analysis0.o::_Z17superkernel_add1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERNS0_IS1_NS2_3outESK_EE (Function, Global, .text) (stack frame size = 64)
289
+
290
+ Called functions : _ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE5setupER27elementwise_binary_params_tIS5_EPKv
291
+ _ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE3runEPS0_S7_S7_R27elementwise_binary_params_tIS5_E
292
+
293
+ Referenced symbols: _ZL9curr_iter
294
+ _ZL8core_row
295
+ add1d_params
296
+ _ZN12me_primitive11control_rndE
297
+ _ZN12me_primitive11control_satE
298
+ _ZL11ifm1_offset
299
+ _ZL11ifm2_offset
300
+ _ZL8num_iter
301
+
302
+ 0x000041e0..0x000041f7 ( 24 items) : ../Release/pm_reload_analysis0.o::_ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS4_E (Function, Weak, .text) (stack frame size = 0)
303
+ 0x00004200..0x00004289 ( 138 items) : ../Release/pm_reload_analysis0.o::_ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS4_EPKv (Function, Weak, .text) (stack frame size = 64)
304
+
305
+ Called functions : _ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS4_E
306
+
307
+ 0x00004290..0x000043b3 ( 292 items) : ../Release/pm_reload_analysis0.o::_ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE3runEPS0_S6_S6_R27elementwise_binary_params_tIS4_E (Function, Weak, .text) (stack frame size = 0)
308
+
309
+ Referenced symbols: _ZN12me_primitive11control_rndE
310
+
311
+ 0x000043c0..0x00004619 ( 602 items) : ../Release/pm_reload_analysis0.o::_Z17superkernel_mul1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERNS0_IS1_NS2_3outESK_EE (Function, Global, .text) (stack frame size = 64)
312
+
313
+ Called functions : _ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS4_EPKv
314
+ _ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE3runEPS0_S6_S6_R27elementwise_binary_params_tIS4_E
315
+
316
+ Referenced symbols: _ZL9curr_iter
317
+ _ZL8core_row
318
+ mul1d_params
319
+ _ZN12me_primitive11control_rndE
320
+ _ZN12me_primitive11control_satE
321
+ _ZL11ifm1_offset
322
+ _ZL11ifm2_offset
323
+ _ZL8num_iter
324
+
325
+ 0x00004620..0x00004693 ( 116 items) : ../Release/pm_reload_analysis0.o::_ZN25elementwise_binary_sharedI8bfloat168sub_implIS0_E15shared_params_tIS0_EL5act_t0EE21shared_setup_backboneER27elementwise_binary_params_tIS4_EPKv (Function, Weak, .text) (stack frame size = 0)
326
+ 0x000046a0..0x000046e9 ( 74 items) : ../Release/pm_reload_analysis0.o::_ZN25elementwise_binary_sharedI8bfloat168sub_implIS0_E15shared_params_tIS0_EL5act_t0EE5setupER27elementwise_binary_params_tIS4_EPKv (Function, Weak, .text) (stack frame size = 64)
327
+
328
+ Called functions : _ZN25elementwise_binary_sharedI8bfloat168sub_implIS0_E15shared_params_tIS0_EL5act_t0EE21shared_setup_backboneER27elementwise_binary_params_tIS4_EPKv
329
+
330
+ 0x000046f0..0x000046ff ( 16 items) : ../Release/pm_reload_analysis0.o::_ZN25elementwise_binary_sharedI8bfloat168sub_implIS0_E15shared_params_tIS0_EL5act_t0EE3runEPS0_S7_S7_R27elementwise_binary_params_tIS4_E (Function, Weak, .text) (stack frame size = 0)
331
+
332
+ Called functions : _ZL19shared_run_backboneI8bfloat16L5act_t0EEKvPT_S4_S4_R27elementwise_binary_params_tI15shared_params_tIS3_EE
333
+
334
+ 0x00004700..0x00004959 ( 602 items) : ../Release/pm_reload_analysis0.o::_Z17superkernel_sub1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERNS0_IS1_NS2_3outESK_EE (Function, Global, .text) (stack frame size = 64)
335
+
336
+ Called functions : _ZN25elementwise_binary_sharedI8bfloat168sub_implIS0_E15shared_params_tIS0_EL5act_t0EE5setupER27elementwise_binary_params_tIS4_EPKv
337
+ _ZN25elementwise_binary_sharedI8bfloat168sub_implIS0_E15shared_params_tIS0_EL5act_t0EE3runEPS0_S7_S7_R27elementwise_binary_params_tIS4_E
338
+
339
+ Referenced symbols: _ZL9curr_iter
340
+ _ZL8core_row
341
+ sub1d_params
342
+ _ZN12me_primitive11control_rndE
343
+ _ZN12me_primitive11control_satE
344
+ _ZL11ifm1_offset
345
+ _ZL11ifm2_offset
346
+ _ZL8num_iter
347
+
348
+ 0x00004960..0x00004bff ( 672 items) : ../Release/pm_reload_analysis0.o::_ZL27setup_conv2d_dw_params_bf16PKjR21conv2d_dw_bf16_paramsh (Function, Local, .text) (stack frame size = 64)
349
+
350
+ Called functions : _ZN12me_primitive10udiv_dstepEjjRjS0_
351
+
352
+ Referenced symbols: conv2d_dw_params
353
+ _ZN12me_primitive11control_rndE
354
+
355
+ 0x00004c00..0x00004ed1 ( 722 items) : ../Release/pm_reload_analysis0.o::_Z9conv2d_dwILh1E8bfloat16S0_S0_N3adf16io_buffer_configINS1_7extentsIJEEENS1_7locking4syncENS1_10addressing6linearENS1_6marginILj0EEEEESB_NS2_IS4_NS5_5asyncES8_SA_EEQsr3stdE9is_same_vIT0_S0_EEvRNS1_9io_bufferISE_NS1_9direction2inET3_EERNSF_IT1_SH_T4_EERNSF_IT2_NSG_3outET5_EER21conv2d_dw_bf16_params (Function, Weak, .text) (stack frame size = 0)
356
+
357
+ Referenced symbols: _ZN12me_primitive11control_rndE
358
+
359
+ 0x00004ee0..0x000050bd ( 478 items) : ../Release/pm_reload_analysis0.o::_Z22superkernel_conv2d_dwcRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEESF_RA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE (Function, Global, .text) (stack frame size = 128)
360
+
361
+ Called functions : _ZL27setup_conv2d_dw_params_bf16PKjR21conv2d_dw_bf16_paramsh
362
+ _Z9conv2d_dwILh1E8bfloat16S0_S0_N3adf16io_buffer_configINS1_7extentsIJEEENS1_7locking4syncENS1_10addressing6linearENS1_6marginILj0EEEEESB_NS2_IS4_NS5_5asyncES8_SA_EEQsr3stdE9is_same_vIT0_S0_EEvRNS1_9io_bufferISE_NS1_9direction2inET3_EERNSF_IT1_SH_T4_EERNSF_IT2_NSG_3outET5_EER21conv2d_dw_bf16_params
363
+
364
+ Referenced symbols: _ZL9curr_iter
365
+ _ZL8core_row
366
+ _ZN12me_primitive11control_rndE
367
+ _ZN12me_primitive11control_satE
368
+ _ZL8num_iter
369
+ _ZL10ifmsv_size
370
+ conv2d_dw_params
371
+
372
+ 0x000050c0..0x000056f3 ( 1588 items) : ../Release/pm_reload_analysis0.o::_ZN18reduce_skeleton_c8I8bfloat1619reduce_mean_c8_implIS0_E23reduce_mean_c8_params_tIS0_EE5setupER18reduce_c8_params_tIS4_EPKv (Function, Weak, .text) (stack frame size = 64)
373
+ 0x00005700..0x0000599d ( 670 items) : ../Release/pm_reload_analysis0.o::_Z6pad_3dIL11pad_3d_mode0E8bfloat16Li1EEvPT0_S3_R15pad_3d_params_t (Function, Weak, .text) (stack frame size = 0)
374
+ 0x000059a0..0x00006417 ( 2680 items) : ../Release/pm_reload_analysis0.o::_ZN18reduce_skeleton_c8I8bfloat1619reduce_mean_c8_implIS0_E23reduce_mean_c8_params_tIS0_EE3runEPS0_S6_R18reduce_c8_params_tIS4_E (Function, Weak, .text) (stack frame size = 256)
375
+
376
+ Called functions : _ZN12me_primitive10udiv_dstepEjjRjS0_
377
+
378
+ Referenced symbols: _ZN12me_primitive11control_rndE
379
+
380
+ 0x00006420..0x00006e93 ( 2676 items) : ../Release/pm_reload_analysis0.o::_Z26superkernel_reduce_mean_c8RN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE (Function, Global, .text) (stack frame size = 128)
381
+
382
+ Called functions : _ZN18reduce_skeleton_c8I8bfloat1619reduce_mean_c8_implIS0_E23reduce_mean_c8_params_tIS0_EE5setupER18reduce_c8_params_tIS4_EPKv
383
+ int32_to_float32
384
+ float32_add
385
+ _ZN12me_primitive10udiv_dstepEjjRjS0_
386
+ _Z6pad_3dIL11pad_3d_mode0E8bfloat16Li1EEvPT0_S3_R15pad_3d_params_t
387
+ _ZN18reduce_skeleton_c8I8bfloat1619reduce_mean_c8_implIS0_E23reduce_mean_c8_params_tIS0_EE3runEPS0_S6_R18reduce_c8_params_tIS4_E
388
+
389
+ Referenced symbols: _ZL9curr_iter
390
+ _ZL8core_row
391
+ _ZN12me_primitive11control_satE
392
+ _ZN12me_primitive11control_rndE
393
+ reduce_mean_c8_params
394
+ _ZL11reduce_axis
395
+ _ZL11ifm1_offset
396
+ pad_3d_params
397
+ _ZL8num_iter
398
+ _ZL8l3_width
399
+ _ZL9l3_height
400
+ _ZL8l3_depth
401
+ _ZL10depth_iter
402
+ _ZL10width_iter
403
+ _ZL11height_iter
404
+
405
+ 0x00006ea0..0x00007305 ( 1126 items) : ../Release/pm_reload_analysis0.o::_Z26superkernel_conv_eltbinaryRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEESF_RNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERA17_KjRNS0_IS1_NS2_3outESH_EE (Function, Global, .text) (stack frame size = 64)
406
+
407
+ Called functions : _Z24setup_conv2d_bf16_paramsILb1ELb0EEvPKjR18conv2d_bf16_paramshh
408
+ _ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE5setupER27elementwise_binary_params_tIS5_EPKv
409
+ _ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS4_EPKv
410
+ _Z11conv2d_bf16ILh1EL5act_t0E8bfloat16S1_S1_N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_NS3_IS5_NS6_5asyncES9_SB_EELb0ELb0ELb1ELb0EEvRNS2_9io_bufferIT1_NS2_9direction2inET4_EERNSF_IT2_SI_T5_EERNSF_IT3_NSH_3outET6_EER18conv2d_bf16_params
411
+ _ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE3runEPS0_S7_S7_R27elementwise_binary_params_tIS5_E
412
+ _ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE3runEPS0_S6_S6_R27elementwise_binary_params_tIS4_E
413
+
414
+ Referenced symbols: _ZL9curr_iter
415
+ _ZL8core_row
416
+ _ZN12me_primitive11control_rndE
417
+ _ZN12me_primitive11control_satE
418
+ conv2d_params
419
+ add1d_params
420
+ mul1d_params
421
+ _ZL14num_depth_iter
422
+ _ZL11ifm2_offset
423
+ _ZL8num_iter
424
+ _ZL10depth_iter
425
+ _ZL11total_iters
426
+
427
+ 0x00007310..0x0000793f ( 1584 items) : ../Release/pm_reload_analysis0.o::_Z23resize_bilinear_scale_2I8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_S0_EEvPS1_PfS2_jjjj (Function, Weak, .text) (stack frame size = 0)
428
+
429
+ Referenced symbols: __const____Z23resize_bilinear_scale_2I8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_S0_EEvPS1_PfS2_jjjj___coeffs
430
+ __const____Z23resize_bilinear_scale_2I8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_S0_EEvPS1_PfS2_jjjj___coeffs_asymmetric
431
+ _ZN12me_primitive11control_rndE
432
+
433
+ 0x00007940..0x00007b15 ( 470 items) : ../Release/pm_reload_analysis0.o::_ZN12mllib_graphs18resize_adf_wrapperI8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_Li1ELi0ELi2EEEvRNS2_9io_bufferIT_NS2_9direction2inET0_EERNSD_ISE_NSF_3outET1_EERA16_Kj (Function, Weak, .text) (stack frame size = 0)
434
+
435
+ Called functions : _Z23resize_bilinear_scale_2I8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_S0_EEvPS1_PfS2_jjjj
436
+
437
+ Referenced symbols: _ZZN12mllib_graphs18resize_adf_wrapperI8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_Li1ELi0ELi2EEEvRNS2_9io_bufferIT_NS2_9direction2inET0_EERNSD_ISE_NSF_3outET1_EERA16_KjE8cur_iter
438
+ _ZN12me_primitive11control_satE
439
+ _ZN12me_primitive11control_rndE
440
+ _ZZN12mllib_graphs18resize_adf_wrapperI8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_Li1ELi0ELi2EEEvRNS2_9io_bufferIT_NS2_9direction2inET0_EERNSD_ISE_NSF_3outET1_EERA16_KjE6params
441
+
442
+ 0x00007b20..0x00007e2d ( 782 items) : ../Release/pm_reload_analysis0.o::_Z11slice_hcwc8I8bfloat16EvPT_S2_R18slice_hcwc8_params (Function, Weak, .text) (stack frame size = 0)
443
+ 0x00007e30..0x000080d1 ( 674 items) : ../Release/pm_reload_analysis0.o::_ZN12mllib_graphs17slice_adf_wrapperILi1E8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_EEvRNS2_9io_bufferIT0_NS2_9direction2inET1_EERNSD_ISE_NSF_3outET2_EERA7_Kj (Function, Weak, .text) (stack frame size = 192)
444
+
445
+ Called functions : _Z11slice_hcwc8I8bfloat16EvPT_S2_R18slice_hcwc8_params
446
+
447
+ 0x000080e0..0x00008129 ( 74 items) : ../Release/pm_reload_analysis0.o::_Z29setup_transposeshuffle_paramsI8bfloat16EvR23transposeshuffle_paramsRA5_Kj (Function, Weak, .text) (stack frame size = 0)
448
+ 0x00008130..0x000082fd ( 462 items) : ../Release/pm_reload_analysis0.o::_Z16transposeshuffleI8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_aS0_EEvPS1_S2_R23transposeshuffle_params (Function, Weak, .text) (stack frame size = 0)
449
+ 0x00008300..0x00008371 ( 114 items) : ../Release/pm_reload_analysis0.o::_ZN12mllib_graphs23transpose4d_adf_wrapperI8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_EEvRNS2_9io_bufferIT_NS2_9direction2inET0_EERNSD_ISE_NSF_3outET1_EERA5_Kj (Function, Weak, .text) (stack frame size = 64)
450
+
451
+ Called functions : _Z29setup_transposeshuffle_paramsI8bfloat16EvR23transposeshuffle_paramsRA5_Kj
452
+ _Z16transposeshuffleI8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_aS0_EEvPS1_S2_R23transposeshuffle_params
453
+
454
+ Referenced symbols: _ZZN12mllib_graphs23transpose4d_adf_wrapperI8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_EEvRNS2_9io_bufferIT_NS2_9direction2inET0_EERNSD_ISE_NSF_3outET1_EERA5_KjE6params
455
+
456
+ 0x00008380..0x00009245 ( 3782 items) : ../Release/pm_reload_analysis0.o::_Z15resize_bilinearI8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_aS0_EEvPS1_S2_R29resize_common_internal_params (Function, Weak, .text) (stack frame size = 1792)
457
+
458
+ Called functions : int32_to_float32
459
+
460
+ Referenced symbols: _ZN12me_primitive11control_satE
461
+ _ZN12me_primitive11control_rndE
462
+
463
+ 0x00009250..0x000097ad ( 1374 items) : ../Release/pm_reload_analysis0.o::_ZN12mllib_graphs18resize_adf_wrapperI8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_Li1ELi0ELi0EEEvRNS2_9io_bufferIT_NS2_9direction2inET0_EERNSD_ISE_NSF_3outET1_EERA16_Kj (Function, Weak, .text) (stack frame size = 64)
464
+
465
+ Called functions : _ZN12me_primitive10udiv_dstepEjjRjS0_
466
+ _Z15resize_bilinearI8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_aS0_EEvPS1_S2_R29resize_common_internal_params
467
+
468
+ Referenced symbols: _ZZN12mllib_graphs18resize_adf_wrapperI8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_Li1ELi0ELi0EEEvRNS2_9io_bufferIT_NS2_9direction2inET0_EERNSD_ISE_NSF_3outET1_EERA16_KjE8cur_iter
469
+ _ZN12me_primitive11control_satE
470
+ _ZN12me_primitive11control_rndE
471
+ _ZZN12mllib_graphs18resize_adf_wrapperI8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_Li1ELi0ELi0EEEvRNS2_9io_bufferIT_NS2_9direction2inET0_EERNSD_ISE_NSF_3outET1_EERA16_KjE6params
472
+
473
+ 0x000097b0..0x00009ae1 ( 818 items) : ../Release/pm_reload_analysis0.o::_ZN12mllib_graphs18concat_adf_wrapperI8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_SC_EEvRNS2_9io_bufferIT_NS2_9direction2inET0_EERNSD_ISE_SG_T1_EERNSD_ISE_NSF_3outET2_EERA8_Kj (Function, Weak, .text) (stack frame size = 0)
474
+
475
+ Referenced symbols: _ZN9ns_concatL11kernel_iterE
476
+ _ZN12me_primitive11control_rndE
477
+ _ZN9ns_concatL8core_rowE
478
+ _ZN12me_primitive11control_satE
479
+ _ZN9ns_concatL8core_colE
480
+
481
+ 0x00009af0..0x00009b7d ( 142 items) : me_div.o(/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/Release/libme.a)::_ZN12me_primitive10udiv_dstepEjjRjS0_ (Function, Global, .text) (stack frame size = 0)
482
+ 0x00009b80..0x00009bef ( 112 items) : softfloat.o(/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/softfloat/lib/Release/libsoftfloat.a)::_ZL19propagateFloat32NaNjj (Function, Local, .text) (stack frame size = 0)
483
+ 0x00009bf0..0x00009d77 ( 392 items) : softfloat.o(/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/softfloat/lib/Release/libsoftfloat.a)::_ZL19roundAndPackFloat32iij (Function, Local, .text) (stack frame size = 0)
484
+
485
+ Referenced symbols: float_rounding_mode
486
+
487
+ 0x00009d80..0x00009d97 ( 24 items) : softfloat.o(/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/softfloat/lib/Release/libsoftfloat.a)::_ZL28normalizeRoundAndPackFloat32iij (Function, Local, .text) (stack frame size = 0)
488
+
489
+ Called functions : _ZL19roundAndPackFloat32iij
490
+
491
+ 0x00009da0..0x00009e11 ( 114 items) : softfloat.o(/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/softfloat/lib/Release/libsoftfloat.a)::int32_to_float32 (Function, Global, .text) (stack frame size = 0)
492
+
493
+ Called functions : _ZL28normalizeRoundAndPackFloat32iij
494
+
495
+ 0x00009e20..0x0000a08f ( 624 items) : softfloat.o(/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/softfloat/lib/Release/libsoftfloat.a)::_ZL14addFloat32Sigsjji (Function, Local, .text) (stack frame size = 0)
496
+
497
+ Called functions : _ZL19roundAndPackFloat32iij
498
+ _ZL19propagateFloat32NaNjj
499
+
500
+ 0x0000a090..0x0000a37f ( 752 items) : softfloat.o(/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/softfloat/lib/Release/libsoftfloat.a)::_ZL14subFloat32Sigsjji (Function, Local, .text) (stack frame size = 0)
501
+
502
+ Called functions : _ZL28normalizeRoundAndPackFloat32iij
503
+ _ZL19propagateFloat32NaNjj
504
+
505
+ Referenced symbols: float_rounding_mode
506
+
507
+ 0x0000a380..0x0000a3bf ( 64 items) : softfloat.o(/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/softfloat/lib/Release/libsoftfloat.a)::float32_add (Function, Global, .text) (stack frame size = 0)
508
+
509
+ Called functions : _ZL14subFloat32Sigsjji
510
+ _ZL14addFloat32Sigsjji
511
+
512
+
513
+ External symbols:
514
+
515
+ __dso_handle = 0x0
516
+ _ctors_end = 0x0
517
+ _ctors_start = 0x0
518
+ _dtors_end = 0x0
519
+ _dtors_start = 0x0
520
+ _pc_end = 0xa3c0
521
+ _pc_start = 0x0
522
+ _sp_end_DM_stack = 0x78000
523
+ _sp_start_DM_stack = 0x70000
524
+
525
+ Section summary for memory 'DM_stack':
526
+
527
+ .stack File
528
+ ---------- ----------
529
+ 32768
530
+ ---------- ----------
531
+ 32768 Total
532
+
533
+ Section summary for memory 'DMb':
534
+
535
+ .bss .data .rodata File
536
+ ---------- ---------- ---------- ----------
537
+ 4 0 0 softfloat.o(/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/softfloat/lib/Release/libsoftfloat.a)
538
+ 5 0 0 me_defs.o(/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/Release/libme.a)
539
+ 1740 132 964 ../Release/pm_reload_analysis0.o
540
+ ---------- ---------- ---------- ----------
541
+ 1749 132 964 Total
542
+
543
+ Section summary for memory 'PM':
544
+
545
+ .text File
546
+ ---------- ----------
547
+ 2082 softfloat.o(/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/softfloat/lib/Release/libsoftfloat.a)
548
+ 142 me_div.o(/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/Release/libme.a)
549
+ 39208 ../Release/pm_reload_analysis0.o
550
+ ---------- ----------
551
+ 41432 Total
552
+
553
+ File summary:
554
+
555
+ ../Release/pm_reload_analysis0.o
556
+ DMb 2836
557
+ PM 39208
558
+
559
+ me_defs.o(/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/Release/libme.a)
560
+ DMb 5
561
+
562
+ softfloat.o(/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/softfloat/lib/Release/libsoftfloat.a)
563
+ DMb 4
564
+ PM 2082
565
+
566
+ me_div.o(/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/Release/libme.a)
567
+ PM 142
568
+
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/pm_reload_analysis0/Release/pm_reload_analysis0.o.lst ADDED
The diff for this file is too large to render. See raw diff
 
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/pm_reload_analysis0/Release/pm_reload_analysis0.sdr ADDED
@@ -0,0 +1,164 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+
2
+ // File generated by bridge version V-2024.06#84922c0d9f#241219, Fri Mar 21 03:37:44 2025
3
+ // Copyright 2014-2024 Synopsys, Inc. All rights reserved.
4
+ // bridge -o../Release/pm_reload_analysis0 ../Release/pm_reload_analysis0.o -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/isg -g -I/usr/local/lib/python3.10/dist-packages/include -I/app/vaiml_1.3_examples/camo/./segmentation_1_4_0_fp32_combined/vaiml_par_0/0/backend -I/usr/local/lib/python3.10/site-packages/include/aie_api -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/common -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/include/common -I/usr/local/lib/python3.10/dist-packages/vitis_mllib -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/misc -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/src/ml_adf -I/app/vaiml_1.3_examples/camo/segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/. -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libcxx-lite/include -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libs/libcxx-9.0.0/include-lite -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime/include -D__AIENGINE__ -D__AIE_ARCH__=21 -DDEPLOYMENT_ELF=1 -D__LOCK_FENCE_MODE__=0 -D__IO_BUFFER_FORCE_LIGHT_WEIGHT__ -DAIE_API_EMULATE_BFLOAT16_MMUL_WITH_BFP16=1 -DAIE_OPTION_SCALAR_FLOAT_ON_VECTOR -D__tct_tgt__=241219 -cpm_reload_analysis0.bcf -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/softfloat/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libcxx-lite/lib/Release_LLVM -lme -lc -lm -lc++lite -lsoftfloat -S -export-locals -iconfig extra_memories.bcf -yTM -m -fC -fS -fH +m -T +work ../Release/chesswork495 -pme
5
+
6
+ // Release: ipp V-2024.06-TGT-241219
7
+
8
+ // Symbols in memory 'DM_bankA':
9
+ // Symbols in memory 'DM_bankAB':
10
+ // Symbols in memory 'DM_bankAC':
11
+ // Symbols in memory 'DM_bankAD':
12
+ // Symbols in memory 'DM_bankB':
13
+ // Symbols in memory 'DM_bankBC':
14
+ // Symbols in memory 'DM_bankBD':
15
+ // Symbols in memory 'DM_bankC':
16
+ // Symbols in memory 'DM_bankCD':
17
+ // Symbols in memory 'DM_bankD':
18
+ // Symbols in memory 'DM_stack':
19
+ // Symbols in memory 'DM_test':
20
+ // Symbols in memory 'DMb':
21
+ _symbol _ZZN12mllib_graphs18resize_adf_wrapperI8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_Li1ELi0ELi2EEEvRNS2_9io_bufferIT_NS2_9direction2inET0_EERNSD_ISE_NSF_3outET1_EERA16_KjE8cur_iter 0x00078044
22
+ _symbol _ZZN12mllib_graphs18resize_adf_wrapperI8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_Li1ELi0ELi0EEEvRNS2_9io_bufferIT_NS2_9direction2inET0_EERNSD_ISE_NSF_3outET1_EERA16_KjE8cur_iter 0x00078048
23
+ _symbol _ZN12me_primitive11control_satE 0x00078050
24
+ _symbol _ZN12me_primitive11control_rndE 0x00078054
25
+ _symbol float_rounding_mode 0x00078058
26
+ _symbol reduce_mean_c8_params 0x00078080
27
+ _symbol _ZZN12mllib_graphs23transpose4d_adf_wrapperI8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_EEvRNS2_9io_bufferIT_NS2_9direction2inET0_EERNSD_ISE_NSF_3outET1_EERA5_KjE6params 0x00078540
28
+ _symbol add1d_attribute_broadcasting_params 0x00078580
29
+ _symbol mul1d_attribute_broadcasting_params 0x000785c0
30
+ _symbol add1d_params 0x00078600
31
+ _symbol mul1d_params 0x00078640
32
+ _symbol sub1d_params 0x00078680
33
+ _symbol clip1d_params 0x000786c0
34
+ _symbol sigmoid1d_params 0x00078700
35
+ _symbol tanh1d_params 0x00078740
36
+ _symbol conv2d_params 0x00078780
37
+ _symbol conv2d_dw_params 0x00078940
38
+ _symbol avgpool2d_params 0x00078a40
39
+ _symbol pad_3d_params 0x00078a80
40
+ _symbol _ZZN12mllib_graphs18resize_adf_wrapperI8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_Li1ELi0ELi2EEEvRNS2_9io_bufferIT_NS2_9direction2inET0_EERNSD_ISE_NSF_3outET1_EERA16_KjE6params 0x00078ac0
41
+ _symbol _ZZN12mllib_graphs18resize_adf_wrapperI8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_Li1ELi0ELi0EEEvRNS2_9io_bufferIT_NS2_9direction2inET0_EERNSD_ISE_NSF_3outET1_EERA16_KjE6params 0x00078b40
42
+ // Symbols in memory 'DMh':
43
+ // Symbols in memory 'DMh_bankA':
44
+ // Symbols in memory 'DMh_bankAB':
45
+ // Symbols in memory 'DMh_bankAC':
46
+ // Symbols in memory 'DMh_bankAD':
47
+ // Symbols in memory 'DMh_bankB':
48
+ // Symbols in memory 'DMh_bankBC':
49
+ // Symbols in memory 'DMh_bankBD':
50
+ // Symbols in memory 'DMh_bankC':
51
+ // Symbols in memory 'DMh_bankCD':
52
+ // Symbols in memory 'DMh_bankD':
53
+ // Symbols in memory 'DMh_stack':
54
+ // Symbols in memory 'DMs':
55
+ // Symbols in memory 'DMs_bankA':
56
+ // Symbols in memory 'DMs_bankAB':
57
+ // Symbols in memory 'DMs_bankAC':
58
+ // Symbols in memory 'DMs_bankAD':
59
+ // Symbols in memory 'DMs_bankB':
60
+ // Symbols in memory 'DMs_bankBC':
61
+ // Symbols in memory 'DMs_bankBD':
62
+ // Symbols in memory 'DMs_bankC':
63
+ // Symbols in memory 'DMs_bankCD':
64
+ // Symbols in memory 'DMs_bankD':
65
+ // Symbols in memory 'DMs_stack':
66
+ // Symbols in memory 'DMv':
67
+ // Symbols in memory 'DMv_bankA':
68
+ // Symbols in memory 'DMv_bankAB':
69
+ // Symbols in memory 'DMv_bankAC':
70
+ // Symbols in memory 'DMv_bankAD':
71
+ // Symbols in memory 'DMv_bankB':
72
+ // Symbols in memory 'DMv_bankBC':
73
+ // Symbols in memory 'DMv_bankBD':
74
+ // Symbols in memory 'DMv_bankC':
75
+ // Symbols in memory 'DMv_bankCD':
76
+ // Symbols in memory 'DMv_bankD':
77
+ // Symbols in memory 'DMv_stack':
78
+ // Symbols in memory 'DMw':
79
+ // Symbols in memory 'DMw_bankA':
80
+ // Symbols in memory 'DMw_bankAB':
81
+ // Symbols in memory 'DMw_bankAC':
82
+ // Symbols in memory 'DMw_bankAD':
83
+ // Symbols in memory 'DMw_bankB':
84
+ // Symbols in memory 'DMw_bankBC':
85
+ // Symbols in memory 'DMw_bankBD':
86
+ // Symbols in memory 'DMw_bankC':
87
+ // Symbols in memory 'DMw_bankCD':
88
+ // Symbols in memory 'DMw_bankD':
89
+ // Symbols in memory 'DMw_stack':
90
+ // Symbols in memory 'DMx':
91
+ // Symbols in memory 'DMx_bankA':
92
+ // Symbols in memory 'DMx_bankAB':
93
+ // Symbols in memory 'DMx_bankAC':
94
+ // Symbols in memory 'DMx_bankAD':
95
+ // Symbols in memory 'DMx_bankB':
96
+ // Symbols in memory 'DMx_bankBC':
97
+ // Symbols in memory 'DMx_bankBD':
98
+ // Symbols in memory 'DMx_bankC':
99
+ // Symbols in memory 'DMx_bankCD':
100
+ // Symbols in memory 'DMx_bankD':
101
+ // Symbols in memory 'DMx_stack':
102
+ // Symbols in memory 'PM':
103
+ _symbol _Z18pm_reload_analysisv 0x00000000
104
+ _symbol _Z24setup_conv2d_bf16_paramsILb1ELb0EEvPKjR18conv2d_bf16_paramshh 0x00000be0
105
+ _symbol _Z21convert_bf16_to_bfp16I8bfloat16Lb0EEvPT_PS0_RK13BfToBfpParams 0x00001180
106
+ _symbol _Z11conv2d_bf16ILh1EL5act_t0E8bfloat16S1_S1_N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_NS3_IS5_NS6_5asyncES9_SB_EELb0ELb0ELb1ELb0EEvRNS2_9io_bufferIT1_NS2_9direction2inET4_EERNSF_IT2_SI_T5_EERNSF_IT3_NSH_3outET6_EER18conv2d_bf16_params 0x00001290
107
+ _symbol _Z14conv2d_maxpoolRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEESF_RA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE 0x00001c00
108
+ _symbol _ZN18elementwise_binaryIJ8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS5_E 0x00001e40
109
+ _symbol _ZN18elementwise_binaryIJ8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS5_EPKv 0x00001e60
110
+ _symbol _ZN31elementwise_binary_broadcastingI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_EE5setupER27elementwise_binary_params_tIS5_E 0x00001f10
111
+ _symbol _ZN31elementwise_binary_broadcastingI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_EE5setupER27elementwise_binary_params_tIS5_EPKv 0x00001f50
112
+ _symbol _ZN31elementwise_binary_broadcastingI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_EE3runEPS0_S7_S7_R27elementwise_binary_params_tIS5_E 0x00001f90
113
+ _symbol _ZN41elementwise_binary_attribute_broadcastingI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_EE3runEPS0_S7_R27elementwise_binary_params_tIS5_E 0x000020d0
114
+ _symbol _Z40superkernel_add1d_attribute_broadcastingRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE 0x00002150
115
+ _symbol _ZN17elementwise_unaryI8bfloat1616elementwise_clipIS0_E20clip_internal_paramsIS0_EE5setupER26elementwise_unary_params_tIS4_EPKv 0x00002340
116
+ _symbol _ZN17elementwise_unaryI8bfloat1616elementwise_clipIS0_E20clip_internal_paramsIS0_EE3runEPS0_S6_R26elementwise_unary_params_tIS4_E 0x000023b0
117
+ _symbol _Z18superkernel_clip1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE 0x000024b0
118
+ _symbol _ZN25elementwise_binary_sharedI8bfloat1626mul_impl_broadcasting_attrIS0_E15shared_params_tIS0_EL5act_t0EE21shared_setup_backboneER27elementwise_binary_params_tIS4_EPKv 0x000026a0
119
+ _symbol _ZN25elementwise_binary_sharedI8bfloat1626mul_impl_broadcasting_attrIS0_E15shared_params_tIS0_EL5act_t0EE5setupER27elementwise_binary_params_tIS4_EPKv 0x00002720
120
+ _symbol _ZN25elementwise_binary_sharedI8bfloat1626mul_impl_broadcasting_attrIS0_E15shared_params_tIS0_EL5act_t0EE3runEPS0_S7_R27elementwise_binary_params_tIS4_E 0x00002990
121
+ _symbol _Z40superkernel_mul1d_attribute_broadcastingRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE 0x00002a30
122
+ _symbol _ZN17elementwise_unaryI8bfloat1619elementwise_sigmoidIS0_E26sigmoid_templated_params_tIS0_EE5setupER26elementwise_unary_params_tIS4_EPKv 0x00002c20
123
+ _symbol _ZN17elementwise_unaryI8bfloat1619elementwise_sigmoidIS0_E26sigmoid_templated_params_tIS0_EE3runEPS0_S6_R26elementwise_unary_params_tIS4_E 0x00002c60
124
+ _symbol _Z21superkernel_sigmoid1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE 0x00002de0
125
+ _symbol _ZN17elementwise_unaryI8bfloat1616elementwise_tanhIS0_E23tanh_templated_params_tIS0_EE5setupER26elementwise_unary_params_tIS4_EPKv 0x00002fd0
126
+ _symbol _ZN17elementwise_unaryI8bfloat1616elementwise_tanhIS0_E23tanh_templated_params_tIS0_EE3runEPS0_S6_R26elementwise_unary_params_tIS4_E 0x00003010
127
+ _symbol _Z18superkernel_tanh1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE 0x000033e0
128
+ _symbol _Z22setup_avgpool2d_paramsI8bfloat16EvPT_R25avgpool2d_internal_paramsIS1_Eh 0x000035d0
129
+ _symbol _Z9avgpool2dILh1E8bfloat16Qsr5mllib5utilsE11is_one_of_vIT0_ahS0_EEvPS1_S2_R25avgpool2d_internal_paramsIS1_E 0x000038e0
130
+ _symbol _Z19superkernel_avgpoolRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE 0x00003c80
131
+ _symbol _ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE21shared_setup_backboneER27elementwise_binary_params_tIS5_EPKv 0x00003e80
132
+ _symbol _ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE5setupER27elementwise_binary_params_tIS5_EPKv 0x00003f00
133
+ _symbol _ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE3runEPS0_S7_S7_R27elementwise_binary_params_tIS5_E 0x00003f70
134
+ _symbol _Z17superkernel_add1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERNS0_IS1_NS2_3outESK_EE 0x00003f80
135
+ _symbol _ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS4_E 0x000041e0
136
+ _symbol _ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS4_EPKv 0x00004200
137
+ _symbol _ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE3runEPS0_S6_S6_R27elementwise_binary_params_tIS4_E 0x00004290
138
+ _symbol _Z17superkernel_mul1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERNS0_IS1_NS2_3outESK_EE 0x000043c0
139
+ _symbol _ZN25elementwise_binary_sharedI8bfloat168sub_implIS0_E15shared_params_tIS0_EL5act_t0EE21shared_setup_backboneER27elementwise_binary_params_tIS4_EPKv 0x00004620
140
+ _symbol _ZN25elementwise_binary_sharedI8bfloat168sub_implIS0_E15shared_params_tIS0_EL5act_t0EE5setupER27elementwise_binary_params_tIS4_EPKv 0x000046a0
141
+ _symbol _ZN25elementwise_binary_sharedI8bfloat168sub_implIS0_E15shared_params_tIS0_EL5act_t0EE3runEPS0_S7_S7_R27elementwise_binary_params_tIS4_E 0x000046f0
142
+ _symbol _Z17superkernel_sub1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERNS0_IS1_NS2_3outESK_EE 0x00004700
143
+ _symbol _Z9conv2d_dwILh1E8bfloat16S0_S0_N3adf16io_buffer_configINS1_7extentsIJEEENS1_7locking4syncENS1_10addressing6linearENS1_6marginILj0EEEEESB_NS2_IS4_NS5_5asyncES8_SA_EEQsr3stdE9is_same_vIT0_S0_EEvRNS1_9io_bufferISE_NS1_9direction2inET3_EERNSF_IT1_SH_T4_EERNSF_IT2_NSG_3outET5_EER21conv2d_dw_bf16_params 0x00004c00
144
+ _symbol _Z22superkernel_conv2d_dwcRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEESF_RA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE 0x00004ee0
145
+ _symbol _ZN18reduce_skeleton_c8I8bfloat1619reduce_mean_c8_implIS0_E23reduce_mean_c8_params_tIS0_EE5setupER18reduce_c8_params_tIS4_EPKv 0x000050c0
146
+ _symbol _Z6pad_3dIL11pad_3d_mode0E8bfloat16Li1EEvPT0_S3_R15pad_3d_params_t 0x00005700
147
+ _symbol _ZN18reduce_skeleton_c8I8bfloat1619reduce_mean_c8_implIS0_E23reduce_mean_c8_params_tIS0_EE3runEPS0_S6_R18reduce_c8_params_tIS4_E 0x000059a0
148
+ _symbol _Z26superkernel_reduce_mean_c8RN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE 0x00006420
149
+ _symbol _Z26superkernel_conv_eltbinaryRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEESF_RNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERA17_KjRNS0_IS1_NS2_3outESH_EE 0x00006ea0
150
+ _symbol _Z23resize_bilinear_scale_2I8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_S0_EEvPS1_PfS2_jjjj 0x00007310
151
+ _symbol _ZN12mllib_graphs18resize_adf_wrapperI8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_Li1ELi0ELi2EEEvRNS2_9io_bufferIT_NS2_9direction2inET0_EERNSD_ISE_NSF_3outET1_EERA16_Kj 0x00007940
152
+ _symbol _Z11slice_hcwc8I8bfloat16EvPT_S2_R18slice_hcwc8_params 0x00007b20
153
+ _symbol _ZN12mllib_graphs17slice_adf_wrapperILi1E8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_EEvRNS2_9io_bufferIT0_NS2_9direction2inET1_EERNSD_ISE_NSF_3outET2_EERA7_Kj 0x00007e30
154
+ _symbol _Z29setup_transposeshuffle_paramsI8bfloat16EvR23transposeshuffle_paramsRA5_Kj 0x000080e0
155
+ _symbol _Z16transposeshuffleI8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_aS0_EEvPS1_S2_R23transposeshuffle_params 0x00008130
156
+ _symbol _ZN12mllib_graphs23transpose4d_adf_wrapperI8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_EEvRNS2_9io_bufferIT_NS2_9direction2inET0_EERNSD_ISE_NSF_3outET1_EERA5_Kj 0x00008300
157
+ _symbol _Z15resize_bilinearI8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_aS0_EEvPS1_S2_R29resize_common_internal_params 0x00008380
158
+ _symbol _ZN12mllib_graphs18resize_adf_wrapperI8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_Li1ELi0ELi0EEEvRNS2_9io_bufferIT_NS2_9direction2inET0_EERNSD_ISE_NSF_3outET1_EERA16_Kj 0x00009250
159
+ _symbol _ZN12mllib_graphs18concat_adf_wrapperI8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_SC_EEvRNS2_9io_bufferIT_NS2_9direction2inET0_EERNSD_ISE_SG_T1_EERNSD_ISE_NSF_3outET2_EERA8_Kj 0x000097b0
160
+ _symbol _ZN12me_primitive10udiv_dstepEjjRjS0_ 0x00009af0
161
+ _symbol int32_to_float32 0x00009da0
162
+ _symbol float32_add 0x0000a380
163
+ // Symbols in memory 'PMw':
164
+ // Symbols in memory 'TM4':
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/pm_reload_analysis0/Release/pm_reload_analysis0.srv ADDED
The diff for this file is too large to render. See raw diff
 
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/pm_reload_analysis0/pm_reload_analysis0.log ADDED
The diff for this file is too large to render. See raw diff
 
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/pm_reload_analysis0/scripts/pm_reload_analysis0.bcf ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ _entry_point _Z18pm_reload_analysisv
2
+ _symbol _Z18pm_reload_analysisv 0
3
+ _reserved DMb 0x00000 0x40000
4
+ //South-------------------------------------------------
5
+ _reserved DMb 0x40000 0x10000
6
+ //West-------------------------------------------------
7
+ _reserved DMb 0x50000 0x10000
8
+ //North-------------------------------------------------
9
+ _reserved DMb 0x60000 0x10000
10
+ //East-------------------------------------------------
11
+ _stack DM_stack 0x70000 0x8000
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/pm_reload_analysis0/scripts/pm_reload_analysis0.prx ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ <project name="Project" processor="me">
2
+ <file type="lbc" name="pm_reload_analysis0.ll" path="../../ir"/>
3
+ <issinit/>
4
+ <option id="cpp.define" value="__AIENGINE__ __AIE_ARCH__=21" inherit = "1"/>
5
+ <option id="llvm.xargs" value="-fno-jump-tables -fno-discard-value-names" inherit = "1"/>
6
+ <option id="llvm.lang" value="Follow file extension"/>
7
+ <option id="bridge.cfg" value="pm_reload_analysis0.bcf"/>
8
+ <option id="cpp.include" value="&lt;XILINX_VITIS_AIETOOLS&gt;/include /app/vaiml_1.3_examples/camo/./segmentation_1_4_0_fp32_combined/vaiml_par_0/0/backend /usr/local/lib/python3.10/site-packages/include/aie_api /usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/common /usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/include/common /usr/local/lib/python3.10/dist-packages/vitis_mllib /usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/misc /usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/src/ml_adf /app/vaiml_1.3_examples/camo/segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/&lt;AIE_SRC_DIR&gt; " inherit="1"/>
9
+ <option id="project.dir" value="&lt;CONFIG&gt;/pm_reload_analysis0"/>
10
+ <option id="project.name" value="pm_reload_analysis0"/>
11
+ <option id="project.type" value="exe"/>
12
+ <option id="simrun.issca" value="&lt;XILINX_VITIS_AIETOOLS&gt;/bin/unwrapped/lnx64.o/aie2p/ca_udm_dbg" inherit="0"/>
13
+ </project>
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/pm_reload_analysis0/src/pm_reload_analysis0.cc ADDED
@@ -0,0 +1,131 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ // Automatically generated processor driver using AIEngine tool-chain
2
+
3
+ #include <stdio.h>
4
+ #include <memory>
5
+ #include <adf.h>
6
+
7
+
8
+ // Declare Kernel functions and initializers
9
+ #include "resize_adf_wrapper.cpp"
10
+ #include "slice_adf_wrapper.cpp"
11
+ void superkernel_mul1d_attribute_broadcasting(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict,const unsigned int (&)[16],adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict);
12
+ void superkernel_add1d(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict,const unsigned int (&)[16],adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict,adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict);
13
+ void superkernel_mul1d(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict,const unsigned int (&)[16],adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict,adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict);
14
+ void conv2d_maxpool(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict,adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict,const unsigned int (&)[16],adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict);
15
+ void superkernel_add1d_attribute_broadcasting(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict,const unsigned int (&)[16],adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict);
16
+ void superkernel_clip1d(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict,const unsigned int (&)[16],adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict);
17
+ void superkernel_conv2d_dwc(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict,adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict,const unsigned int (&)[16],adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict);
18
+ void superkernel_conv_eltbinary(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict,adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict,adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict,const unsigned int (&)[17],adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict);
19
+ void superkernel_reduce_mean_c8(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict,const unsigned int (&)[16],adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict);
20
+ void superkernel_sigmoid1d(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict,const unsigned int (&)[16],adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict);
21
+ void superkernel_sub1d(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict,const unsigned int (&)[16],adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict,adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict);
22
+ void superkernel_tanh1d(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict,const unsigned int (&)[16],adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict);
23
+ void superkernel_avgpool(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict,const unsigned int (&)[16],adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict);
24
+ #include "transpose4d_adf_wrapper.cpp"
25
+ #include "concat_adf_wrapper.cpp"
26
+
27
+ // Declare Kernel objects and external arrays
28
+
29
+ void pm_reload_analysis()
30
+ {
31
+ //generate kernel calls with dummy parameters for call tree analysis
32
+ adf::_io_buffer_light_weight< bfloat16, adf::direction::in, adf::io_buffer_config< adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0>>> input_buffer_i1009_pi0 = { }; //dummy buffer port object
33
+ adf::_io_buffer_light_weight< bfloat16, adf::direction::out, adf::io_buffer_config< adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0>>> output_buffer_i1009_po0 = { }; //dummy buffer port object
34
+
35
+ mllib_graphs::resize_adf_wrapper<bfloat16, adf::io_buffer_config<adf::extents<>>, adf::io_buffer_config<adf::extents<>>, 1, 0, 2>(input_buffer_i1009_pi0, output_buffer_i1009_po0, {32, 8, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 48});
36
+
37
+ adf::_io_buffer_light_weight< bfloat16, adf::direction::in, adf::io_buffer_config< adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0>>> input_buffer_i1057_pi0 = { }; //dummy buffer port object
38
+ adf::_io_buffer_light_weight< bfloat16, adf::direction::out, adf::io_buffer_config< adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0>>> output_buffer_i1057_po0 = { }; //dummy buffer port object
39
+
40
+ mllib_graphs::slice_adf_wrapper<1, bfloat16, adf::io_buffer_config<adf::extents<>>, adf::io_buffer_config<adf::extents<>>>(input_buffer_i1057_pi0, output_buffer_i1057_po0, {8, 3, 40, 3, 4, 1, 3840});
41
+
42
+ adf::_io_buffer_light_weight< bfloat16, adf::direction::in, adf::io_buffer_config< adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0>>> input_buffer_i1100_pi0 = { }; //dummy buffer port object
43
+ adf::_io_buffer_light_weight< bfloat16, adf::direction::out, adf::io_buffer_config< adf::extents<>, adf::locking::async, adf::addressing::linear, adf::margin<0>>> output_buffer_i1100_po0 = {(bfloat16*)0x0, 0, (bfloat16*)0x0, 0}; //dummy buffer port object
44
+
45
+ superkernel_mul1d_attribute_broadcasting(input_buffer_i1100_pi0, {1920, 0, 524288, 998244353, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0}, output_buffer_i1100_po0);
46
+
47
+ adf::_io_buffer_light_weight< bfloat16, adf::direction::in, adf::io_buffer_config< adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0>>> input_buffer_i1120_pi0 = { }; //dummy buffer port object
48
+ adf::_io_buffer_light_weight< bfloat16, adf::direction::in, adf::io_buffer_config< adf::extents<>, adf::locking::async, adf::addressing::linear, adf::margin<0>>> input_buffer_i1120_pi2 = {(bfloat16*)0x0, 0, (bfloat16*)0x0, 0}; //dummy buffer port object
49
+ adf::_io_buffer_light_weight< bfloat16, adf::direction::out, adf::io_buffer_config< adf::extents<>, adf::locking::async, adf::addressing::linear, adf::margin<0>>> output_buffer_i1120_po0 = {(bfloat16*)0x0, 0, (bfloat16*)0x0, 0}; //dummy buffer port object
50
+
51
+ superkernel_add1d(input_buffer_i1120_pi0, {640, 0, 11796480, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0}, input_buffer_i1120_pi2, output_buffer_i1120_po0);
52
+
53
+ adf::_io_buffer_light_weight< bfloat16, adf::direction::in, adf::io_buffer_config< adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0>>> input_buffer_i1140_pi0 = { }; //dummy buffer port object
54
+ adf::_io_buffer_light_weight< bfloat16, adf::direction::in, adf::io_buffer_config< adf::extents<>, adf::locking::async, adf::addressing::linear, adf::margin<0>>> input_buffer_i1140_pi2 = {(bfloat16*)0x0, 0, (bfloat16*)0x0, 0}; //dummy buffer port object
55
+ adf::_io_buffer_light_weight< bfloat16, adf::direction::out, adf::io_buffer_config< adf::extents<>, adf::locking::async, adf::addressing::linear, adf::margin<0>>> output_buffer_i1140_po0 = {(bfloat16*)0x0, 0, (bfloat16*)0x0, 0}; //dummy buffer port object
56
+
57
+ superkernel_mul1d(input_buffer_i1140_pi0, {640, 0, 11796480, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0}, input_buffer_i1140_pi2, output_buffer_i1140_po0);
58
+
59
+ adf::_io_buffer_light_weight< bfloat16, adf::direction::in, adf::io_buffer_config< adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0>>> input_buffer_i1160_pi0 = { }; //dummy buffer port object
60
+ adf::_io_buffer_light_weight< bfloat16, adf::direction::in, adf::io_buffer_config< adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0>>> input_buffer_i1160_pi1 = { }; //dummy buffer port object
61
+ adf::_io_buffer_light_weight< bfloat16, adf::direction::out, adf::io_buffer_config< adf::extents<>, adf::locking::async, adf::addressing::linear, adf::margin<0>>> output_buffer_i1160_po0 = {(bfloat16*)0x0, 0, (bfloat16*)0x0, 0}; //dummy buffer port object
62
+
63
+ conv2d_maxpool(input_buffer_i1160_pi0, input_buffer_i1160_pi1, {526914, 50528264, 16912640, 16256, 327744, 65542, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0}, output_buffer_i1160_po0);
64
+
65
+ adf::_io_buffer_light_weight< bfloat16, adf::direction::in, adf::io_buffer_config< adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0>>> input_buffer_i1180_pi0 = { }; //dummy buffer port object
66
+ adf::_io_buffer_light_weight< bfloat16, adf::direction::out, adf::io_buffer_config< adf::extents<>, adf::locking::async, adf::addressing::linear, adf::margin<0>>> output_buffer_i1180_po0 = {(bfloat16*)0x0, 0, (bfloat16*)0x0, 0}; //dummy buffer port object
67
+
68
+ superkernel_add1d_attribute_broadcasting(input_buffer_i1180_pi0, {1472, 0, 1310720, 1077936129, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0}, output_buffer_i1180_po0);
69
+
70
+ adf::_io_buffer_light_weight< bfloat16, adf::direction::in, adf::io_buffer_config< adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0>>> input_buffer_i1200_pi0 = { }; //dummy buffer port object
71
+ adf::_io_buffer_light_weight< bfloat16, adf::direction::out, adf::io_buffer_config< adf::extents<>, adf::locking::async, adf::addressing::linear, adf::margin<0>>> output_buffer_i1200_po0 = {(bfloat16*)0x0, 0, (bfloat16*)0x0, 0}; //dummy buffer port object
72
+
73
+ superkernel_clip1d(input_buffer_i1200_pi0, {1920, 0, 16, 0, 0, 0, 0, 0, 0, 16576, 0, 0, 0, 0, 0, 0}, output_buffer_i1200_po0);
74
+
75
+ adf::_io_buffer_light_weight< bfloat16, adf::direction::in, adf::io_buffer_config< adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0>>> input_buffer_i1260_pi0 = { }; //dummy buffer port object
76
+ adf::_io_buffer_light_weight< bfloat16, adf::direction::in, adf::io_buffer_config< adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0>>> input_buffer_i1260_pi1 = { }; //dummy buffer port object
77
+ adf::_io_buffer_light_weight< bfloat16, adf::direction::out, adf::io_buffer_config< adf::extents<>, adf::locking::async, adf::addressing::linear, adf::margin<0>>> output_buffer_i1260_po0 = {(bfloat16*)0x0, 0, (bfloat16*)0x0, 0}; //dummy buffer port object
78
+
79
+ superkernel_conv2d_dwc(input_buffer_i1260_pi0, input_buffer_i1260_pi1, {17303570, 66307, 1280, 40, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0}, output_buffer_i1260_po0);
80
+
81
+ adf::_io_buffer_light_weight< bfloat16, adf::direction::in, adf::io_buffer_config< adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0>>> input_buffer_i1280_pi0 = { }; //dummy buffer port object
82
+ adf::_io_buffer_light_weight< bfloat16, adf::direction::in, adf::io_buffer_config< adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0>>> input_buffer_i1280_pi1 = { }; //dummy buffer port object
83
+ adf::_io_buffer_light_weight< bfloat16, adf::direction::in, adf::io_buffer_config< adf::extents<>, adf::locking::async, adf::addressing::linear, adf::margin<0>>> input_buffer_i1280_pi2 = {(bfloat16*)0x0, 0, (bfloat16*)0x0, 0}; //dummy buffer port object
84
+ adf::_io_buffer_light_weight< bfloat16, adf::direction::out, adf::io_buffer_config< adf::extents<>, adf::locking::async, adf::addressing::linear, adf::margin<0>>> output_buffer_i1280_po0 = {(bfloat16*)0x0, 0, (bfloat16*)0x0, 0}; //dummy buffer port object
85
+
86
+ superkernel_conv_eltbinary(input_buffer_i1280_pi0, input_buffer_i1280_pi1, input_buffer_i1280_pi2, {4194848, 16842760, 16908288, 16256, 327744, 65548, 0, 0, 512, 0, 3932160, 0, 0, 0, 0, 0, 0}, output_buffer_i1280_po0);
87
+
88
+ adf::_io_buffer_light_weight< bfloat16, adf::direction::in, adf::io_buffer_config< adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0>>> input_buffer_i1460_pi0 = { }; //dummy buffer port object
89
+ adf::_io_buffer_light_weight< bfloat16, adf::direction::out, adf::io_buffer_config< adf::extents<>, adf::locking::async, adf::addressing::linear, adf::margin<0>>> output_buffer_i1460_po0 = {(bfloat16*)0x0, 0, (bfloat16*)0x0, 0}; //dummy buffer port object
90
+
91
+ superkernel_reduce_mean_c8(input_buffer_i1460_pi0, {1, 32, 64, 2, 1, 1, 15, 0, 14990, 0, 15, 920, 1, 72, 0, 0}, output_buffer_i1460_po0);
92
+
93
+ adf::_io_buffer_light_weight< bfloat16, adf::direction::in, adf::io_buffer_config< adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0>>> input_buffer_i4840_pi0 = { }; //dummy buffer port object
94
+ adf::_io_buffer_light_weight< bfloat16, adf::direction::out, adf::io_buffer_config< adf::extents<>, adf::locking::async, adf::addressing::linear, adf::margin<0>>> output_buffer_i4840_po0 = {(bfloat16*)0x0, 0, (bfloat16*)0x0, 0}; //dummy buffer port object
95
+
96
+ superkernel_sigmoid1d(input_buffer_i4840_pi0, {512, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0}, output_buffer_i4840_po0);
97
+
98
+ adf::_io_buffer_light_weight< bfloat16, adf::direction::in, adf::io_buffer_config< adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0>>> input_buffer_i4920_pi0 = { }; //dummy buffer port object
99
+ adf::_io_buffer_light_weight< bfloat16, adf::direction::in, adf::io_buffer_config< adf::extents<>, adf::locking::async, adf::addressing::linear, adf::margin<0>>> input_buffer_i4920_pi2 = {(bfloat16*)0x0, 0, (bfloat16*)0x0, 0}; //dummy buffer port object
100
+ adf::_io_buffer_light_weight< bfloat16, adf::direction::out, adf::io_buffer_config< adf::extents<>, adf::locking::async, adf::addressing::linear, adf::margin<0>>> output_buffer_i4920_po0 = {(bfloat16*)0x0, 0, (bfloat16*)0x0, 0}; //dummy buffer port object
101
+
102
+ superkernel_sub1d(input_buffer_i4920_pi0, {960, 0, 65536, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0}, input_buffer_i4920_pi2, output_buffer_i4920_po0);
103
+
104
+ adf::_io_buffer_light_weight< bfloat16, adf::direction::in, adf::io_buffer_config< adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0>>> input_buffer_i5000_pi0 = { }; //dummy buffer port object
105
+ adf::_io_buffer_light_weight< bfloat16, adf::direction::out, adf::io_buffer_config< adf::extents<>, adf::locking::async, adf::addressing::linear, adf::margin<0>>> output_buffer_i5000_po0 = {(bfloat16*)0x0, 0, (bfloat16*)0x0, 0}; //dummy buffer port object
106
+
107
+ superkernel_tanh1d(input_buffer_i5000_pi0, {960, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0}, output_buffer_i5000_po0);
108
+
109
+ adf::_io_buffer_light_weight< bfloat16, adf::direction::in, adf::io_buffer_config< adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0>>> input_buffer_i5060_pi0 = { }; //dummy buffer port object
110
+ adf::_io_buffer_light_weight< bfloat16, adf::direction::out, adf::io_buffer_config< adf::extents<>, adf::locking::async, adf::addressing::linear, adf::margin<0>>> output_buffer_i5060_po0 = {(bfloat16*)0x0, 0, (bfloat16*)0x0, 0}; //dummy buffer port object
111
+
112
+ superkernel_avgpool(input_buffer_i5060_pi0, {0, 0, 0, 0, 0, 0, 0, 0, 524880, 258, 0, 0, 83886080, 96, 1048576000, 0}, output_buffer_i5060_po0);
113
+
114
+ adf::_io_buffer_light_weight< bfloat16, adf::direction::in, adf::io_buffer_config< adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0>>> input_buffer_i719_pi0 = { }; //dummy buffer port object
115
+ adf::_io_buffer_light_weight< bfloat16, adf::direction::out, adf::io_buffer_config< adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0>>> output_buffer_i719_po0 = { }; //dummy buffer port object
116
+
117
+ mllib_graphs::transpose4d_adf_wrapper<bfloat16, adf::io_buffer_config<adf::extents<>>, adf::io_buffer_config<adf::extents<>>>(input_buffer_i719_pi0, output_buffer_i719_po0, {1, 4, 8, 1, 1});
118
+
119
+ adf::_io_buffer_light_weight< bfloat16, adf::direction::in, adf::io_buffer_config< adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0>>> input_buffer_i802_pi0 = { }; //dummy buffer port object
120
+ adf::_io_buffer_light_weight< bfloat16, adf::direction::out, adf::io_buffer_config< adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0>>> output_buffer_i802_po0 = { }; //dummy buffer port object
121
+
122
+ mllib_graphs::resize_adf_wrapper<bfloat16, adf::io_buffer_config<adf::extents<>>, adf::io_buffer_config<adf::extents<>>, 1, 0, 0>(input_buffer_i802_pi0, output_buffer_i802_po0, {12, 20, 1056964608, 1056964608, 3196059648, 3196059648, 4, 17563928, 19398913, 16843028, 17563936, 35651841, 16909073, 0, 0, 2});
123
+
124
+ adf::_io_buffer_light_weight< bfloat16, adf::direction::in, adf::io_buffer_config< adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0>>> input_buffer_i897_pi0 = { }; //dummy buffer port object
125
+ adf::_io_buffer_light_weight< bfloat16, adf::direction::in, adf::io_buffer_config< adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0>>> input_buffer_i897_pi1 = { }; //dummy buffer port object
126
+ adf::_io_buffer_light_weight< bfloat16, adf::direction::out, adf::io_buffer_config< adf::extents<>, adf::locking::sync, adf::addressing::linear, adf::margin<0>>> output_buffer_i897_po0 = { }; //dummy buffer port object
127
+
128
+ mllib_graphs::concat_adf_wrapper<bfloat16, adf::io_buffer_config<adf::extents<>>, adf::io_buffer_config<adf::extents<>>, adf::io_buffer_config<adf::extents<>>>(input_buffer_i897_pi0, input_buffer_i897_pi1, output_buffer_i897_po0, {24, 24, 40, 25, 20, 20, 0, 0});
129
+
130
+ return;
131
+ }
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/pm_reload_analysis0/timestamped_log/pm_reload_analysis0.log ADDED
The diff for this file is too large to render. See raw diff
 
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/pm_reload_analysis0/xlopt.log ADDED
@@ -0,0 +1,623 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ERROR: ld.so: object '/lib64/libudev.so.1' from LD_PRELOAD cannot be preloaded (cannot open shared object file): ignored.
2
+
3
+
4
+ --------------- FILTER ANALYSIS INFO LOG ---------------
5
+
6
+ Reading Header IR from ir/_header.ll
7
+
8
+ --------------------------------------------------------
9
+
10
+ Add module pass 363{anonymous}::GuidancePass
11
+ Add module pass 363{anonymous}::ChessOptionsPass
12
+ Add module pass 363{anonymous}::DisableInliningInMainPass
13
+ Add module pass 363cdno::xlopt::AIEMergeSubWordStoresOpt
14
+ Add module pass 363{anonymous}::XLModuleAdaptor<llvm::PromotePass>
15
+ Add module pass 363{anonymous}::IpConstPropPass
16
+ Add module pass 363{anonymous}::XLModuleAdaptor<llvm::SimplifyCFGPass>
17
+ Add module pass 363{anonymous}::XLModuleAdaptor<llvm::LoopSimplifyPass>
18
+ Add module pass 363{anonymous}::XLModuleAdaptor<llvm::FunctionToLoopPassAdaptor>
19
+ Add module pass 363{anonymous}::XLModuleAdaptor<{anonymous}::AIELoopInfoPass>
20
+ Add module pass 363cdno::xlopt::AIEAnnotatePragmaPass
21
+ Add module pass 363{anonymous}::XLModuleAdaptor<{anonymous}::AIELoopPeelPass>
22
+ Add module pass 363{anonymous}::AIEAliasAnalysisPass
23
+
24
+
25
+ --------------- MEMORY MANAGEMENT GUIDANCE LOG ---------------
26
+
27
+ ALIGNMENT_HINT: Alignment of global array constinit is 4 bytes; automatically aligning it to 64 bytes.
28
+ ALIGNMENT_HINT: Alignment of global array constinit.1 is 4 bytes; automatically aligning it to 64 bytes.
29
+ ALIGNMENT_HINT: Alignment of global array constinit.7 is 4 bytes; automatically aligning it to 64 bytes.
30
+ ALIGNMENT_HINT: Alignment of global array constinit.9 is 4 bytes; automatically aligning it to 64 bytes.
31
+ ALIGNMENT_HINT: Alignment of global array constinit.10 is 4 bytes; automatically aligning it to 64 bytes.
32
+ ALIGNMENT_HINT: Alignment of global array constinit.14 is 4 bytes; automatically aligning it to 64 bytes.
33
+ ALIGNMENT_HINT: Alignment of global array constinit.15 is 4 bytes; automatically aligning it to 64 bytes.
34
+ ALIGNMENT_HINT: Alignment of global array constinit.16 is 4 bytes; automatically aligning it to 64 bytes.
35
+ ALIGNMENT_HINT: Alignment of global array constinit.17 is 4 bytes; automatically aligning it to 64 bytes.
36
+ ALIGNMENT_HINT: Alignment of global array __const._Z23resize_bilinear_scale_2I8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_S0_EEvPS1_PfS2_jjjj.coeffs is 2 bytes; automatically aligning it to 64 bytes.
37
+ ALIGNMENT_HINT: Alignment of global array __const._Z23resize_bilinear_scale_2I8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_S0_EEvPS1_PfS2_jjjj.coeffs_asymmetric is 2 bytes; automatically aligning it to 64 bytes.
38
+ SIZE_HINT: Global array sigmoid_lut<0u, 256u>::data_ab is 1024 bytes. Consider making it mapper-managed LUT or memory buffer.
39
+ SIZE_HINT: Global array sigmoid_lut<0u, 256u>::data_cd is 1024 bytes. Consider making it mapper-managed LUT or memory buffer.
40
+ SIZE_HINT: Global array gelu_lut_32<0u, 512u>::data_ab is 2048 bytes. Consider making it mapper-managed LUT or memory buffer.
41
+ SIZE_HINT: Global array gelu_lut_32<0u, 512u>::data_cd is 2048 bytes. Consider making it mapper-managed LUT or memory buffer.
42
+ SIZE_HINT: Global array tanh_lut<0u, 512u>::data_ab is 2048 bytes. Consider making it mapper-managed LUT or memory buffer.
43
+ SIZE_HINT: Global array tanh_lut<0u, 512u>::data_cd is 2048 bytes. Consider making it mapper-managed LUT or memory buffer.
44
+ SIZE_HINT: Global array log_f32_lut<256u>::fraction_table_ab_f32 is 1024 bytes. Consider making it mapper-managed LUT or memory buffer.
45
+ SIZE_HINT: Global array log_f32_lut<256u>::fraction_table_cd_f32 is 1024 bytes. Consider making it mapper-managed LUT or memory buffer.
46
+ SIZE_HINT: Global array exp2_lut<512u>::exp2_table_ab is 1024 bytes. Consider making it mapper-managed LUT or memory buffer.
47
+ SIZE_HINT: Global array exp2_lut<512u>::exp2_table_cd is 1024 bytes. Consider making it mapper-managed LUT or memory buffer.
48
+
49
+ --------------------------------------------------------------
50
+
51
+
52
+
53
+ --------------- MERGING SUBWORD STORES OPT LOG ---------------
54
+
55
+
56
+
57
+ --------------- LOOP STATISTICS : _ZN18conv2d_bf16_paramsC2Ev ---------------
58
+
59
+ Total loops = 1
60
+ Loops with prepare for pipelining pragma = 0
61
+ Loops with unroll pragma = 0
62
+ Loops with flatten pragma = 0
63
+ Loops with min range pragma = 0
64
+ Loops with max range pragma = 0
65
+ Loops with known trip count = 0
66
+
67
+ -----------------------------------------------------------------------------
68
+
69
+
70
+
71
+ --------------- LOOP STATISTICS : _Z24setup_conv2d_bf16_paramsILb1ELb0EEvPKjR18conv2d_bf16_paramshh ---------------
72
+
73
+ Total loops = 1
74
+ Loops with prepare for pipelining pragma = 0
75
+ Loops with unroll pragma = 0
76
+ Loops with flatten pragma = 0
77
+ Loops with min range pragma = 0
78
+ Loops with max range pragma = 0
79
+ Loops with known trip count = 1
80
+
81
+ -------------------------------------------------------------------------------------------------------------------
82
+
83
+
84
+
85
+ --------------- LOOP STATISTICS : _Z14conv2d_genericILh1EL5act_t0ELb0ELb1ELb0E8bfloat16EvPS1_S2_S2_S2_R18conv2d_bf16_params10out_mode_t ---------------
86
+
87
+ Total loops = 4
88
+ Loops with prepare for pipelining pragma = 4
89
+ Loops with unroll pragma = 0
90
+ Loops with flatten pragma = 0
91
+ Loops with min range pragma = 4
92
+ Loops with max range pragma = 0
93
+ Loops with known trip count = 0
94
+
95
+ -------------------------------------------------------------------------------------------------------------------------------------------------------
96
+
97
+
98
+
99
+ --------------- LOOP STATISTICS : _Z21convert_bf16_to_bfp16I8bfloat16Lb0EEvPT_PS0_RK13BfToBfpParams ---------------
100
+
101
+ Total loops = 1
102
+ Loops with prepare for pipelining pragma = 1
103
+ Loops with unroll pragma = 0
104
+ Loops with flatten pragma = 0
105
+ Loops with min range pragma = 1
106
+ Loops with max range pragma = 0
107
+ Loops with known trip count = 0
108
+
109
+ -------------------------------------------------------------------------------------------------------------------
110
+
111
+
112
+
113
+ --------------- LOOP STATISTICS : _ZN31elementwise_binary_broadcastingI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_EE3runEPS0_S7_S7_R27elementwise_binary_params_tIS5_E ---------------
114
+
115
+ Total loops = 1
116
+ Loops with prepare for pipelining pragma = 1
117
+ Loops with unroll pragma = 0
118
+ Loops with flatten pragma = 0
119
+ Loops with min range pragma = 1
120
+ Loops with max range pragma = 0
121
+ Loops with known trip count = 0
122
+
123
+ ------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------
124
+
125
+
126
+
127
+ --------------- LOOP STATISTICS : _ZNSt3__25arrayIN3aie6vectorI8bfloat16Lj32EEELj2EEC2Ev ---------------
128
+
129
+ Total loops = 1
130
+ Loops with prepare for pipelining pragma = 0
131
+ Loops with unroll pragma = 0
132
+ Loops with flatten pragma = 0
133
+ Loops with min range pragma = 0
134
+ Loops with max range pragma = 0
135
+ Loops with known trip count = 0
136
+
137
+ --------------------------------------------------------------------------------------------------------
138
+
139
+
140
+
141
+ --------------- LOOP STATISTICS : _ZN17elementwise_unaryI8bfloat1616elementwise_clipIS0_E20clip_internal_paramsIS0_EE3runEPS0_S6_R26elementwise_unary_params_tIS4_E ---------------
142
+
143
+ Total loops = 1
144
+ Loops with prepare for pipelining pragma = 1
145
+ Loops with unroll pragma = 0
146
+ Loops with flatten pragma = 0
147
+ Loops with min range pragma = 1
148
+ Loops with max range pragma = 0
149
+ Loops with known trip count = 0
150
+
151
+ -----------------------------------------------------------------------------------------------------------------------------------------------------------------------------------
152
+
153
+
154
+
155
+ --------------- LOOP STATISTICS : _ZL19shared_run_backboneI8bfloat16L5act_t0EEKvPT_S4_S4_R27elementwise_binary_params_tI15shared_params_tIS3_EE ---------------
156
+
157
+ Total loops = 1
158
+ Loops with prepare for pipelining pragma = 1
159
+ Loops with unroll pragma = 0
160
+ Loops with flatten pragma = 0
161
+ Loops with min range pragma = 1
162
+ Loops with max range pragma = 0
163
+ Loops with known trip count = 0
164
+
165
+ ---------------------------------------------------------------------------------------------------------------------------------------------------------------
166
+
167
+
168
+
169
+ --------------- LOOP STATISTICS : _ZN17elementwise_unaryI8bfloat1619elementwise_sigmoidIS0_E26sigmoid_templated_params_tIS0_EE3runEPS0_S6_R26elementwise_unary_params_tIS4_E ---------------
170
+
171
+ Total loops = 1
172
+ Loops with prepare for pipelining pragma = 1
173
+ Loops with unroll pragma = 0
174
+ Loops with flatten pragma = 0
175
+ Loops with min range pragma = 1
176
+ Loops with max range pragma = 0
177
+ Loops with known trip count = 0
178
+
179
+ --------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------
180
+
181
+
182
+
183
+ --------------- LOOP STATISTICS : _ZN17elementwise_unaryI8bfloat1616elementwise_tanhIS0_E23tanh_templated_params_tIS0_EE3runEPS0_S6_R26elementwise_unary_params_tIS4_E ---------------
184
+
185
+ Total loops = 1
186
+ Loops with prepare for pipelining pragma = 1
187
+ Loops with unroll pragma = 0
188
+ Loops with flatten pragma = 0
189
+ Loops with min range pragma = 1
190
+ Loops with max range pragma = 0
191
+ Loops with known trip count = 0
192
+
193
+ --------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------
194
+
195
+
196
+
197
+ --------------- LOOP STATISTICS : _ZN3aie4maskILj32EEC2Eb ---------------
198
+
199
+ Total loops = 2
200
+ Loops with prepare for pipelining pragma = 0
201
+ Loops with unroll pragma = 2
202
+ Loops with flatten pragma = 0
203
+ Loops with min range pragma = 0
204
+ Loops with max range pragma = 0
205
+ Loops with known trip count = 2
206
+
207
+ -------------------------------------------------------------------------
208
+
209
+
210
+
211
+ --------------- LOOP STATISTICS : _Z9avgpool2dILh1E8bfloat16Qsr5mllib5utilsE11is_one_of_vIT0_ahS0_EEvPS1_S2_R25avgpool2d_internal_paramsIS1_E ---------------
212
+
213
+ Total loops = 1
214
+ Loops with prepare for pipelining pragma = 1
215
+ Loops with unroll pragma = 0
216
+ Loops with flatten pragma = 0
217
+ Loops with min range pragma = 1
218
+ Loops with max range pragma = 0
219
+ Loops with known trip count = 0
220
+
221
+ -------------------------------------------------------------------------------------------------------------------------------------------------------------
222
+
223
+
224
+
225
+ --------------- LOOP STATISTICS : _ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE3runEPS0_S6_S6_R27elementwise_binary_params_tIS4_E ---------------
226
+
227
+ Total loops = 1
228
+ Loops with prepare for pipelining pragma = 1
229
+ Loops with unroll pragma = 0
230
+ Loops with flatten pragma = 0
231
+ Loops with min range pragma = 1
232
+ Loops with max range pragma = 0
233
+ Loops with known trip count = 0
234
+
235
+ ----------------------------------------------------------------------------------------------------------------------------------------------------------------------------
236
+
237
+
238
+
239
+ --------------- LOOP STATISTICS : _ZL27setup_conv2d_dw_params_bf16PKjR21conv2d_dw_bf16_paramsh ---------------
240
+
241
+ Total loops = 1
242
+ Loops with prepare for pipelining pragma = 0
243
+ Loops with unroll pragma = 0
244
+ Loops with flatten pragma = 0
245
+ Loops with min range pragma = 0
246
+ Loops with max range pragma = 0
247
+ Loops with known trip count = 1
248
+
249
+ --------------------------------------------------------------------------------------------------------------
250
+
251
+
252
+
253
+ --------------- LOOP STATISTICS : _Z9conv2d_dwILh1E8bfloat16S0_S0_N3adf16io_buffer_configINS1_7extentsIJEEENS1_7locking4syncENS1_10addressing6linearENS1_6marginILj0EEEEESB_NS2_IS4_NS5_5asyncES8_SA_EEQsr3stdE9is_same_vIT0_S0_EEvRNS1_9io_bufferISE_NS1_9direction2inET3_EERNSF_IT1_SH_T4_EERNSF_IT2_NSG_3outET5_EER21conv2d_dw_bf16_params ---------------
254
+
255
+ Total loops = 2
256
+ Loops with prepare for pipelining pragma = 2
257
+ Loops with unroll pragma = 0
258
+ Loops with flatten pragma = 0
259
+ Loops with min range pragma = 2
260
+ Loops with max range pragma = 0
261
+ Loops with known trip count = 0
262
+
263
+ -------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------
264
+
265
+
266
+
267
+ --------------- LOOP STATISTICS : _ZN18reduce_skeleton_c8I8bfloat1619reduce_mean_c8_implIS0_E23reduce_mean_c8_params_tIS0_EE3runEPS0_S6_R18reduce_c8_params_tIS4_E ---------------
268
+
269
+ Total loops = 2
270
+ Loops with prepare for pipelining pragma = 1
271
+ Loops with unroll pragma = 0
272
+ Loops with flatten pragma = 0
273
+ Loops with min range pragma = 1
274
+ Loops with max range pragma = 0
275
+ Loops with known trip count = 0
276
+
277
+ ----------------------------------------------------------------------------------------------------------------------------------------------------------------------------------
278
+
279
+
280
+
281
+ --------------- LOOP STATISTICS : _ZNSt3__25arrayIN3aie6vectorI8bfloat16Lj16EEELj4EEC2Ev ---------------
282
+
283
+ Total loops = 1
284
+ Loops with prepare for pipelining pragma = 0
285
+ Loops with unroll pragma = 0
286
+ Loops with flatten pragma = 0
287
+ Loops with min range pragma = 0
288
+ Loops with max range pragma = 0
289
+ Loops with known trip count = 0
290
+
291
+ --------------------------------------------------------------------------------------------------------
292
+
293
+
294
+
295
+ --------------- LOOP STATISTICS : _ZN19reduce_mean_c8_implI8bfloat16E16body_postprocessEPvR18reduce_c8_params_tI23reduce_mean_c8_params_tIS0_EE ---------------
296
+
297
+ Total loops = 2
298
+ Loops with prepare for pipelining pragma = 2
299
+ Loops with unroll pragma = 0
300
+ Loops with flatten pragma = 0
301
+ Loops with min range pragma = 2
302
+ Loops with max range pragma = 0
303
+ Loops with known trip count = 0
304
+
305
+ ---------------------------------------------------------------------------------------------------------------------------------------------------------------
306
+
307
+
308
+
309
+ --------------- LOOP STATISTICS : _ZN3aie4maskILj8EEC2Eb ---------------
310
+
311
+ Total loops = 2
312
+ Loops with prepare for pipelining pragma = 0
313
+ Loops with unroll pragma = 2
314
+ Loops with flatten pragma = 0
315
+ Loops with min range pragma = 0
316
+ Loops with max range pragma = 0
317
+ Loops with known trip count = 2
318
+
319
+ ------------------------------------------------------------------------
320
+
321
+
322
+
323
+ --------------- LOOP STATISTICS : _ZN3aie4maskILj16EEC2Eb ---------------
324
+
325
+ Total loops = 2
326
+ Loops with prepare for pipelining pragma = 0
327
+ Loops with unroll pragma = 2
328
+ Loops with flatten pragma = 0
329
+ Loops with min range pragma = 0
330
+ Loops with max range pragma = 0
331
+ Loops with known trip count = 2
332
+
333
+ -------------------------------------------------------------------------
334
+
335
+
336
+
337
+ --------------- LOOP STATISTICS : _ZNK3aie4maskILj8EEeqERKS1_ ---------------
338
+
339
+ Total loops = 1
340
+ Loops with prepare for pipelining pragma = 0
341
+ Loops with unroll pragma = 1
342
+ Loops with flatten pragma = 0
343
+ Loops with min range pragma = 0
344
+ Loops with max range pragma = 0
345
+ Loops with known trip count = 1
346
+
347
+ -----------------------------------------------------------------------------
348
+
349
+
350
+
351
+ --------------- LOOP STATISTICS : _ZNK3aie4maskILj16EEeqERKS1_ ---------------
352
+
353
+ Total loops = 1
354
+ Loops with prepare for pipelining pragma = 0
355
+ Loops with unroll pragma = 1
356
+ Loops with flatten pragma = 0
357
+ Loops with min range pragma = 0
358
+ Loops with max range pragma = 0
359
+ Loops with known trip count = 1
360
+
361
+ ------------------------------------------------------------------------------
362
+
363
+
364
+
365
+ --------------- LOOP STATISTICS : _Z26pad_3d_bfloat16_simplifiedP8bfloat16S0_R15pad_3d_params_t ---------------
366
+
367
+ Total loops = 3
368
+ Loops with prepare for pipelining pragma = 0
369
+ Loops with unroll pragma = 0
370
+ Loops with flatten pragma = 0
371
+ Loops with min range pragma = 0
372
+ Loops with max range pragma = 0
373
+ Loops with known trip count = 0
374
+
375
+ ---------------------------------------------------------------------------------------------------------------
376
+
377
+
378
+
379
+ --------------- LOOP STATISTICS : _ZN12mllib_graphs18resize_adf_wrapperI8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_Li1ELi0ELi2EEEvRNS2_9io_bufferIT_NS2_9direction2inET0_EERNSD_ISE_NSF_3outET1_EERA16_Kj ---------------
380
+
381
+ Total loops = 1
382
+ Loops with prepare for pipelining pragma = 0
383
+ Loops with unroll pragma = 0
384
+ Loops with flatten pragma = 0
385
+ Loops with min range pragma = 0
386
+ Loops with max range pragma = 0
387
+ Loops with known trip count = 1
388
+
389
+ -------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------
390
+
391
+
392
+
393
+ --------------- LOOP STATISTICS : _ZN12mllib_graphs18resize_adf_wrapperI8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_Li1ELi0ELi0EEEvRNS2_9io_bufferIT_NS2_9direction2inET0_EERNSD_ISE_NSF_3outET1_EERA16_Kj ---------------
394
+
395
+ Total loops = 1
396
+ Loops with prepare for pipelining pragma = 0
397
+ Loops with unroll pragma = 0
398
+ Loops with flatten pragma = 0
399
+ Loops with min range pragma = 0
400
+ Loops with max range pragma = 0
401
+ Loops with known trip count = 1
402
+
403
+ -------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------
404
+
405
+
406
+
407
+ --------------- LOOP STATISTICS : _ZN12mllib_graphs18concat_adf_wrapperI8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_SC_EEvRNS2_9io_bufferIT_NS2_9direction2inET0_EERNSD_ISE_SG_T1_EERNSD_ISE_NSF_3outET2_EERA8_Kj ---------------
408
+
409
+ Total loops = 4
410
+ Loops with prepare for pipelining pragma = 0
411
+ Loops with unroll pragma = 0
412
+ Loops with flatten pragma = 0
413
+ Loops with min range pragma = 0
414
+ Loops with max range pragma = 0
415
+ Loops with known trip count = 0
416
+
417
+ --------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------
418
+
419
+
420
+
421
+ --------------- LOOP STATISTICS : _Z15resize_bilinearI8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_aS0_EEvPS1_S2_R29resize_common_internal_params ---------------
422
+
423
+ Total loops = 3
424
+ Loops with prepare for pipelining pragma = 1
425
+ Loops with unroll pragma = 0
426
+ Loops with flatten pragma = 0
427
+ Loops with min range pragma = 1
428
+ Loops with max range pragma = 0
429
+ Loops with known trip count = 0
430
+
431
+ -------------------------------------------------------------------------------------------------------------------------------------------------------------
432
+
433
+
434
+
435
+ --------------- LOOP STATISTICS : _ZNK3aie4maskILj32EEeqERKS1_ ---------------
436
+
437
+ Total loops = 1
438
+ Loops with prepare for pipelining pragma = 0
439
+ Loops with unroll pragma = 1
440
+ Loops with flatten pragma = 0
441
+ Loops with min range pragma = 0
442
+ Loops with max range pragma = 0
443
+ Loops with known trip count = 1
444
+
445
+ ------------------------------------------------------------------------------
446
+
447
+
448
+
449
+ --------------- LOOP STATISTICS : _ZN3aie4maskILj32EE6insertILj32EEERS1_jRKNS0_IXT_EEE ---------------
450
+
451
+ Total loops = 1
452
+ Loops with prepare for pipelining pragma = 0
453
+ Loops with unroll pragma = 0
454
+ Loops with flatten pragma = 0
455
+ Loops with min range pragma = 0
456
+ Loops with max range pragma = 0
457
+ Loops with known trip count = 1
458
+
459
+ ------------------------------------------------------------------------------------------------------
460
+
461
+
462
+
463
+ --------------- LOOP STATISTICS : _Z29setup_transposeshuffle_paramsI8bfloat16EvR23transposeshuffle_paramsRA5_Kj ---------------
464
+
465
+ Total loops = 1
466
+ Loops with prepare for pipelining pragma = 0
467
+ Loops with unroll pragma = 0
468
+ Loops with flatten pragma = 0
469
+ Loops with min range pragma = 0
470
+ Loops with max range pragma = 0
471
+ Loops with known trip count = 1
472
+
473
+ -------------------------------------------------------------------------------------------------------------------------------
474
+
475
+
476
+
477
+ --------------- LOOP STATISTICS : _Z16transposeshuffleI8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_aS0_EEvPS1_S2_R23transposeshuffle_params ---------------
478
+
479
+ Total loops = 1
480
+ Loops with prepare for pipelining pragma = 0
481
+ Loops with unroll pragma = 0
482
+ Loops with flatten pragma = 0
483
+ Loops with min range pragma = 0
484
+ Loops with max range pragma = 0
485
+ Loops with known trip count = 0
486
+
487
+ --------------------------------------------------------------------------------------------------------------------------------------------------------
488
+
489
+
490
+
491
+ --------------- LOOP STATISTICS : _Z11slice_hcwc8I8bfloat16EvPT_S2_R18slice_hcwc8_params ---------------
492
+
493
+ Total loops = 2
494
+ Loops with prepare for pipelining pragma = 1
495
+ Loops with unroll pragma = 0
496
+ Loops with flatten pragma = 0
497
+ Loops with min range pragma = 0
498
+ Loops with max range pragma = 0
499
+ Loops with known trip count = 0
500
+
501
+ --------------------------------------------------------------------------------------------------------
502
+
503
+
504
+
505
+ --------------- LOOP STATISTICS : _ZN3aie4maskILj64EEC2Eb ---------------
506
+
507
+ Total loops = 2
508
+ Loops with prepare for pipelining pragma = 0
509
+ Loops with unroll pragma = 2
510
+ Loops with flatten pragma = 0
511
+ Loops with min range pragma = 0
512
+ Loops with max range pragma = 0
513
+ Loops with known trip count = 2
514
+
515
+ -------------------------------------------------------------------------
516
+
517
+
518
+
519
+ --------------- LOOP STATISTICS : _ZNK3aie4maskILj64EEeqERKS1_ ---------------
520
+
521
+ Total loops = 1
522
+ Loops with prepare for pipelining pragma = 0
523
+ Loops with unroll pragma = 1
524
+ Loops with flatten pragma = 0
525
+ Loops with min range pragma = 0
526
+ Loops with max range pragma = 0
527
+ Loops with known trip count = 1
528
+
529
+ ------------------------------------------------------------------------------
530
+
531
+
532
+
533
+ --------------- LOOP STATISTICS : _Z7maskgenIyLj16EET_jj ---------------
534
+
535
+ Total loops = 1
536
+ Loops with prepare for pipelining pragma = 0
537
+ Loops with unroll pragma = 0
538
+ Loops with flatten pragma = 0
539
+ Loops with min range pragma = 0
540
+ Loops with max range pragma = 0
541
+ Loops with known trip count = 1
542
+
543
+ ------------------------------------------------------------------------
544
+
545
+
546
+
547
+ --------------- LOOP STATISTICS : _Z23resize_bilinear_scale_2I8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_S0_EEvPS1_PfS2_jjjj ---------------
548
+
549
+ Total loops = 6
550
+ Loops with prepare for pipelining pragma = 2
551
+ Loops with unroll pragma = 0
552
+ Loops with flatten pragma = 0
553
+ Loops with min range pragma = 0
554
+ Loops with max range pragma = 0
555
+ Loops with known trip count = 0
556
+
557
+ ------------------------------------------------------------------------------------------------------------------------------------------
558
+
559
+
560
+
561
+ --------------- PRAGMA INSERTION LOG (unroll threshold = 3000, max unroll factor = 1) ---------------
562
+
563
+ Adding pragma to function _Z24setup_conv2d_bf16_paramsILb1ELb0EEvPKjR18conv2d_bf16_paramshh :
564
+ Pragma added to loop at line 437 in file /usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/common/../../include/conv/conv2d_bf16_params.h : chess_loop_range(8,8)
565
+ Adding pragma to function _ZNSt3__25arrayIN3aie6vectorI8bfloat16Lj32EEELj2EEC2Ev :
566
+ Pragma added to loop at line 135 in file /usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libs/libcxx-9.0.0/include-lite/../include/array : chess_prepare_for_pipelining
567
+ Adding pragma to function _ZN3aie4maskILj32EEC2Eb :
568
+ Pragma added to loop at line 122 in file /usr/local/lib/python3.10/dist-packages/include/aie_api/detail/aie2/../../mask.hpp : chess_loop_range(1,1)
569
+ Pragma added to loop at line 122 in file /usr/local/lib/python3.10/dist-packages/include/aie_api/detail/aie2/../../mask.hpp : chess_flatten_loop
570
+ Pragma added to loop at line 128 in file /usr/local/lib/python3.10/dist-packages/include/aie_api/detail/aie2/../../mask.hpp : chess_loop_range(1,1)
571
+ Pragma added to loop at line 128 in file /usr/local/lib/python3.10/dist-packages/include/aie_api/detail/aie2/../../mask.hpp : chess_flatten_loop
572
+ Adding pragma to function _ZL27setup_conv2d_dw_params_bf16PKjR21conv2d_dw_bf16_paramsh :
573
+ Pragma added to loop at line 214 in file /usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/common/../../include/conv/conv2d_dw_bf16_params.h : chess_loop_range(4,4)
574
+ Adding pragma to function _ZNSt3__25arrayIN3aie6vectorI8bfloat16Lj16EEELj4EEC2Ev :
575
+ Pragma added to loop at line 135 in file /usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libs/libcxx-9.0.0/include-lite/../include/array : chess_prepare_for_pipelining
576
+ Adding pragma to function _ZN3aie4maskILj8EEC2Eb :
577
+ Pragma added to loop at line 122 in file /usr/local/lib/python3.10/dist-packages/include/aie_api/detail/aie2/../../mask.hpp : chess_loop_range(1,1)
578
+ Pragma added to loop at line 122 in file /usr/local/lib/python3.10/dist-packages/include/aie_api/detail/aie2/../../mask.hpp : chess_flatten_loop
579
+ Pragma added to loop at line 128 in file /usr/local/lib/python3.10/dist-packages/include/aie_api/detail/aie2/../../mask.hpp : chess_loop_range(1,1)
580
+ Pragma added to loop at line 128 in file /usr/local/lib/python3.10/dist-packages/include/aie_api/detail/aie2/../../mask.hpp : chess_flatten_loop
581
+ Adding pragma to function _ZN3aie4maskILj16EEC2Eb :
582
+ Pragma added to loop at line 122 in file /usr/local/lib/python3.10/dist-packages/include/aie_api/detail/aie2/../../mask.hpp : chess_loop_range(1,1)
583
+ Pragma added to loop at line 122 in file /usr/local/lib/python3.10/dist-packages/include/aie_api/detail/aie2/../../mask.hpp : chess_flatten_loop
584
+ Pragma added to loop at line 128 in file /usr/local/lib/python3.10/dist-packages/include/aie_api/detail/aie2/../../mask.hpp : chess_loop_range(1,1)
585
+ Pragma added to loop at line 128 in file /usr/local/lib/python3.10/dist-packages/include/aie_api/detail/aie2/../../mask.hpp : chess_flatten_loop
586
+ Adding pragma to function _ZNK3aie4maskILj16EEeqERKS1_ :
587
+ Pragma added to loop at line 249 in file /usr/local/lib/python3.10/dist-packages/include/aie_api/detail/aie2/../../mask.hpp : chess_loop_range(1,1)
588
+ Pragma added to loop at line 249 in file /usr/local/lib/python3.10/dist-packages/include/aie_api/detail/aie2/../../mask.hpp : chess_flatten_loop
589
+ Adding pragma to function _ZNK3aie4maskILj8EEeqERKS1_ :
590
+ Pragma added to loop at line 249 in file /usr/local/lib/python3.10/dist-packages/include/aie_api/detail/aie2/../../mask.hpp : chess_loop_range(1,1)
591
+ Pragma added to loop at line 249 in file /usr/local/lib/python3.10/dist-packages/include/aie_api/detail/aie2/../../mask.hpp : chess_flatten_loop
592
+ Adding pragma to function _Z23resize_bilinear_scale_2I8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_S0_EEvPS1_PfS2_jjjj :
593
+ Pragma added to loop at line 283 in file /usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/misc/resize_bilinear.h : chess_prepare_for_pipelining
594
+ Pragma added to loop at line 262 in file /usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/misc/resize_bilinear.h : chess_prepare_for_pipelining
595
+ Adding pragma to function _ZN12mllib_graphs18resize_adf_wrapperI8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_Li1ELi0ELi2EEEvRNS2_9io_bufferIT_NS2_9direction2inET0_EERNSD_ISE_NSF_3outET1_EERA16_Kj :
596
+ Pragma added to loop at line 81 in file /usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/src/ml_adf/resize_adf_wrapper.cpp : chess_loop_range(6,6)
597
+ Adding pragma to function _Z7maskgenIyLj16EET_jj :
598
+ Pragma added to loop at line 25 in file /usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/misc/slice_hcwc8_params.h : chess_loop_range(4,4)
599
+ Adding pragma to function _ZN3aie4maskILj64EEC2Eb :
600
+ Pragma added to loop at line 122 in file /usr/local/lib/python3.10/dist-packages/include/aie_api/detail/aie2/../../mask.hpp : chess_loop_range(1,1)
601
+ Pragma added to loop at line 122 in file /usr/local/lib/python3.10/dist-packages/include/aie_api/detail/aie2/../../mask.hpp : chess_flatten_loop
602
+ Pragma added to loop at line 128 in file /usr/local/lib/python3.10/dist-packages/include/aie_api/detail/aie2/../../mask.hpp : chess_loop_range(2,2)
603
+ Adding pragma to function _ZNK3aie4maskILj64EEeqERKS1_ :
604
+ Pragma added to loop at line 249 in file /usr/local/lib/python3.10/dist-packages/include/aie_api/detail/aie2/../../mask.hpp : chess_loop_range(2,2)
605
+ Adding pragma to function _Z29setup_transposeshuffle_paramsI8bfloat16EvR23transposeshuffle_paramsRA5_Kj :
606
+ Pragma added to loop at line 101 in file /usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/misc/transposeshuffle_params.h : chess_loop_range(5,5)
607
+ Adding pragma to function _Z16transposeshuffleI8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_aS0_EEvPS1_S2_R23transposeshuffle_params :
608
+ Pragma added to loop at line 81 in file /usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/misc/transposeshuffle.h : chess_prepare_for_pipelining
609
+ Adding pragma to function _ZN3aie4maskILj32EE6insertILj32EEERS1_jRKNS0_IXT_EEE :
610
+ Pragma added to loop at line 565 in file /usr/local/lib/python3.10/dist-packages/include/aie_api/detail/aie2/../../mask.hpp : chess_loop_range(1,1)
611
+ Pragma added to loop at line 565 in file /usr/local/lib/python3.10/dist-packages/include/aie_api/detail/aie2/../../mask.hpp : chess_flatten_loop
612
+ Adding pragma to function _ZNK3aie4maskILj32EEeqERKS1_ :
613
+ Pragma added to loop at line 249 in file /usr/local/lib/python3.10/dist-packages/include/aie_api/detail/aie2/../../mask.hpp : chess_loop_range(1,1)
614
+ Pragma added to loop at line 249 in file /usr/local/lib/python3.10/dist-packages/include/aie_api/detail/aie2/../../mask.hpp : chess_flatten_loop
615
+ Adding pragma to function _Z15resize_bilinearI8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_aS0_EEvPS1_S2_R29resize_common_internal_params :
616
+ Pragma added to loop at line 101 in file /usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/misc/resize_bilinear.h : chess_prepare_for_pipelining
617
+ Adding pragma to function _ZN12mllib_graphs18resize_adf_wrapperI8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_Li1ELi0ELi0EEEvRNS2_9io_bufferIT_NS2_9direction2inET0_EERNSD_ISE_NSF_3outET1_EERA16_Kj :
618
+ Pragma added to loop at line 81 in file /usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/src/ml_adf/resize_adf_wrapper.cpp : chess_loop_range(6,6)
619
+ Adding pragma to function _ZN12mllib_graphs18concat_adf_wrapperI8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_SC_EEvRNS2_9io_bufferIT_NS2_9direction2inET0_EERNSD_ISE_SG_T1_EERNSD_ISE_NSF_3outET2_EERA8_Kj :
620
+ Pragma added to loop at line 112 in file /usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/src/ml_adf/concat_adf_wrapper.cpp : chess_prepare_for_pipelining
621
+
622
+ -----------------------------------------------------------------------------------------------------
623
+
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/ps/c_rts/aie_control.cpp ADDED
@@ -0,0 +1,293 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ /********************************************* Disclaimer *********************************************/
2
+ /* This file is generated by aiecompiler . */
3
+ /* Changes to this file may cause incorrect behavior and will be lost if aiecompiler is invoked again.*/
4
+
5
+ /************************** Constants/Macros *****************************/
6
+ #define HW_GEN XAIE_DEV_GEN_AIE2P
7
+ #define XAIE_NUM_ROWS 6
8
+ #define XAIE_NUM_COLS 8
9
+ #ifdef __AIE2IPU_BASE_ADDR_CDO__
10
+ #define XAIE_BASE_ADDR 0x0
11
+ #else
12
+ #define XAIE_BASE_ADDR 0x20000000000
13
+ #endif
14
+ #define XAIE_COL_SHIFT 25
15
+ #define XAIE_ROW_SHIFT 20
16
+ #define XAIE_SHIM_ROW 0
17
+ #define XAIE_MEM_TILE_ROW_START 1
18
+ #define XAIE_MEM_TILE_NUM_ROWS 1
19
+ #define XAIE_AIE_TILE_ROW_START 2
20
+ #define XAIE_AIE_TILE_NUM_ROWS 4
21
+ #define FOR_WRITE 0
22
+ #define FOR_READ 1
23
+ #if defined(__AIESIM__)
24
+ #define XAIE_PARTITION_BASE_ADDR (XAIE_BASE_ADDR)
25
+ #else
26
+ #define XAIE_PARTITION_BASE_ADDR 0x0
27
+ #endif
28
+
29
+ /***************************** Includes *********************************/
30
+ #include <fstream>
31
+ #include <adf.h>
32
+ extern "C"
33
+ {
34
+ #include <xaiengine.h>
35
+ }
36
+
37
+ #if defined(__CDO__) || defined(__AIECONTROLCODE__)
38
+ #include "adf/adf_api/common_layer/fal_util.h"
39
+ #endif
40
+
41
+ #include "adf/adf_api/AIEControlConfig.h"
42
+
43
+ XAie_InstDeclare(DevInst, &ConfigPtr); // Declare global device instance
44
+
45
+
46
+ /************************** Functions/APIs *****************************/
47
+ bool root_overlay_load_elf_pm(const std::string& work_dir)
48
+ {
49
+ if(XAie_LoadElfPartial(&DevInst, XAie_TileLoc(0, 2), (work_dir + "/aie/0_0/Release/0_0").c_str(), XAIE_LOAD_ELF_TXT, XAIE_ENABLE)!=XAIE_OK)
50
+ {
51
+ std::cerr << "ERROR: Failed to load program memory sections of ELF for core(0,0)" << std::endl;
52
+ return false;
53
+ }
54
+ if(XAie_LoadElfPartial(&DevInst, XAie_TileLoc(0, 3), (work_dir + "/aie/0_1/Release/0_1").c_str(), XAIE_LOAD_ELF_TXT, XAIE_ENABLE)!=XAIE_OK)
55
+ {
56
+ std::cerr << "ERROR: Failed to load program memory sections of ELF for core(0,1)" << std::endl;
57
+ return false;
58
+ }
59
+ if(XAie_LoadElfPartial(&DevInst, XAie_TileLoc(0, 4), (work_dir + "/aie/0_2/Release/0_2").c_str(), XAIE_LOAD_ELF_TXT, XAIE_ENABLE)!=XAIE_OK)
60
+ {
61
+ std::cerr << "ERROR: Failed to load program memory sections of ELF for core(0,2)" << std::endl;
62
+ return false;
63
+ }
64
+ if(XAie_LoadElfPartial(&DevInst, XAie_TileLoc(0, 5), (work_dir + "/aie/0_3/Release/0_3").c_str(), XAIE_LOAD_ELF_TXT, XAIE_ENABLE)!=XAIE_OK)
65
+ {
66
+ std::cerr << "ERROR: Failed to load program memory sections of ELF for core(0,3)" << std::endl;
67
+ return false;
68
+ }
69
+ if(XAie_LoadElfPartial(&DevInst, XAie_TileLoc(1, 2), (work_dir + "/aie/1_0/Release/1_0").c_str(), XAIE_LOAD_ELF_TXT, XAIE_ENABLE)!=XAIE_OK)
70
+ {
71
+ std::cerr << "ERROR: Failed to load program memory sections of ELF for core(1,0)" << std::endl;
72
+ return false;
73
+ }
74
+ if(XAie_LoadElfPartial(&DevInst, XAie_TileLoc(1, 3), (work_dir + "/aie/1_1/Release/1_1").c_str(), XAIE_LOAD_ELF_TXT, XAIE_ENABLE)!=XAIE_OK)
75
+ {
76
+ std::cerr << "ERROR: Failed to load program memory sections of ELF for core(1,1)" << std::endl;
77
+ return false;
78
+ }
79
+ if(XAie_LoadElfPartial(&DevInst, XAie_TileLoc(1, 4), (work_dir + "/aie/1_2/Release/1_2").c_str(), XAIE_LOAD_ELF_TXT, XAIE_ENABLE)!=XAIE_OK)
80
+ {
81
+ std::cerr << "ERROR: Failed to load program memory sections of ELF for core(1,2)" << std::endl;
82
+ return false;
83
+ }
84
+ if(XAie_LoadElfPartial(&DevInst, XAie_TileLoc(1, 5), (work_dir + "/aie/1_3/Release/1_3").c_str(), XAIE_LOAD_ELF_TXT, XAIE_ENABLE)!=XAIE_OK)
85
+ {
86
+ std::cerr << "ERROR: Failed to load program memory sections of ELF for core(1,3)" << std::endl;
87
+ return false;
88
+ }
89
+ if(XAie_LoadElfPartial(&DevInst, XAie_TileLoc(2, 2), (work_dir + "/aie/2_0/Release/2_0").c_str(), XAIE_LOAD_ELF_TXT, XAIE_ENABLE)!=XAIE_OK)
90
+ {
91
+ std::cerr << "ERROR: Failed to load program memory sections of ELF for core(2,0)" << std::endl;
92
+ return false;
93
+ }
94
+ if(XAie_LoadElfPartial(&DevInst, XAie_TileLoc(2, 3), (work_dir + "/aie/2_1/Release/2_1").c_str(), XAIE_LOAD_ELF_TXT, XAIE_ENABLE)!=XAIE_OK)
95
+ {
96
+ std::cerr << "ERROR: Failed to load program memory sections of ELF for core(2,1)" << std::endl;
97
+ return false;
98
+ }
99
+ if(XAie_LoadElfPartial(&DevInst, XAie_TileLoc(2, 4), (work_dir + "/aie/2_2/Release/2_2").c_str(), XAIE_LOAD_ELF_TXT, XAIE_ENABLE)!=XAIE_OK)
100
+ {
101
+ std::cerr << "ERROR: Failed to load program memory sections of ELF for core(2,2)" << std::endl;
102
+ return false;
103
+ }
104
+ if(XAie_LoadElfPartial(&DevInst, XAie_TileLoc(2, 5), (work_dir + "/aie/2_3/Release/2_3").c_str(), XAIE_LOAD_ELF_TXT, XAIE_ENABLE)!=XAIE_OK)
105
+ {
106
+ std::cerr << "ERROR: Failed to load program memory sections of ELF for core(2,3)" << std::endl;
107
+ return false;
108
+ }
109
+ if(XAie_LoadElfPartial(&DevInst, XAie_TileLoc(3, 2), (work_dir + "/aie/3_0/Release/3_0").c_str(), XAIE_LOAD_ELF_TXT, XAIE_ENABLE)!=XAIE_OK)
110
+ {
111
+ std::cerr << "ERROR: Failed to load program memory sections of ELF for core(3,0)" << std::endl;
112
+ return false;
113
+ }
114
+ if(XAie_LoadElfPartial(&DevInst, XAie_TileLoc(3, 3), (work_dir + "/aie/3_1/Release/3_1").c_str(), XAIE_LOAD_ELF_TXT, XAIE_ENABLE)!=XAIE_OK)
115
+ {
116
+ std::cerr << "ERROR: Failed to load program memory sections of ELF for core(3,1)" << std::endl;
117
+ return false;
118
+ }
119
+ if(XAie_LoadElfPartial(&DevInst, XAie_TileLoc(3, 4), (work_dir + "/aie/3_2/Release/3_2").c_str(), XAIE_LOAD_ELF_TXT, XAIE_ENABLE)!=XAIE_OK)
120
+ {
121
+ std::cerr << "ERROR: Failed to load program memory sections of ELF for core(3,2)" << std::endl;
122
+ return false;
123
+ }
124
+ if(XAie_LoadElfPartial(&DevInst, XAie_TileLoc(3, 5), (work_dir + "/aie/3_3/Release/3_3").c_str(), XAIE_LOAD_ELF_TXT, XAIE_ENABLE)!=XAIE_OK)
125
+ {
126
+ std::cerr << "ERROR: Failed to load program memory sections of ELF for core(3,3)" << std::endl;
127
+ return false;
128
+ }
129
+ return true;
130
+ }
131
+
132
+ bool root_overlay_load_elf_dm(const std::string& work_dir)
133
+ {
134
+ if(XAie_LoadElfPartial(&DevInst, XAie_TileLoc(0, 2), (work_dir + "/aie/0_0/Release/0_0").c_str(), (XAIE_LOAD_ELF_BSS | XAIE_LOAD_ELF_DATA), XAIE_ENABLE)!=XAIE_OK)
135
+ {
136
+ std::cerr << "ERROR: Failed to load data memory sections of ELF for core(0,0)" << std::endl;
137
+ return false;
138
+ }
139
+ if(XAie_LoadElfPartial(&DevInst, XAie_TileLoc(0, 3), (work_dir + "/aie/0_1/Release/0_1").c_str(), (XAIE_LOAD_ELF_BSS | XAIE_LOAD_ELF_DATA), XAIE_ENABLE)!=XAIE_OK)
140
+ {
141
+ std::cerr << "ERROR: Failed to load data memory sections of ELF for core(0,1)" << std::endl;
142
+ return false;
143
+ }
144
+ if(XAie_LoadElfPartial(&DevInst, XAie_TileLoc(0, 4), (work_dir + "/aie/0_2/Release/0_2").c_str(), (XAIE_LOAD_ELF_BSS | XAIE_LOAD_ELF_DATA), XAIE_ENABLE)!=XAIE_OK)
145
+ {
146
+ std::cerr << "ERROR: Failed to load data memory sections of ELF for core(0,2)" << std::endl;
147
+ return false;
148
+ }
149
+ if(XAie_LoadElfPartial(&DevInst, XAie_TileLoc(0, 5), (work_dir + "/aie/0_3/Release/0_3").c_str(), (XAIE_LOAD_ELF_BSS | XAIE_LOAD_ELF_DATA), XAIE_ENABLE)!=XAIE_OK)
150
+ {
151
+ std::cerr << "ERROR: Failed to load data memory sections of ELF for core(0,3)" << std::endl;
152
+ return false;
153
+ }
154
+ if(XAie_LoadElfPartial(&DevInst, XAie_TileLoc(1, 2), (work_dir + "/aie/1_0/Release/1_0").c_str(), (XAIE_LOAD_ELF_BSS | XAIE_LOAD_ELF_DATA), XAIE_ENABLE)!=XAIE_OK)
155
+ {
156
+ std::cerr << "ERROR: Failed to load data memory sections of ELF for core(1,0)" << std::endl;
157
+ return false;
158
+ }
159
+ if(XAie_LoadElfPartial(&DevInst, XAie_TileLoc(1, 3), (work_dir + "/aie/1_1/Release/1_1").c_str(), (XAIE_LOAD_ELF_BSS | XAIE_LOAD_ELF_DATA), XAIE_ENABLE)!=XAIE_OK)
160
+ {
161
+ std::cerr << "ERROR: Failed to load data memory sections of ELF for core(1,1)" << std::endl;
162
+ return false;
163
+ }
164
+ if(XAie_LoadElfPartial(&DevInst, XAie_TileLoc(1, 4), (work_dir + "/aie/1_2/Release/1_2").c_str(), (XAIE_LOAD_ELF_BSS | XAIE_LOAD_ELF_DATA), XAIE_ENABLE)!=XAIE_OK)
165
+ {
166
+ std::cerr << "ERROR: Failed to load data memory sections of ELF for core(1,2)" << std::endl;
167
+ return false;
168
+ }
169
+ if(XAie_LoadElfPartial(&DevInst, XAie_TileLoc(1, 5), (work_dir + "/aie/1_3/Release/1_3").c_str(), (XAIE_LOAD_ELF_BSS | XAIE_LOAD_ELF_DATA), XAIE_ENABLE)!=XAIE_OK)
170
+ {
171
+ std::cerr << "ERROR: Failed to load data memory sections of ELF for core(1,3)" << std::endl;
172
+ return false;
173
+ }
174
+ if(XAie_LoadElfPartial(&DevInst, XAie_TileLoc(2, 2), (work_dir + "/aie/2_0/Release/2_0").c_str(), (XAIE_LOAD_ELF_BSS | XAIE_LOAD_ELF_DATA), XAIE_ENABLE)!=XAIE_OK)
175
+ {
176
+ std::cerr << "ERROR: Failed to load data memory sections of ELF for core(2,0)" << std::endl;
177
+ return false;
178
+ }
179
+ if(XAie_LoadElfPartial(&DevInst, XAie_TileLoc(2, 3), (work_dir + "/aie/2_1/Release/2_1").c_str(), (XAIE_LOAD_ELF_BSS | XAIE_LOAD_ELF_DATA), XAIE_ENABLE)!=XAIE_OK)
180
+ {
181
+ std::cerr << "ERROR: Failed to load data memory sections of ELF for core(2,1)" << std::endl;
182
+ return false;
183
+ }
184
+ if(XAie_LoadElfPartial(&DevInst, XAie_TileLoc(2, 4), (work_dir + "/aie/2_2/Release/2_2").c_str(), (XAIE_LOAD_ELF_BSS | XAIE_LOAD_ELF_DATA), XAIE_ENABLE)!=XAIE_OK)
185
+ {
186
+ std::cerr << "ERROR: Failed to load data memory sections of ELF for core(2,2)" << std::endl;
187
+ return false;
188
+ }
189
+ if(XAie_LoadElfPartial(&DevInst, XAie_TileLoc(2, 5), (work_dir + "/aie/2_3/Release/2_3").c_str(), (XAIE_LOAD_ELF_BSS | XAIE_LOAD_ELF_DATA), XAIE_ENABLE)!=XAIE_OK)
190
+ {
191
+ std::cerr << "ERROR: Failed to load data memory sections of ELF for core(2,3)" << std::endl;
192
+ return false;
193
+ }
194
+ if(XAie_LoadElfPartial(&DevInst, XAie_TileLoc(3, 2), (work_dir + "/aie/3_0/Release/3_0").c_str(), (XAIE_LOAD_ELF_BSS | XAIE_LOAD_ELF_DATA), XAIE_ENABLE)!=XAIE_OK)
195
+ {
196
+ std::cerr << "ERROR: Failed to load data memory sections of ELF for core(3,0)" << std::endl;
197
+ return false;
198
+ }
199
+ if(XAie_LoadElfPartial(&DevInst, XAie_TileLoc(3, 3), (work_dir + "/aie/3_1/Release/3_1").c_str(), (XAIE_LOAD_ELF_BSS | XAIE_LOAD_ELF_DATA), XAIE_ENABLE)!=XAIE_OK)
200
+ {
201
+ std::cerr << "ERROR: Failed to load data memory sections of ELF for core(3,1)" << std::endl;
202
+ return false;
203
+ }
204
+ if(XAie_LoadElfPartial(&DevInst, XAie_TileLoc(3, 4), (work_dir + "/aie/3_2/Release/3_2").c_str(), (XAIE_LOAD_ELF_BSS | XAIE_LOAD_ELF_DATA), XAIE_ENABLE)!=XAIE_OK)
205
+ {
206
+ std::cerr << "ERROR: Failed to load data memory sections of ELF for core(3,2)" << std::endl;
207
+ return false;
208
+ }
209
+ if(XAie_LoadElfPartial(&DevInst, XAie_TileLoc(3, 5), (work_dir + "/aie/3_3/Release/3_3").c_str(), (XAIE_LOAD_ELF_BSS | XAIE_LOAD_ELF_DATA), XAIE_ENABLE)!=XAIE_OK)
210
+ {
211
+ std::cerr << "ERROR: Failed to load data memory sections of ELF for core(3,3)" << std::endl;
212
+ return false;
213
+ }
214
+ return true;
215
+ }
216
+
217
/**
 * Loads the initial ELFs (program memory first, then data memory) for the
 * overlay.
 *
 * The load is compiled in only when __PS_INIT_AIE__ is defined together with
 * __CDO__ or __AIECONTROLCODE__; in every other configuration the function
 * does nothing and reports success.
 *
 * @param work_path   Work directory; an empty string selects "Work".
 * @param elfInfoPath Not read or modified by this function.
 * @return false if either the program-memory or the data-memory load fails,
 *         true otherwise. Earlier revisions discarded the helper results and
 *         always returned true, which hid load failures from the caller.
 */
bool root_overlay_load_elf(const std::string& work_path, std::vector<std::string>& elfInfoPath)
{
#ifdef __PS_INIT_AIE__

    // skip loading initial ELF in AIE simulation when it is done via control packets, but still gen code for CDO/ASM
#if defined(__CDO__) || defined(__AIECONTROLCODE__)
    const std::string work_dir = (work_path.empty() ? "Work" : work_path);

    // Propagate failures; the data-memory load is skipped once the
    // program-memory load has already failed.
    if (!root_overlay_load_elf_pm(work_dir))
    {
        return false;
    }
    if (!root_overlay_load_elf_dm(work_dir))
    {
        return false;
    }

#endif
#endif

    return true;
}
231
+
232
+
233
+ /************************** AIE driver and ADF API initializer *****************************/
234
+
235
+ class InitializeAIEControl
236
+ {
237
+ public:
238
+ InitializeAIEControl()
239
+ {
240
+ XAie_SetupConfig(ConfigPtr, HW_GEN, XAIE_BASE_ADDR, XAIE_COL_SHIFT,
241
+ XAIE_ROW_SHIFT, XAIE_NUM_COLS, XAIE_NUM_ROWS,
242
+ XAIE_SHIM_ROW, XAIE_MEM_TILE_ROW_START,
243
+ XAIE_MEM_TILE_NUM_ROWS, XAIE_AIE_TILE_ROW_START,
244
+ XAIE_AIE_TILE_NUM_ROWS);
245
+
246
+ XAie_SetupPartitionConfig(&DevInst, XAIE_PARTITION_BASE_ADDR, 0, 4);
247
+
248
+ XAie_CfgInitialize(&(DevInst), &ConfigPtr);
249
+
250
+ #if defined(__CDO__)
251
+ XAie_SetIOBackend(&(DevInst), XAIE_IO_BACKEND_CDO); // Set aiengine driver library to run for CDO Mode
252
+ #elif defined(__AIECONTROLCODE__)
253
+ XAie_SetIOBackend(&(DevInst), XAIE_IO_BACKEND_CONTROLCODE); // Set aiengine driver library to run for CONTROLCODE Mode
254
+ #endif
255
+
256
+ #if defined(__AIESIM__)
257
+ XAie_TurnEccOff(&DevInst);
258
+ #endif
259
+
260
+ #if defined(__AIESIM__)
261
+ extern unsigned ess_debug;
262
+ #else
263
+ unsigned ess_debug = false;
264
+ #endif
265
+
266
+ #ifdef __EXCLUDE_PL_CONTROL__
267
+ bool exclude_pl_control = true;
268
+ #else
269
+ bool exclude_pl_control = false;
270
+ #endif
271
+
272
+ #ifdef __CDO__
273
+ int trace_config_stream_option = 2;
274
+ #else
275
+ int trace_config_stream_option = 0;
276
+ #endif
277
+
278
+ adf::initializeConfigurations(&DevInst, XAIE_NUM_COLS, XAIE_AIE_TILE_NUM_ROWS, XAIE_MEM_TILE_NUM_ROWS,
279
+ nullptr, 0,
280
+ nullptr, 0,
281
+ nullptr, 0,
282
+ nullptr, 0,
283
+ nullptr, 0,
284
+ nullptr, 0,
285
+ nullptr, 0,
286
+ nullptr, 0,
287
+ nullptr, 0,
288
+ nullptr, 0,
289
+ nullptr, 0, trace_config_stream_option, nullptr,
290
+ ess_debug, exclude_pl_control, false, nullptr, false, 0, 0);
291
+
292
+ }
293
+ } initAIEControl;