iswaalex commited on
Commit
c6746a7
·
verified ·
1 Parent(s): e35b401

Add files using upload-large-folder tool

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_3/lcp/0_3_101.bin +3 -0
  2. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_3/lcp/0_3_102.bin +3 -0
  3. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_3/lcp/0_3_103.bin +3 -0
  4. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_3/lcp/0_3_104.bin +3 -0
  5. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_3/lcp/0_3_105.bin +3 -0
  6. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_3/lcp/0_3_106.bin +3 -0
  7. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_3/lcp/0_3_107.bin +3 -0
  8. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_3/lcp/0_3_108.bin +3 -0
  9. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_3/lcp/0_3_109.bin +3 -0
  10. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/3_3_reloadable23/Release/3_3_reloadable23.sdr +125 -0
  11. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/3_3_reloadable23/Release/3_3_reloadable23.srv +0 -0
  12. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/3_3_reloadable23/Release/3_3_reloadable23.txt +0 -0
  13. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/3_3_reloadable23/scripts/3_3_reloadable23.bcf +16 -0
  14. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/3_3_reloadable23/scripts/3_3_reloadable23.prx +13 -0
  15. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/3_3_reloadable23/src/3_3_reloadable23.cc +124 -0
  16. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/3_3_reloadable24/Release/3_3_reloadable24.calltree +88 -0
  17. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/3_3_reloadable24/Release/3_3_reloadable24.cmic2 +0 -0
  18. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/3_3_reloadable24/Release/3_3_reloadable24.cmico +1 -0
  19. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/3_3_reloadable24/Release/3_3_reloadable24.lst +0 -0
  20. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/3_3_reloadable24/Release/3_3_reloadable24.map +294 -0
  21. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/3_3_reloadable24/Release/3_3_reloadable24.sdr +125 -0
  22. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/3_3_reloadable24/Release/3_3_reloadable24.srv +0 -0
  23. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/3_3_reloadable24/Release/3_3_reloadable24.txt +0 -0
  24. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/3_3_reloadable24/scripts/3_3_reloadable24.bcf +16 -0
  25. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/3_3_reloadable24/scripts/3_3_reloadable24.prx +13 -0
  26. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/3_3_reloadable24/src/3_3_reloadable24.cc +113 -0
  27. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/3_3_reloadable25/Release/3_3_reloadable25.calltree +48 -0
  28. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/3_3_reloadable25/Release/3_3_reloadable25.cmic2 +0 -0
  29. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/3_3_reloadable25/Release/3_3_reloadable25.cmico +1 -0
  30. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/3_3_reloadable25/Release/3_3_reloadable25.lst +0 -0
  31. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/3_3_reloadable25/Release/3_3_reloadable25.map +161 -0
  32. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/3_3_reloadable25/Release/3_3_reloadable25.sdr +100 -0
  33. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/3_3_reloadable25/Release/3_3_reloadable25.srv +0 -0
  34. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/3_3_reloadable25/Release/3_3_reloadable25.txt +0 -0
  35. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/3_3_reloadable25/scripts/3_3_reloadable25.bcf +16 -0
  36. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/3_3_reloadable25/scripts/3_3_reloadable25.prx +13 -0
  37. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/3_3_reloadable25/src/3_3_reloadable25.cc +66 -0
  38. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/3_3_reloadable3/Release/3_3_reloadable3.calltree +88 -0
  39. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/3_3_reloadable3/Release/3_3_reloadable3.cmic2 +0 -0
  40. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/3_3_reloadable3/Release/3_3_reloadable3.cmico +1 -0
  41. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/3_3_reloadable3/Release/3_3_reloadable3.lst +0 -0
  42. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/3_3_reloadable3/Release/3_3_reloadable3.map +287 -0
  43. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/3_3_reloadable3/Release/3_3_reloadable3.sdr +123 -0
  44. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/3_3_reloadable3/Release/3_3_reloadable3.srv +0 -0
  45. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/3_3_reloadable3/Release/3_3_reloadable3.txt +0 -0
  46. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/3_3_reloadable3/scripts/3_3_reloadable3.bcf +16 -0
  47. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/3_3_reloadable3/scripts/3_3_reloadable3.prx +13 -0
  48. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/3_3_reloadable3/src/3_3_reloadable3.cc +98 -0
  49. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/3_3_reloadable4/Release/3_3_reloadable4.calltree +54 -0
  50. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/3_3_reloadable4/Release/3_3_reloadable4.cmic2 +0 -0
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_3/lcp/0_3_101.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:066c42b39d21af0fb74290ec44e9c20a76b622afc78770782e7c4bd2650a3c5d
3
+ size 296
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_3/lcp/0_3_102.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:12a3fc832c8cc699add45d397f677f51409f8a23f04eae2232fdbf7a849e94a2
3
+ size 384
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_3/lcp/0_3_103.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0d2788e67436bb8c89b4af678724d7c40b798b226c3f3bda2e7b15c9bab5e9d6
3
+ size 384
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_3/lcp/0_3_104.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e9cb44904cddab76168851801794dd62149f3293c61d89d395516def1168b6d3
3
+ size 296
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_3/lcp/0_3_105.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:51a5d087b214a6996037451e928946277a3639f64111929703839fc43a79addb
3
+ size 296
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_3/lcp/0_3_106.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d5a73e4da4d2bed15b96c8157fb7e388578bdff5031935c95c316ccf8ac954b6
3
+ size 296
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_3/lcp/0_3_107.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ff412a4ea18fc0ba4a177d7344f1802b11ee5bad4613f2cf959331610b18cc70
3
+ size 376
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_3/lcp/0_3_108.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:22979562f652566b01e54a355c363f99f4938c50e025bb399f03df329a928367
3
+ size 384
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_3/lcp/0_3_109.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:403a029188e743f7f1814a2d4703915229d5918c8dff3a3659c4bf467f7374da
3
+ size 384
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/3_3_reloadable23/Release/3_3_reloadable23.sdr ADDED
@@ -0,0 +1,125 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+
2
+ // File generated by bridge version V-2024.06#84922c0d9f#241219, Fri Mar 21 04:02:00 2025
3
+ // Copyright 2014-2024 Synopsys, Inc. All rights reserved.
4
+ // bridge -o../Release/0_0_reloadable23 ../Release/0_0_reloadable23.o -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/isg -g -I/usr/local/lib/python3.10/dist-packages/include -I/app/vaiml_1.3_examples/camo/./segmentation_1_4_0_fp32_combined/vaiml_par_0/0/backend -I/usr/local/lib/python3.10/site-packages/include/aie_api -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/common -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/include/common -I/usr/local/lib/python3.10/dist-packages/vitis_mllib -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/misc -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/src/ml_adf -I/app/vaiml_1.3_examples/camo/segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/. -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libcxx-lite/include -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libs/libcxx-9.0.0/include-lite -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime/include -D__AIENGINE__ -D__AIE_ARCH__=21 -DDEPLOYMENT_ELF=1 -D__LOCK_FENCE_MODE__=0 -D__IO_BUFFER_FORCE_LIGHT_WEIGHT__ -DAIE_API_EMULATE_BFLOAT16_MMUL_WITH_BFP16=1 -DAIE_OPTION_SCALAR_FLOAT_ON_VECTOR -D__tct_tgt__=241219 -c0_0_reloadable23.bcf -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/softfloat/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libcxx-lite/lib/Release_LLVM -lme -lc -lm -lc++lite -lsoftfloat -S -export-locals -iconfig extra_memories.bcf -yTM -m -fC -fS -fH +m -T +work ../Release/chesswork6583 -pme
5
+
6
+ // Release: ipp V-2024.06-TGT-241219
7
+
8
+ // Symbols in memory 'DM_bankA':
9
+ // Symbols in memory 'DM_bankAB':
10
+ // Symbols in memory 'DM_bankAC':
11
+ // Symbols in memory 'DM_bankAD':
12
+ // Symbols in memory 'DM_bankB':
13
+ // Symbols in memory 'DM_bankBC':
14
+ // Symbols in memory 'DM_bankBD':
15
+ // Symbols in memory 'DM_bankC':
16
+ // Symbols in memory 'DM_bankCD':
17
+ // Symbols in memory 'DM_bankD':
18
+ // Symbols in memory 'DM_stack':
19
+ // Symbols in memory 'DM_test':
20
+ // Symbols in memory 'DMb':
21
+ _symbol _ZN12me_primitive11control_satE 0x0007c46c
22
+ _symbol _ZN12me_primitive11control_rndE 0x0007c470
23
+ _symbol add1d_params 0x0007c4c0
24
+ _symbol mul1d_params 0x0007c500
25
+ _symbol sub1d_params 0x0007c540
26
+ _symbol sigmoid1d_params 0x0007c580
27
+ _symbol tanh1d_params 0x0007c5c0
28
+ _symbol conv2d_params 0x0007c600
29
+ // Symbols in memory 'DMh':
30
+ // Symbols in memory 'DMh_bankA':
31
+ // Symbols in memory 'DMh_bankAB':
32
+ // Symbols in memory 'DMh_bankAC':
33
+ // Symbols in memory 'DMh_bankAD':
34
+ // Symbols in memory 'DMh_bankB':
35
+ // Symbols in memory 'DMh_bankBC':
36
+ // Symbols in memory 'DMh_bankBD':
37
+ // Symbols in memory 'DMh_bankC':
38
+ // Symbols in memory 'DMh_bankCD':
39
+ // Symbols in memory 'DMh_bankD':
40
+ // Symbols in memory 'DMh_stack':
41
+ // Symbols in memory 'DMs':
42
+ // Symbols in memory 'DMs_bankA':
43
+ // Symbols in memory 'DMs_bankAB':
44
+ // Symbols in memory 'DMs_bankAC':
45
+ // Symbols in memory 'DMs_bankAD':
46
+ // Symbols in memory 'DMs_bankB':
47
+ // Symbols in memory 'DMs_bankBC':
48
+ // Symbols in memory 'DMs_bankBD':
49
+ // Symbols in memory 'DMs_bankC':
50
+ // Symbols in memory 'DMs_bankCD':
51
+ // Symbols in memory 'DMs_bankD':
52
+ // Symbols in memory 'DMs_stack':
53
+ // Symbols in memory 'DMv':
54
+ // Symbols in memory 'DMv_bankA':
55
+ // Symbols in memory 'DMv_bankAB':
56
+ // Symbols in memory 'DMv_bankAC':
57
+ // Symbols in memory 'DMv_bankAD':
58
+ // Symbols in memory 'DMv_bankB':
59
+ // Symbols in memory 'DMv_bankBC':
60
+ // Symbols in memory 'DMv_bankBD':
61
+ // Symbols in memory 'DMv_bankC':
62
+ // Symbols in memory 'DMv_bankCD':
63
+ // Symbols in memory 'DMv_bankD':
64
+ // Symbols in memory 'DMv_stack':
65
+ // Symbols in memory 'DMw':
66
+ // Symbols in memory 'DMw_bankA':
67
+ // Symbols in memory 'DMw_bankAB':
68
+ // Symbols in memory 'DMw_bankAC':
69
+ // Symbols in memory 'DMw_bankAD':
70
+ // Symbols in memory 'DMw_bankB':
71
+ // Symbols in memory 'DMw_bankBC':
72
+ // Symbols in memory 'DMw_bankBD':
73
+ // Symbols in memory 'DMw_bankC':
74
+ // Symbols in memory 'DMw_bankCD':
75
+ // Symbols in memory 'DMw_bankD':
76
+ // Symbols in memory 'DMw_stack':
77
+ // Symbols in memory 'DMx':
78
+ // Symbols in memory 'DMx_bankA':
79
+ // Symbols in memory 'DMx_bankAB':
80
+ // Symbols in memory 'DMx_bankAC':
81
+ // Symbols in memory 'DMx_bankAD':
82
+ // Symbols in memory 'DMx_bankB':
83
+ // Symbols in memory 'DMx_bankBC':
84
+ // Symbols in memory 'DMx_bankBD':
85
+ // Symbols in memory 'DMx_bankC':
86
+ // Symbols in memory 'DMx_bankCD':
87
+ // Symbols in memory 'DMx_bankD':
88
+ // Symbols in memory 'DMx_stack':
89
+ // Symbols in memory 'PM':
90
+ _symbol _Z13kernelWrapperPPvjjjj 0x00000930
91
+ _symbol _Z24setup_conv2d_bf16_paramsILb1ELb0EEvPKjR18conv2d_bf16_paramshh 0x00000b60
92
+ _symbol _Z21convert_bf16_to_bfp16I8bfloat16Lb0EEvPT_PS0_RK13BfToBfpParams 0x00001100
93
+ _symbol _Z11conv2d_bf16ILh1EL5act_t0E8bfloat16S1_S1_N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_NS3_IS5_NS6_5asyncES9_SB_EELb0ELb0ELb1ELb0EEvRNS2_9io_bufferIT1_NS2_9direction2inET4_EERNSF_IT2_SI_T5_EERNSF_IT3_NSH_3outET6_EER18conv2d_bf16_params 0x00001210
94
+ _symbol _Z14conv2d_maxpoolRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEESF_RA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE 0x00001b80
95
+ _symbol _ZN17elementwise_unaryI8bfloat1619elementwise_sigmoidIS0_E26sigmoid_templated_params_tIS0_EE5setupER26elementwise_unary_params_tIS4_EPKv 0x00001fe0
96
+ _symbol _ZN17elementwise_unaryI8bfloat1619elementwise_sigmoidIS0_E26sigmoid_templated_params_tIS0_EE3runEPS0_S6_R26elementwise_unary_params_tIS4_E 0x00002020
97
+ _symbol _Z21superkernel_sigmoid1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE 0x000021a0
98
+ _symbol _ZN17elementwise_unaryI8bfloat1616elementwise_tanhIS0_E23tanh_templated_params_tIS0_EE5setupER26elementwise_unary_params_tIS4_EPKv 0x00002390
99
+ _symbol _ZN17elementwise_unaryI8bfloat1616elementwise_tanhIS0_E23tanh_templated_params_tIS0_EE3runEPS0_S6_R26elementwise_unary_params_tIS4_E 0x000023d0
100
+ _symbol _Z18superkernel_tanh1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE 0x000027a0
101
+ _symbol _ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE21shared_setup_backboneER27elementwise_binary_params_tIS5_EPKv 0x00002990
102
+ _symbol _ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE5setupER27elementwise_binary_params_tIS5_EPKv 0x00002a10
103
+ _symbol _ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE3runEPS0_S7_S7_R27elementwise_binary_params_tIS5_E 0x00002a80
104
+ _symbol _Z17superkernel_add1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERNS0_IS1_NS2_3outESK_EE 0x00002a90
105
+ _symbol _ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS4_E 0x00002cf0
106
+ _symbol _ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS4_EPKv 0x00002d10
107
+ _symbol _ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE3runEPS0_S6_S6_R27elementwise_binary_params_tIS4_E 0x00002da0
108
+ _symbol _Z17superkernel_mul1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERNS0_IS1_NS2_3outESK_EE 0x00002ed0
109
+ _symbol _ZN25elementwise_binary_sharedI8bfloat168sub_implIS0_E15shared_params_tIS0_EL5act_t0EE21shared_setup_backboneER27elementwise_binary_params_tIS4_EPKv 0x00003130
110
+ _symbol _ZN25elementwise_binary_sharedI8bfloat168sub_implIS0_E15shared_params_tIS0_EL5act_t0EE5setupER27elementwise_binary_params_tIS4_EPKv 0x000031b0
111
+ _symbol _ZN25elementwise_binary_sharedI8bfloat168sub_implIS0_E15shared_params_tIS0_EL5act_t0EE3runEPS0_S7_S7_R27elementwise_binary_params_tIS4_E 0x00003200
112
+ _symbol _Z17superkernel_sub1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERNS0_IS1_NS2_3outESK_EE 0x00003210
113
+ _symbol _Z14_b1638_wrapperPPv 0x00003470
114
+ _symbol _Z11slice_hcwc8I8bfloat16EvPT_S2_R18slice_hcwc8_params 0x00003490
115
+ _symbol _ZN12mllib_graphs17slice_adf_wrapperILi1E8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_EEvRNS2_9io_bufferIT0_NS2_9direction2inET1_EERNSD_ISE_NSF_3outET2_EERA7_Kj 0x000037a0
116
+ _symbol _Z13_b806_wrapperPPv 0x00003a50
117
+ _symbol _Z14_b1655_wrapperPPv 0x00003a70
118
+ _symbol _Z13_b891_wrapperPPv 0x00003aa0
119
+ _symbol _ZN12mllib_graphs18concat_adf_wrapperI8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_SC_EEvRNS2_9io_bufferIT_NS2_9direction2inET0_EERNSD_ISE_SG_T1_EERNSD_ISE_NSF_3outET2_EERA8_Kj 0x00003ad0
120
+ _symbol _Z13_b820_wrapperPPv 0x00003e10
121
+ _symbol _Z13_b896_wrapperPPv 0x00003e40
122
+ _symbol _Z14_b1672_wrapperPPv 0x00003e70
123
+ _symbol _Z13_b886_wrapperPPv 0x00003e90
124
+ // Symbols in memory 'PMw':
125
+ // Symbols in memory 'TM4':
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/3_3_reloadable23/Release/3_3_reloadable23.srv ADDED
The diff for this file is too large to render. See raw diff
 
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/3_3_reloadable23/Release/3_3_reloadable23.txt ADDED
The diff for this file is too large to render. See raw diff
 
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/3_3_reloadable23/scripts/3_3_reloadable23.bcf ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ _reserved DMb 0x0 0x40000
2
+
3
+ _reserved PM 0x0 0x930 //reserved for main elf
4
+
5
+ _entry_point _Z13kernelWrapperPPvjjjj
6
+ _symbol _Z13kernelWrapperPPvjjjj 0x930
7
+
8
+ _reserved DMb 0x7b280 0x800 //reserved for lcp ping-pong buffers
9
+ _reserved DMb 0x7ba80 0x40 //reserved for sync buffer
10
+ _stack DM_stack 0x7bac0 0x940 //stack for core
11
+ _reserved DMb 0x7c400 0x40 //reserved for main elf heap
12
+ //space for synopsys compiler at 0x7c440 0x880//heap
13
+ _reserved DMb 0x40000 0x3b280
14
+
15
+ _reserved DMb 0x7ccc0 0x3340
16
+ _reserved DMb 0x80000 0x80000 // And everything else the core can't see
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/3_3_reloadable23/scripts/3_3_reloadable23.prx ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ <project name="Project" processor="me">
2
+ <issinit/>
3
+ <option id="cpp.define" value="__AIENGINE__ __AIE_ARCH__=21" inherit = "1"/>
4
+ <option id="llvm.xargs" value="-fno-jump-tables -fno-discard-value-names" inherit = "1"/>
5
+ <option id="llvm.lang" value="Follow file extension"/>
6
+ <option id="bridge.cfg" value="3_3_reloadable23.bcf"/>
7
+ <option id="bridge.alibs" value=" ../Release/3_3_reloadable23.o" inherit="1" cfg="Release_LLVM"/>
8
+ <option id="cpp.include" value="&lt;XILINX_VITIS_AIETOOLS&gt;/include /app/vaiml_1.3_examples/camo/./segmentation_1_4_0_fp32_combined/vaiml_par_0/0/backend /usr/local/lib/python3.10/site-packages/include/aie_api /usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/common /usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/include/common /usr/local/lib/python3.10/dist-packages/vitis_mllib /usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/misc /usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/src/ml_adf /app/vaiml_1.3_examples/camo/segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/&lt;AIE_SRC_DIR&gt; " inherit="1"/>
9
+ <option id="project.dir" value="&lt;CONFIG&gt;/3_3_reloadable23"/>
10
+ <option id="project.name" value="3_3_reloadable23"/>
11
+ <option id="project.type" value="exe"/>
12
+ <option id="simrun.issca" value="&lt;XILINX_VITIS_AIETOOLS&gt;/bin/unwrapped/lnx64.o/aie2p/ca_udm_dbg" inherit="0"/>
13
+ </project>
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/3_3_reloadable23/src/3_3_reloadable23.cc ADDED
@@ -0,0 +1,124 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ // Automatically generated processor driver using AIEngine tool-chain
2
+
3
+ #include <stdio.h>
4
+ #include <memory>
5
+ #include <adf.h>
6
+
7
+
8
+ // Declare Kernel functions and initializers
9
+ void superkernel_sigmoid1d(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict,const unsigned int (&)[16],adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict);
10
+ #include "slice_adf_wrapper.cpp"
11
+ void superkernel_sub1d(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict,const unsigned int (&)[16],adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict,adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict);
12
+ void superkernel_mul1d(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict,const unsigned int (&)[16],adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict,adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict);
13
+ #include "concat_adf_wrapper.cpp"
14
+ void conv2d_maxpool(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict,adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict,const unsigned int (&)[16],adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict);
15
+ void superkernel_tanh1d(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict,const unsigned int (&)[16],adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict);
16
+ void superkernel_add1d(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict,const unsigned int (&)[16],adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict,adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict);
17
+
18
+ // Declare Kernel objects and external arrays
19
+
20
+
21
+ void _b1638_wrapper(void* args[])
22
+ {
23
+ superkernel_sigmoid1d(
24
+ *reinterpret_cast<adf::input_buffer_conf<bfloat16, adf::bpc_sync_0d>*>(args[0]),
25
+ *reinterpret_cast<uint32 const(*)[16]>(args[2]),
26
+ *reinterpret_cast<adf::output_buffer_conf<bfloat16, adf::bpc_async_0d>*>(args[1]));
27
+ }
28
+
29
+ void _b806_wrapper(void* args[])
30
+ {
31
+ mllib_graphs::slice_adf_wrapper<1, bfloat16, adf::io_buffer_config<adf::extents<>>, adf::io_buffer_config<adf::extents<>>>(
32
+ *reinterpret_cast<adf::input_buffer_conf<bfloat16, adf::bpc_sync_0d>*>(args[0]),
33
+ *reinterpret_cast<adf::output_buffer_conf<bfloat16, adf::bpc_sync_0d>*>(args[1]),
34
+ *reinterpret_cast<uint32 const(*)[7]>(args[2]));
35
+ }
36
+
37
+ void _b1655_wrapper(void* args[])
38
+ {
39
+ superkernel_sub1d(
40
+ *reinterpret_cast<adf::input_buffer_conf<bfloat16, adf::bpc_sync_0d>*>(args[0]),
41
+ *reinterpret_cast<uint32 const(*)[16]>(args[3]),
42
+ *reinterpret_cast<adf::input_buffer_conf<bfloat16, adf::bpc_async_0d>*>(args[1]),
43
+ *reinterpret_cast<adf::output_buffer_conf<bfloat16, adf::bpc_async_0d>*>(args[2]));
44
+ }
45
+
46
+ void _b891_wrapper(void* args[])
47
+ {
48
+ superkernel_mul1d(
49
+ *reinterpret_cast<adf::input_buffer_conf<bfloat16, adf::bpc_sync_0d>*>(args[0]),
50
+ *reinterpret_cast<uint32 const(*)[16]>(args[3]),
51
+ *reinterpret_cast<adf::input_buffer_conf<bfloat16, adf::bpc_async_0d>*>(args[1]),
52
+ *reinterpret_cast<adf::output_buffer_conf<bfloat16, adf::bpc_async_0d>*>(args[2]));
53
+ }
54
+
55
+ void _b820_wrapper(void* args[])
56
+ {
57
+ mllib_graphs::concat_adf_wrapper<bfloat16, adf::io_buffer_config<adf::extents<>>, adf::io_buffer_config<adf::extents<>>, adf::io_buffer_config<adf::extents<>>>(
58
+ *reinterpret_cast<adf::input_buffer_conf<bfloat16, adf::bpc_sync_0d>*>(args[0]),
59
+ *reinterpret_cast<adf::input_buffer_conf<bfloat16, adf::bpc_sync_0d>*>(args[1]),
60
+ *reinterpret_cast<adf::output_buffer_conf<bfloat16, adf::bpc_sync_0d>*>(args[2]),
61
+ *reinterpret_cast<uint32 const(*)[8]>(args[3]));
62
+ }
63
+
64
+ void _b896_wrapper(void* args[])
65
+ {
66
+ conv2d_maxpool(
67
+ *reinterpret_cast<adf::input_buffer_conf<bfloat16, adf::bpc_sync_0d>*>(args[0]),
68
+ *reinterpret_cast<adf::input_buffer_conf<bfloat16, adf::bpc_sync_0d>*>(args[1]),
69
+ *reinterpret_cast<uint32 const(*)[16]>(args[3]),
70
+ *reinterpret_cast<adf::output_buffer_conf<bfloat16, adf::bpc_async_0d>*>(args[2]));
71
+ }
72
+
73
+ void _b1672_wrapper(void* args[])
74
+ {
75
+ superkernel_tanh1d(
76
+ *reinterpret_cast<adf::input_buffer_conf<bfloat16, adf::bpc_sync_0d>*>(args[0]),
77
+ *reinterpret_cast<uint32 const(*)[16]>(args[2]),
78
+ *reinterpret_cast<adf::output_buffer_conf<bfloat16, adf::bpc_async_0d>*>(args[1]));
79
+ }
80
+
81
+ void _b886_wrapper(void* args[])
82
+ {
83
+ superkernel_add1d(
84
+ *reinterpret_cast<adf::input_buffer_conf<bfloat16, adf::bpc_sync_0d>*>(args[0]),
85
+ *reinterpret_cast<uint32 const(*)[16]>(args[3]),
86
+ *reinterpret_cast<adf::input_buffer_conf<bfloat16, adf::bpc_async_0d>*>(args[1]),
87
+ *reinterpret_cast<adf::output_buffer_conf<bfloat16, adf::bpc_async_0d>*>(args[2]));
88
+ }
89
+
90
+ using UniformKernelFunc = void (*)(void **);
91
+
92
+ static UniformKernelFunc g_uniformKernelFuncs[8] = {
93
+ _b1638_wrapper,
94
+ _b806_wrapper,
95
+ _b1655_wrapper,
96
+ _b891_wrapper,
97
+ _b820_wrapper,
98
+ _b896_wrapper,
99
+ _b1672_wrapper,
100
+ _b886_wrapper
101
+ };
102
+
103
+ __attribute__((always_inline)) void kernelWrapper(void* args[], uint32 kernelId, uint32 numSyncIn, uint32 numAsyncIn, uint32 numSyncOut)
104
+ {
105
+ uint32 idx = 0;
106
+ reinterpret_cast<adf::_io_buffer_light_weight_generic*>(args[idx])->acquire<adf::direction::in>(numSyncIn > 0);
107
+ idx += (numSyncIn > 0) ? 1 : 0;
108
+ reinterpret_cast<adf::_io_buffer_light_weight_generic*>(args[idx])->acquire<adf::direction::in>(numSyncIn > 1);
109
+ idx += (numSyncIn > 1) ? 1 : 0;
110
+ idx += numAsyncIn;
111
+ reinterpret_cast<adf::_io_buffer_light_weight_generic*>(args[idx])->acquire<adf::direction::out>(numSyncOut > 0);
112
+ idx += (numSyncOut > 0) ? 1 : 0;
113
+
114
+ (*(g_uniformKernelFuncs[kernelId]))(args);
115
+
116
+ idx = 0;
117
+ reinterpret_cast<adf::_io_buffer_light_weight_generic*>(args[idx])->release<adf::direction::in>(numSyncIn > 0);
118
+ idx += (numSyncIn > 0) ? 1 : 0;
119
+ reinterpret_cast<adf::_io_buffer_light_weight_generic*>(args[idx])->release<adf::direction::in>(numSyncIn > 1);
120
+ idx += (numSyncIn > 1) ? 1 : 0;
121
+ idx += numAsyncIn;
122
+ reinterpret_cast<adf::_io_buffer_light_weight_generic*>(args[idx])->release<adf::direction::out>(numSyncOut > 0);
123
+ idx += (numSyncOut > 0) ? 1 : 0;
124
+ }
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/3_3_reloadable24/Release/3_3_reloadable24.calltree ADDED
@@ -0,0 +1,88 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+
2
+ // File generated by bridge version V-2024.06#84922c0d9f#241219, Fri Mar 21 04:03:19 2025
3
+ // Copyright 2014-2024 Synopsys, Inc. All rights reserved.
4
+ // bridge -o../Release/0_0_reloadable24 ../Release/0_0_reloadable24.o -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/isg -g -I/usr/local/lib/python3.10/dist-packages/include -I/app/vaiml_1.3_examples/camo/./segmentation_1_4_0_fp32_combined/vaiml_par_0/0/backend -I/usr/local/lib/python3.10/site-packages/include/aie_api -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/common -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/include/common -I/usr/local/lib/python3.10/dist-packages/vitis_mllib -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/misc -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/src/ml_adf -I/app/vaiml_1.3_examples/camo/segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/. -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libcxx-lite/include -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libs/libcxx-9.0.0/include-lite -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime/include -D__AIENGINE__ -D__AIE_ARCH__=21 -DDEPLOYMENT_ELF=1 -D__LOCK_FENCE_MODE__=0 -D__IO_BUFFER_FORCE_LIGHT_WEIGHT__ -DAIE_API_EMULATE_BFLOAT16_MMUL_WITH_BFP16=1 -DAIE_OPTION_SCALAR_FLOAT_ON_VECTOR -D__tct_tgt__=241219 -c0_0_reloadable24.bcf -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/softfloat/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libcxx-lite/lib/Release_LLVM -lme -lc -lm -lc++lite -lsoftfloat -S -export-locals -iconfig extra_memories.bcf -yTM -m -fC -fS -fH +m -T +work ../Release/chesswork6947 -pme
5
+
6
+
7
+ // Release: ipp V-2024.06-TGT-241219
8
+
9
+ _Z13kernelWrapperPPvjjjj
10
+ _Z13_b853_wrapperPPv (referenced text)
11
+ _ZN12mllib_graphs18resize_adf_wrapperI8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_Li1ELi0ELi2EEEvRNS2_9io_bufferIT_NS2_9direction2inET0_EERNSD_ISE_NSF_3outET1_EERA16_Kj
12
+ _Z23resize_bilinear_scale_2I8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_S0_EEvPS1_PfS2_jjjj
13
+ _Z13_b896_wrapperPPv (referenced text)
14
+ _Z14conv2d_maxpoolRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEESF_RA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE
15
+ _Z24setup_conv2d_bf16_paramsILb1ELb0EEvPKjR18conv2d_bf16_paramshh
16
+ _Z11conv2d_bf16ILh1EL5act_t0E8bfloat16S1_S1_N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_NS3_IS5_NS6_5asyncES9_SB_EELb0ELb0ELb1ELb0EEvRNS2_9io_bufferIT1_NS2_9direction2inET4_EERNSF_IT2_SI_T5_EERNSF_IT3_NSH_3outET6_EER18conv2d_bf16_params
17
+ _Z21convert_bf16_to_bfp16I8bfloat16Lb0EEvPT_PS0_RK13BfToBfpParams
18
+ _Z14_b1638_wrapperPPv (referenced text)
19
+ _Z21superkernel_sigmoid1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE
20
+ _ZN17elementwise_unaryI8bfloat1619elementwise_sigmoidIS0_E26sigmoid_templated_params_tIS0_EE5setupER26elementwise_unary_params_tIS4_EPKv
21
+ _ZN17elementwise_unaryI8bfloat1619elementwise_sigmoidIS0_E26sigmoid_templated_params_tIS0_EE3runEPS0_S6_R26elementwise_unary_params_tIS4_E
22
+ _Z14_b1655_wrapperPPv (referenced text)
23
+ _Z17superkernel_sub1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERNS0_IS1_NS2_3outESK_EE
24
+ _ZN25elementwise_binary_sharedI8bfloat168sub_implIS0_E15shared_params_tIS0_EL5act_t0EE5setupER27elementwise_binary_params_tIS4_EPKv
25
+ _ZN25elementwise_binary_sharedI8bfloat168sub_implIS0_E15shared_params_tIS0_EL5act_t0EE21shared_setup_backboneER27elementwise_binary_params_tIS4_EPKv
26
+ _ZN25elementwise_binary_sharedI8bfloat168sub_implIS0_E15shared_params_tIS0_EL5act_t0EE3runEPS0_S7_S7_R27elementwise_binary_params_tIS4_E
27
+ _ZL19shared_run_backboneI8bfloat16L5act_t0EEKvPT_S4_S4_R27elementwise_binary_params_tI15shared_params_tIS3_EE
28
+ _Z13_b891_wrapperPPv (referenced text)
29
+ _Z17superkernel_mul1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERNS0_IS1_NS2_3outESK_EE
30
+ _ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS4_EPKv
31
+ _ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS4_E
32
+ _ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE3runEPS0_S6_S6_R27elementwise_binary_params_tIS4_E
33
+ _Z14_b1672_wrapperPPv (referenced text)
34
+ _Z18superkernel_tanh1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE
35
+ _ZN17elementwise_unaryI8bfloat1616elementwise_tanhIS0_E23tanh_templated_params_tIS0_EE5setupER26elementwise_unary_params_tIS4_EPKv
36
+ _ZN17elementwise_unaryI8bfloat1616elementwise_tanhIS0_E23tanh_templated_params_tIS0_EE3runEPS0_S6_R26elementwise_unary_params_tIS4_E
37
+ _Z13_b886_wrapperPPv (referenced text)
38
+ _Z17superkernel_add1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERNS0_IS1_NS2_3outESK_EE
39
+ _ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE5setupER27elementwise_binary_params_tIS5_EPKv
40
+ _ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE21shared_setup_backboneER27elementwise_binary_params_tIS5_EPKv
41
+ _ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE3runEPS0_S7_S7_R27elementwise_binary_params_tIS5_E
42
+ _ZL19shared_run_backboneI8bfloat16L5act_t0EEKvPT_S4_S4_R27elementwise_binary_params_tI15shared_params_tIS3_EE (*)
43
+
44
+
45
+ Call tree stack and functions sizes:
46
+
47
+ stack stack stack call func func function name
48
+ desc level level desc
49
+ ----- ----- ----- ----- ----- ----- --------------------------------------------------------------
50
+ 64 512 0 0 546 13188 _Z13kernelWrapperPPvjjjj
51
+ 0 0 1 1 32 2086 _Z13_b853_wrapperPPv
52
+ 0 0 1 2 470 2054 _ZN12mllib_graphs18resize_adf_wrapperI8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_Li1ELi0ELi2EEEvRNS2_9io_bufferIT_NS2_9direction2inET0_EERNSD_ISE_NSF_3outET1_EERA16_Kj <tail call>
53
+ 0 0 1 3 1584 1584 _Z23resize_bilinear_scale_2I8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_S0_EEvPS1_PfS2_jjjj <tail call>
54
+ 0 192 1 1 36 4714 _Z13_b896_wrapperPPv
55
+ 64 192 1 2 568 4678 _Z14conv2d_maxpoolRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEESF_RA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE <tail call>
56
+ 64 64 2 3 1430 1430 _Z24setup_conv2d_bf16_paramsILb1ELb0EEvPKjR18conv2d_bf16_paramshh
57
+ 128 128 2 3 2410 2680 _Z11conv2d_bf16ILh1EL5act_t0E8bfloat16S1_S1_N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_NS3_IS5_NS6_5asyncES9_SB_EELb0ELb0ELb1ELb0EEvRNS2_9io_bufferIT1_NS2_9direction2inET4_EERNSF_IT2_SI_T5_EERNSF_IT3_NSH_3outET6_EER18conv2d_bf16_params
58
+ 0 0 3 4 270 270 _Z21convert_bf16_to_bfp16I8bfloat16Lb0EEvPT_PS0_RK13BfToBfpParams
59
+ 0 64 1 1 32 960 _Z14_b1638_wrapperPPv
60
+ 64 64 1 2 488 928 _Z21superkernel_sigmoid1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE <tail call>
61
+ 0 0 2 3 62 62 _ZN17elementwise_unaryI8bfloat1619elementwise_sigmoidIS0_E26sigmoid_templated_params_tIS0_EE5setupER26elementwise_unary_params_tIS4_EPKv
62
+ 0 0 2 3 378 378 _ZN17elementwise_unaryI8bfloat1619elementwise_sigmoidIS0_E26sigmoid_templated_params_tIS0_EE3runEPS0_S6_R26elementwise_unary_params_tIS4_E
63
+ 0 192 1 1 36 1378 _Z14_b1655_wrapperPPv
64
+ 64 192 1 2 602 1342 _Z17superkernel_sub1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERNS0_IS1_NS2_3outESK_EE <tail call>
65
+ 64 64 2 3 74 190 _ZN25elementwise_binary_sharedI8bfloat168sub_implIS0_E15shared_params_tIS0_EL5act_t0EE5setupER27elementwise_binary_params_tIS4_EPKv
66
+ 0 0 3 4 116 116 _ZN25elementwise_binary_sharedI8bfloat168sub_implIS0_E15shared_params_tIS0_EL5act_t0EE21shared_setup_backboneER27elementwise_binary_params_tIS4_EPKv
67
+ 0 128 2 3 16 550 _ZN25elementwise_binary_sharedI8bfloat168sub_implIS0_E15shared_params_tIS0_EL5act_t0EE3runEPS0_S7_S7_R27elementwise_binary_params_tIS4_E
68
+ 128 128 2 4 534 534 _ZL19shared_run_backboneI8bfloat16L5act_t0EEKvPT_S4_S4_R27elementwise_binary_params_tI15shared_params_tIS3_EE <tail call>
69
+ 0 128 1 1 36 1092 _Z13_b891_wrapperPPv
70
+ 64 128 1 2 602 1056 _Z17superkernel_mul1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERNS0_IS1_NS2_3outESK_EE <tail call>
71
+ 64 64 2 3 138 162 _ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS4_EPKv
72
+ 0 0 3 4 24 24 _ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS4_E
73
+ 0 0 2 3 292 292 _ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE3runEPS0_S6_S6_R27elementwise_binary_params_tIS4_E
74
+ 0 448 1 1 32 1544 _Z14_b1672_wrapperPPv
75
+ 64 448 1 2 488 1512 _Z18superkernel_tanh1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE <tail call>
76
+ 0 0 2 3 62 62 _ZN17elementwise_unaryI8bfloat1616elementwise_tanhIS0_E23tanh_templated_params_tIS0_EE5setupER26elementwise_unary_params_tIS4_EPKv
77
+ 384 384 2 3 962 962 _ZN17elementwise_unaryI8bfloat1616elementwise_tanhIS0_E23tanh_templated_params_tIS0_EE3runEPS0_S6_R26elementwise_unary_params_tIS4_E
78
+ 0 192 1 1 36 1402 _Z13_b886_wrapperPPv
79
+ 64 192 1 2 602 1366 _Z17superkernel_add1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERNS0_IS1_NS2_3outESK_EE <tail call>
80
+ 64 64 2 3 98 214 _ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE5setupER27elementwise_binary_params_tIS5_EPKv
81
+ 0 0 3 4 116 116 _ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE21shared_setup_backboneER27elementwise_binary_params_tIS5_EPKv
82
+ 0 128 2 3 16 550 _ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE3runEPS0_S7_S7_R27elementwise_binary_params_tIS5_E
83
+ 128 128 2 4 534 534 _ZL19shared_run_backboneI8bfloat16L5act_t0EEKvPT_S4_S4_R27elementwise_binary_params_tI15shared_params_tIS3_EE <tail call>
84
+
85
+
86
+ Maximum call level : 4
87
+ Maximum stack level: 3
88
+ Maximum stack size : 512
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/3_3_reloadable24/Release/3_3_reloadable24.cmic2 ADDED
The diff for this file is too large to render. See raw diff
 
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/3_3_reloadable24/Release/3_3_reloadable24.cmico ADDED
@@ -0,0 +1 @@
 
 
1
+ +Mdec
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/3_3_reloadable24/Release/3_3_reloadable24.lst ADDED
The diff for this file is too large to render. See raw diff
 
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/3_3_reloadable24/Release/3_3_reloadable24.map ADDED
@@ -0,0 +1,294 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+
2
+ // File generated by bridge version V-2024.06#84922c0d9f#241219, Fri Mar 21 04:03:20 2025
3
+ // Copyright 2014-2024 Synopsys, Inc. All rights reserved.
4
+ // bridge -o../Release/0_0_reloadable24 ../Release/0_0_reloadable24.o -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/isg -g -I/usr/local/lib/python3.10/dist-packages/include -I/app/vaiml_1.3_examples/camo/./segmentation_1_4_0_fp32_combined/vaiml_par_0/0/backend -I/usr/local/lib/python3.10/site-packages/include/aie_api -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/common -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/include/common -I/usr/local/lib/python3.10/dist-packages/vitis_mllib -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/misc -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/src/ml_adf -I/app/vaiml_1.3_examples/camo/segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/. -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libcxx-lite/include -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libs/libcxx-9.0.0/include-lite -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime/include -D__AIENGINE__ -D__AIE_ARCH__=21 -DDEPLOYMENT_ELF=1 -D__LOCK_FENCE_MODE__=0 -D__IO_BUFFER_FORCE_LIGHT_WEIGHT__ -DAIE_API_EMULATE_BFLOAT16_MMUL_WITH_BFP16=1 -DAIE_OPTION_SCALAR_FLOAT_ON_VECTOR -D__tct_tgt__=241219 -c0_0_reloadable24.bcf -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/softfloat/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libcxx-lite/lib/Release_LLVM -lme -lc -lm -lc++lite -lsoftfloat -S -export-locals -iconfig extra_memories.bcf -yTM -m -fC -fS -fH +m -T +work ../Release/chesswork6947 -pme
5
+
6
+ // Release: ipp V-2024.06-TGT-241219
7
+
8
+ Memory map for memory 'DM_stack':
9
+
10
+ Size = 1048576
11
+ Width = 8 bits
12
+ Offset = 0
13
+ Used = 2368
14
+
15
+ 0x0007bac0..0x0007c3ff ( 2368 items) : Stack
16
+
17
+ Memory map for memory 'DMb':
18
+
19
+ Size = 1048576
20
+ Width = 8 bits
21
+ Offset = 0
22
+ Used = 3397
23
+
24
+ 0x00000000..0x0007babf ( 506560 items) : Reserved
25
+ 0x0007bac0..0x0007c3ff ( 2368 items) : Stack
26
+ 0x0007c400..0x0007c43f ( 64 items) : Reserved
27
+ 0x0007c440..0x0007c443 ( 4 items) : ../Release/0_0_reloadable24.o::_ZL9curr_iter (Data, Local, .bss.DMb.4)
28
+ 0x0007c444..0x0007c447 ( 4 items) : ../Release/0_0_reloadable24.o::_ZL14num_depth_iter (Data, Local, .bss.DMb.4)
29
+ 0x0007c448..0x0007c44b ( 4 items) : ../Release/0_0_reloadable24.o::_ZL10depth_iter (Data, Local, .bss.DMb.4)
30
+ 0x0007c44c..0x0007c44f ( 4 items) : ../Release/0_0_reloadable24.o::_ZL11total_iters (Data, Local, .bss.DMb.4)
31
+ 0x0007c450..0x0007c453 ( 4 items) : ../Release/0_0_reloadable24.o::_ZL8core_row (Data, Local, .bss.DMb.4)
32
+ 0x0007c454..0x0007c457 ( 4 items) : ../Release/0_0_reloadable24.o::_ZL11ifm1_offset (Data, Local, .bss.DMb.4)
33
+ 0x0007c458..0x0007c45b ( 4 items) : ../Release/0_0_reloadable24.o::_ZL11ifm2_offset (Data, Local, .bss.DMb.4)
34
+ 0x0007c45c..0x0007c45f ( 4 items) : ../Release/0_0_reloadable24.o::_ZZN12mllib_graphs18resize_adf_wrapperI8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_Li1ELi0ELi2EEEvRNS2_9io_bufferIT_NS2_9direction2inET0_EERNSD_ISE_NSF_3outET1_EERA16_KjE8cur_iter (Data, Weak, .bss.DMb.4)
35
+ 0x0007c460..0x0007c463 ( 4 items) : ../Release/0_0_reloadable24.o::_ZL8num_iter (Data, Local, .data.DMb.4)
36
+ 0x0007c464..0x0007c467 ( 4 items) : me_defs.o(/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/Release/libme.a)::_ZN12me_primitive11control_satE (Data, Global, .bss.DMb.4)
37
+ 0x0007c468..0x0007c468 ( 1 items) : me_defs.o(/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/Release/libme.a)::_ZN12me_primitive11control_rndE (Data, Global, .bss.DMb.1)
38
+ 0x0007c480..0x0007c49b ( 28 items) : ../Release/0_0_reloadable24.o::_ZL20g_uniformKernelFuncs (Data, Local, .rodata.DMb.64)
39
+
40
+ Called functions : _Z13_b853_wrapperPPv
41
+ _Z13_b896_wrapperPPv
42
+ _Z14_b1638_wrapperPPv
43
+ _Z14_b1655_wrapperPPv
44
+ _Z13_b891_wrapperPPv
45
+ _Z14_b1672_wrapperPPv
46
+ _Z13_b886_wrapperPPv
47
+
48
+ 0x0007c4c0..0x0007c4df ( 32 items) : ../Release/0_0_reloadable24.o::__const____Z23resize_bilinear_scale_2I8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_S0_EEvPS1_PfS2_jjjj___coeffs (Data, Local, .rodata.DMb.64)
49
+ 0x0007c500..0x0007c51f ( 32 items) : ../Release/0_0_reloadable24.o::__const____Z23resize_bilinear_scale_2I8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_S0_EEvPS1_PfS2_jjjj___coeffs_asymmetric (Data, Local, .rodata.DMb.64)
50
+ 0x0007c540..0x0007c57f ( 64 items) : ../Release/0_0_reloadable24.o::add1d_params (Data, Global, .bss.DMb.64)
51
+ 0x0007c580..0x0007c5bf ( 64 items) : ../Release/0_0_reloadable24.o::mul1d_params (Data, Global, .bss.DMb.64)
52
+ 0x0007c5c0..0x0007c5ff ( 64 items) : ../Release/0_0_reloadable24.o::sub1d_params (Data, Global, .bss.DMb.64)
53
+ 0x0007c600..0x0007c63f ( 64 items) : ../Release/0_0_reloadable24.o::sigmoid1d_params (Data, Global, .bss.DMb.64)
54
+ 0x0007c640..0x0007c67f ( 64 items) : ../Release/0_0_reloadable24.o::tanh1d_params (Data, Global, .bss.DMb.64)
55
+ 0x0007c680..0x0007c83f ( 448 items) : ../Release/0_0_reloadable24.o::conv2d_params (Data, Global, .bss.DMb.64)
56
+ 0x0007c840..0x0007c8bf ( 128 items) : ../Release/0_0_reloadable24.o::_ZZN12mllib_graphs18resize_adf_wrapperI8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_Li1ELi0ELi2EEEvRNS2_9io_bufferIT_NS2_9direction2inET0_EERNSD_ISE_NSF_3outET1_EERA16_KjE6params (Data, Weak, .bss.DMb.64)
57
+ 0x0007ccc0..0x000fffff ( 537408 items) : Reserved
58
+
59
+ Memory map for memory 'PM':
60
+
61
+ Size = 1048576
62
+ Width = 8 bits
63
+ Offset = 0
64
+ Used = 13188
65
+
66
+ 0x00000000..0x0000092f ( 2352 items) : Reserved
67
+ 0x00000930..0x00000b51 ( 546 items) : ../Release/0_0_reloadable24.o::_Z13kernelWrapperPPvjjjj (Function, Global, .text) (stack frame size = 64)
68
+
69
+ Referenced symbols: _ZL20g_uniformKernelFuncs
70
+
71
+ 0x00000b60..0x000010f5 ( 1430 items) : ../Release/0_0_reloadable24.o::_Z24setup_conv2d_bf16_paramsILb1ELb0EEvPKjR18conv2d_bf16_paramshh (Function, Weak, .text) (stack frame size = 64)
72
+ 0x00001100..0x0000120d ( 270 items) : ../Release/0_0_reloadable24.o::_Z21convert_bf16_to_bfp16I8bfloat16Lb0EEvPT_PS0_RK13BfToBfpParams (Function, Weak, .text) (stack frame size = 0)
73
+
74
+ Referenced symbols: _ZN12me_primitive11control_rndE
75
+
76
+ 0x00001210..0x00001b79 ( 2410 items) : ../Release/0_0_reloadable24.o::_Z11conv2d_bf16ILh1EL5act_t0E8bfloat16S1_S1_N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_NS3_IS5_NS6_5asyncES9_SB_EELb0ELb0ELb1ELb0EEvRNS2_9io_bufferIT1_NS2_9direction2inET4_EERNSF_IT2_SI_T5_EERNSF_IT3_NSH_3outET6_EER18conv2d_bf16_params (Function, Weak, .text) (stack frame size = 128)
77
+
78
+ Called functions : _Z21convert_bf16_to_bfp16I8bfloat16Lb0EEvPT_PS0_RK13BfToBfpParams
79
+
80
+ Referenced symbols: _ZN12me_primitive11control_rndE
81
+
82
+ 0x00001b80..0x00001db7 ( 568 items) : ../Release/0_0_reloadable24.o::_Z14conv2d_maxpoolRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEESF_RA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE (Function, Global, .text) (stack frame size = 64)
83
+
84
+ Called functions : _Z24setup_conv2d_bf16_paramsILb1ELb0EEvPKjR18conv2d_bf16_paramshh
85
+ _Z11conv2d_bf16ILh1EL5act_t0E8bfloat16S1_S1_N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_NS3_IS5_NS6_5asyncES9_SB_EELb0ELb0ELb1ELb0EEvRNS2_9io_bufferIT1_NS2_9direction2inET4_EERNSF_IT2_SI_T5_EERNSF_IT3_NSH_3outET6_EER18conv2d_bf16_params
86
+
87
+ Referenced symbols: _ZL9curr_iter
88
+ conv2d_params
89
+ _ZN12me_primitive11control_rndE
90
+ _ZN12me_primitive11control_satE
91
+ _ZL14num_depth_iter
92
+ _ZL8num_iter
93
+ _ZL10depth_iter
94
+ _ZL11total_iters
95
+
96
+ 0x00001dc0..0x00001fd5 ( 534 items) : ../Release/0_0_reloadable24.o::_ZL19shared_run_backboneI8bfloat16L5act_t0EEKvPT_S4_S4_R27elementwise_binary_params_tI15shared_params_tIS3_EE (Function, Local, .text) (stack frame size = 128)
97
+
98
+ Referenced symbols: _ZN12me_primitive11control_rndE
99
+
100
+ 0x00001fe0..0x0000201d ( 62 items) : ../Release/0_0_reloadable24.o::_ZN17elementwise_unaryI8bfloat1619elementwise_sigmoidIS0_E26sigmoid_templated_params_tIS0_EE5setupER26elementwise_unary_params_tIS4_EPKv (Function, Weak, .text) (stack frame size = 0)
101
+ 0x00002020..0x00002199 ( 378 items) : ../Release/0_0_reloadable24.o::_ZN17elementwise_unaryI8bfloat1619elementwise_sigmoidIS0_E26sigmoid_templated_params_tIS0_EE3runEPS0_S6_R26elementwise_unary_params_tIS4_E (Function, Weak, .text) (stack frame size = 0)
102
+
103
+ Referenced symbols: _ZN12me_primitive11control_rndE
104
+
105
+ 0x000021a0..0x00002387 ( 488 items) : ../Release/0_0_reloadable24.o::_Z21superkernel_sigmoid1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE (Function, Global, .text) (stack frame size = 64)
106
+
107
+ Called functions : _ZN17elementwise_unaryI8bfloat1619elementwise_sigmoidIS0_E26sigmoid_templated_params_tIS0_EE5setupER26elementwise_unary_params_tIS4_EPKv
108
+ _ZN17elementwise_unaryI8bfloat1619elementwise_sigmoidIS0_E26sigmoid_templated_params_tIS0_EE3runEPS0_S6_R26elementwise_unary_params_tIS4_E
109
+
110
+ Referenced symbols: _ZL9curr_iter
111
+ _ZL8core_row
112
+ sigmoid1d_params
113
+ _ZN12me_primitive11control_rndE
114
+ _ZN12me_primitive11control_satE
115
+ _ZL11ifm1_offset
116
+ _ZL8num_iter
117
+
118
+ 0x00002390..0x000023cd ( 62 items) : ../Release/0_0_reloadable24.o::_ZN17elementwise_unaryI8bfloat1616elementwise_tanhIS0_E23tanh_templated_params_tIS0_EE5setupER26elementwise_unary_params_tIS4_EPKv (Function, Weak, .text) (stack frame size = 0)
119
+ 0x000023d0..0x00002791 ( 962 items) : ../Release/0_0_reloadable24.o::_ZN17elementwise_unaryI8bfloat1616elementwise_tanhIS0_E23tanh_templated_params_tIS0_EE3runEPS0_S6_R26elementwise_unary_params_tIS4_E (Function, Weak, .text) (stack frame size = 384)
120
+
121
+ Referenced symbols: _ZN12me_primitive11control_rndE
122
+
123
+ 0x000027a0..0x00002987 ( 488 items) : ../Release/0_0_reloadable24.o::_Z18superkernel_tanh1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE (Function, Global, .text) (stack frame size = 64)
124
+
125
+ Called functions : _ZN17elementwise_unaryI8bfloat1616elementwise_tanhIS0_E23tanh_templated_params_tIS0_EE5setupER26elementwise_unary_params_tIS4_EPKv
126
+ _ZN17elementwise_unaryI8bfloat1616elementwise_tanhIS0_E23tanh_templated_params_tIS0_EE3runEPS0_S6_R26elementwise_unary_params_tIS4_E
127
+
128
+ Referenced symbols: _ZL9curr_iter
129
+ _ZL8core_row
130
+ tanh1d_params
131
+ _ZN12me_primitive11control_rndE
132
+ _ZN12me_primitive11control_satE
133
+ _ZL11ifm1_offset
134
+ _ZL8num_iter
135
+
136
+ 0x00002990..0x00002a03 ( 116 items) : ../Release/0_0_reloadable24.o::_ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE21shared_setup_backboneER27elementwise_binary_params_tIS5_EPKv (Function, Weak, .text) (stack frame size = 0)
137
+ 0x00002a10..0x00002a71 ( 98 items) : ../Release/0_0_reloadable24.o::_ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE5setupER27elementwise_binary_params_tIS5_EPKv (Function, Weak, .text) (stack frame size = 64)
138
+
139
+ Called functions : _ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE21shared_setup_backboneER27elementwise_binary_params_tIS5_EPKv
140
+
141
+ 0x00002a80..0x00002a8f ( 16 items) : ../Release/0_0_reloadable24.o::_ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE3runEPS0_S7_S7_R27elementwise_binary_params_tIS5_E (Function, Weak, .text) (stack frame size = 0)
142
+
143
+ Called functions : _ZL19shared_run_backboneI8bfloat16L5act_t0EEKvPT_S4_S4_R27elementwise_binary_params_tI15shared_params_tIS3_EE
144
+
145
+ 0x00002a90..0x00002ce9 ( 602 items) : ../Release/0_0_reloadable24.o::_Z17superkernel_add1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERNS0_IS1_NS2_3outESK_EE (Function, Global, .text) (stack frame size = 64)
146
+
147
+ Called functions : _ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE5setupER27elementwise_binary_params_tIS5_EPKv
148
+ _ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE3runEPS0_S7_S7_R27elementwise_binary_params_tIS5_E
149
+
150
+ Referenced symbols: _ZL9curr_iter
151
+ _ZL8core_row
152
+ add1d_params
153
+ _ZN12me_primitive11control_rndE
154
+ _ZN12me_primitive11control_satE
155
+ _ZL11ifm1_offset
156
+ _ZL11ifm2_offset
157
+ _ZL8num_iter
158
+
159
+ 0x00002cf0..0x00002d07 ( 24 items) : ../Release/0_0_reloadable24.o::_ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS4_E (Function, Weak, .text) (stack frame size = 0)
160
+ 0x00002d10..0x00002d99 ( 138 items) : ../Release/0_0_reloadable24.o::_ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS4_EPKv (Function, Weak, .text) (stack frame size = 64)
161
+
162
+ Called functions : _ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS4_E
163
+
164
+ 0x00002da0..0x00002ec3 ( 292 items) : ../Release/0_0_reloadable24.o::_ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE3runEPS0_S6_S6_R27elementwise_binary_params_tIS4_E (Function, Weak, .text) (stack frame size = 0)
165
+
166
+ Referenced symbols: _ZN12me_primitive11control_rndE
167
+
168
+ 0x00002ed0..0x00003129 ( 602 items) : ../Release/0_0_reloadable24.o::_Z17superkernel_mul1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERNS0_IS1_NS2_3outESK_EE (Function, Global, .text) (stack frame size = 64)
169
+
170
+ Called functions : _ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS4_EPKv
171
+ _ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE3runEPS0_S6_S6_R27elementwise_binary_params_tIS4_E
172
+
173
+ Referenced symbols: _ZL9curr_iter
174
+ _ZL8core_row
175
+ mul1d_params
176
+ _ZN12me_primitive11control_rndE
177
+ _ZN12me_primitive11control_satE
178
+ _ZL11ifm1_offset
179
+ _ZL11ifm2_offset
180
+ _ZL8num_iter
181
+
182
+ 0x00003130..0x000031a3 ( 116 items) : ../Release/0_0_reloadable24.o::_ZN25elementwise_binary_sharedI8bfloat168sub_implIS0_E15shared_params_tIS0_EL5act_t0EE21shared_setup_backboneER27elementwise_binary_params_tIS4_EPKv (Function, Weak, .text) (stack frame size = 0)
183
+ 0x000031b0..0x000031f9 ( 74 items) : ../Release/0_0_reloadable24.o::_ZN25elementwise_binary_sharedI8bfloat168sub_implIS0_E15shared_params_tIS0_EL5act_t0EE5setupER27elementwise_binary_params_tIS4_EPKv (Function, Weak, .text) (stack frame size = 64)
184
+
185
+ Called functions : _ZN25elementwise_binary_sharedI8bfloat168sub_implIS0_E15shared_params_tIS0_EL5act_t0EE21shared_setup_backboneER27elementwise_binary_params_tIS4_EPKv
186
+
187
+ 0x00003200..0x0000320f ( 16 items) : ../Release/0_0_reloadable24.o::_ZN25elementwise_binary_sharedI8bfloat168sub_implIS0_E15shared_params_tIS0_EL5act_t0EE3runEPS0_S7_S7_R27elementwise_binary_params_tIS4_E (Function, Weak, .text) (stack frame size = 0)
188
+
189
+ Called functions : _ZL19shared_run_backboneI8bfloat16L5act_t0EEKvPT_S4_S4_R27elementwise_binary_params_tI15shared_params_tIS3_EE
190
+
191
+ 0x00003210..0x00003469 ( 602 items) : ../Release/0_0_reloadable24.o::_Z17superkernel_sub1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERNS0_IS1_NS2_3outESK_EE (Function, Global, .text) (stack frame size = 64)
192
+
193
+ Called functions : _ZN25elementwise_binary_sharedI8bfloat168sub_implIS0_E15shared_params_tIS0_EL5act_t0EE5setupER27elementwise_binary_params_tIS4_EPKv
194
+ _ZN25elementwise_binary_sharedI8bfloat168sub_implIS0_E15shared_params_tIS0_EL5act_t0EE3runEPS0_S7_S7_R27elementwise_binary_params_tIS4_E
195
+
196
+ Referenced symbols: _ZL9curr_iter
197
+ _ZL8core_row
198
+ sub1d_params
199
+ _ZN12me_primitive11control_rndE
200
+ _ZN12me_primitive11control_satE
201
+ _ZL11ifm1_offset
202
+ _ZL11ifm2_offset
203
+ _ZL8num_iter
204
+
205
+ 0x00003470..0x00003a9f ( 1584 items) : ../Release/0_0_reloadable24.o::_Z23resize_bilinear_scale_2I8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_S0_EEvPS1_PfS2_jjjj (Function, Weak, .text) (stack frame size = 0)
206
+
207
+ Referenced symbols: __const____Z23resize_bilinear_scale_2I8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_S0_EEvPS1_PfS2_jjjj___coeffs
208
+ __const____Z23resize_bilinear_scale_2I8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_S0_EEvPS1_PfS2_jjjj___coeffs_asymmetric
209
+ _ZN12me_primitive11control_rndE
210
+
211
+ 0x00003aa0..0x00003c75 ( 470 items) : ../Release/0_0_reloadable24.o::_ZN12mllib_graphs18resize_adf_wrapperI8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_Li1ELi0ELi2EEEvRNS2_9io_bufferIT_NS2_9direction2inET0_EERNSD_ISE_NSF_3outET1_EERA16_Kj (Function, Weak, .text) (stack frame size = 0)
212
+
213
+ Called functions : _Z23resize_bilinear_scale_2I8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_S0_EEvPS1_PfS2_jjjj
214
+
215
+ Referenced symbols: _ZZN12mllib_graphs18resize_adf_wrapperI8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_Li1ELi0ELi2EEEvRNS2_9io_bufferIT_NS2_9direction2inET0_EERNSD_ISE_NSF_3outET1_EERA16_KjE8cur_iter
216
+ _ZN12me_primitive11control_satE
217
+ _ZN12me_primitive11control_rndE
218
+ _ZZN12mllib_graphs18resize_adf_wrapperI8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_Li1ELi0ELi2EEEvRNS2_9io_bufferIT_NS2_9direction2inET0_EERNSD_ISE_NSF_3outET1_EERA16_KjE6params
219
+
220
+ 0x00003c80..0x00003c9f ( 32 items) : ../Release/0_0_reloadable24.o::_Z13_b853_wrapperPPv (Function, Global, .text) (stack frame size = 0)
221
+
222
+ Called functions : _ZN12mllib_graphs18resize_adf_wrapperI8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_Li1ELi0ELi2EEEvRNS2_9io_bufferIT_NS2_9direction2inET0_EERNSD_ISE_NSF_3outET1_EERA16_Kj
223
+
224
+ 0x00003ca0..0x00003cc3 ( 36 items) : ../Release/0_0_reloadable24.o::_Z13_b896_wrapperPPv (Function, Global, .text) (stack frame size = 0)
225
+
226
+ Called functions : _Z14conv2d_maxpoolRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEESF_RA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE
227
+
228
+ 0x00003cd0..0x00003cef ( 32 items) : ../Release/0_0_reloadable24.o::_Z14_b1638_wrapperPPv (Function, Global, .text) (stack frame size = 0)
229
+
230
+ Called functions : _Z21superkernel_sigmoid1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE
231
+
232
+ 0x00003cf0..0x00003d13 ( 36 items) : ../Release/0_0_reloadable24.o::_Z14_b1655_wrapperPPv (Function, Global, .text) (stack frame size = 0)
233
+
234
+ Called functions : _Z17superkernel_sub1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERNS0_IS1_NS2_3outESK_EE
235
+
236
+ 0x00003d20..0x00003d43 ( 36 items) : ../Release/0_0_reloadable24.o::_Z13_b891_wrapperPPv (Function, Global, .text) (stack frame size = 0)
237
+
238
+ Called functions : _Z17superkernel_mul1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERNS0_IS1_NS2_3outESK_EE
239
+
240
+ 0x00003d50..0x00003d6f ( 32 items) : ../Release/0_0_reloadable24.o::_Z14_b1672_wrapperPPv (Function, Global, .text) (stack frame size = 0)
241
+
242
+ Called functions : _Z18superkernel_tanh1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE
243
+
244
+ 0x00003d70..0x00003d93 ( 36 items) : ../Release/0_0_reloadable24.o::_Z13_b886_wrapperPPv (Function, Global, .text) (stack frame size = 0)
245
+
246
+ Called functions : _Z17superkernel_add1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERNS0_IS1_NS2_3outESK_EE
247
+
248
+
249
+ External symbols:
250
+
251
+ __dso_handle = 0x0
252
+ _ctors_end = 0x0
253
+ _ctors_start = 0x0
254
+ _dtors_end = 0x0
255
+ _dtors_start = 0x0
256
+ _pc_end = 0x3d94
257
+ _pc_start = 0x930
258
+ _sp_end_DM_stack = 0x7c400
259
+ _sp_start_DM_stack = 0x7bac0
260
+
261
+ Section summary for memory 'DM_stack':
262
+
263
+ .stack File
264
+ ---------- ----------
265
+ 2368
266
+ ---------- ----------
267
+ 2368 Total
268
+
269
+ Section summary for memory 'DMb':
270
+
271
+ .bss .data .rodata File
272
+ ---------- ---------- ---------- ----------
273
+ 928 4 92 ../Release/0_0_reloadable24.o
274
+ 5 0 0 me_defs.o(/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/Release/libme.a)
275
+ ---------- ---------- ---------- ----------
276
+ 933 4 92 Total
277
+
278
+ Section summary for memory 'PM':
279
+
280
+ .text File
281
+ ---------- ----------
282
+ 13188 ../Release/0_0_reloadable24.o
283
+ ---------- ----------
284
+ 13188 Total
285
+
286
+ File summary:
287
+
288
+ ../Release/0_0_reloadable24.o
289
+ DMb 1024
290
+ PM 13188
291
+
292
+ me_defs.o(/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/Release/libme.a)
293
+ DMb 5
294
+
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/3_3_reloadable24/Release/3_3_reloadable24.sdr ADDED
@@ -0,0 +1,125 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+
2
+ // File generated by bridge version V-2024.06#84922c0d9f#241219, Fri Mar 21 04:03:20 2025
3
+ // Copyright 2014-2024 Synopsys, Inc. All rights reserved.
4
+ // bridge -o../Release/0_0_reloadable24 ../Release/0_0_reloadable24.o -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/isg -g -I/usr/local/lib/python3.10/dist-packages/include -I/app/vaiml_1.3_examples/camo/./segmentation_1_4_0_fp32_combined/vaiml_par_0/0/backend -I/usr/local/lib/python3.10/site-packages/include/aie_api -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/common -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/include/common -I/usr/local/lib/python3.10/dist-packages/vitis_mllib -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/misc -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/src/ml_adf -I/app/vaiml_1.3_examples/camo/segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/. -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libcxx-lite/include -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libs/libcxx-9.0.0/include-lite -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime/include -D__AIENGINE__ -D__AIE_ARCH__=21 -DDEPLOYMENT_ELF=1 -D__LOCK_FENCE_MODE__=0 -D__IO_BUFFER_FORCE_LIGHT_WEIGHT__ -DAIE_API_EMULATE_BFLOAT16_MMUL_WITH_BFP16=1 -DAIE_OPTION_SCALAR_FLOAT_ON_VECTOR -D__tct_tgt__=241219 -c0_0_reloadable24.bcf -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/softfloat/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libcxx-lite/lib/Release_LLVM -lme -lc -lm -lc++lite -lsoftfloat -S -export-locals -iconfig extra_memories.bcf -yTM -m -fC -fS -fH +m -T +work ../Release/chesswork6947 -pme
5
+
6
+ // Release: ipp V-2024.06-TGT-241219
7
+
8
+ // Symbols in memory 'DM_bankA':
9
+ // Symbols in memory 'DM_bankAB':
10
+ // Symbols in memory 'DM_bankAC':
11
+ // Symbols in memory 'DM_bankAD':
12
+ // Symbols in memory 'DM_bankB':
13
+ // Symbols in memory 'DM_bankBC':
14
+ // Symbols in memory 'DM_bankBD':
15
+ // Symbols in memory 'DM_bankC':
16
+ // Symbols in memory 'DM_bankCD':
17
+ // Symbols in memory 'DM_bankD':
18
+ // Symbols in memory 'DM_stack':
19
+ // Symbols in memory 'DM_test':
20
+ // Symbols in memory 'DMb':
21
+ _symbol _ZZN12mllib_graphs18resize_adf_wrapperI8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_Li1ELi0ELi2EEEvRNS2_9io_bufferIT_NS2_9direction2inET0_EERNSD_ISE_NSF_3outET1_EERA16_KjE8cur_iter 0x0007c45c
22
+ _symbol _ZN12me_primitive11control_satE 0x0007c464
23
+ _symbol _ZN12me_primitive11control_rndE 0x0007c468
24
+ _symbol add1d_params 0x0007c540
25
+ _symbol mul1d_params 0x0007c580
26
+ _symbol sub1d_params 0x0007c5c0
27
+ _symbol sigmoid1d_params 0x0007c600
28
+ _symbol tanh1d_params 0x0007c640
29
+ _symbol conv2d_params 0x0007c680
30
+ _symbol _ZZN12mllib_graphs18resize_adf_wrapperI8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_Li1ELi0ELi2EEEvRNS2_9io_bufferIT_NS2_9direction2inET0_EERNSD_ISE_NSF_3outET1_EERA16_KjE6params 0x0007c840
31
+ // Symbols in memory 'DMh':
32
+ // Symbols in memory 'DMh_bankA':
33
+ // Symbols in memory 'DMh_bankAB':
34
+ // Symbols in memory 'DMh_bankAC':
35
+ // Symbols in memory 'DMh_bankAD':
36
+ // Symbols in memory 'DMh_bankB':
37
+ // Symbols in memory 'DMh_bankBC':
38
+ // Symbols in memory 'DMh_bankBD':
39
+ // Symbols in memory 'DMh_bankC':
40
+ // Symbols in memory 'DMh_bankCD':
41
+ // Symbols in memory 'DMh_bankD':
42
+ // Symbols in memory 'DMh_stack':
43
+ // Symbols in memory 'DMs':
44
+ // Symbols in memory 'DMs_bankA':
45
+ // Symbols in memory 'DMs_bankAB':
46
+ // Symbols in memory 'DMs_bankAC':
47
+ // Symbols in memory 'DMs_bankAD':
48
+ // Symbols in memory 'DMs_bankB':
49
+ // Symbols in memory 'DMs_bankBC':
50
+ // Symbols in memory 'DMs_bankBD':
51
+ // Symbols in memory 'DMs_bankC':
52
+ // Symbols in memory 'DMs_bankCD':
53
+ // Symbols in memory 'DMs_bankD':
54
+ // Symbols in memory 'DMs_stack':
55
+ // Symbols in memory 'DMv':
56
+ // Symbols in memory 'DMv_bankA':
57
+ // Symbols in memory 'DMv_bankAB':
58
+ // Symbols in memory 'DMv_bankAC':
59
+ // Symbols in memory 'DMv_bankAD':
60
+ // Symbols in memory 'DMv_bankB':
61
+ // Symbols in memory 'DMv_bankBC':
62
+ // Symbols in memory 'DMv_bankBD':
63
+ // Symbols in memory 'DMv_bankC':
64
+ // Symbols in memory 'DMv_bankCD':
65
+ // Symbols in memory 'DMv_bankD':
66
+ // Symbols in memory 'DMv_stack':
67
+ // Symbols in memory 'DMw':
68
+ // Symbols in memory 'DMw_bankA':
69
+ // Symbols in memory 'DMw_bankAB':
70
+ // Symbols in memory 'DMw_bankAC':
71
+ // Symbols in memory 'DMw_bankAD':
72
+ // Symbols in memory 'DMw_bankB':
73
+ // Symbols in memory 'DMw_bankBC':
74
+ // Symbols in memory 'DMw_bankBD':
75
+ // Symbols in memory 'DMw_bankC':
76
+ // Symbols in memory 'DMw_bankCD':
77
+ // Symbols in memory 'DMw_bankD':
78
+ // Symbols in memory 'DMw_stack':
79
+ // Symbols in memory 'DMx':
80
+ // Symbols in memory 'DMx_bankA':
81
+ // Symbols in memory 'DMx_bankAB':
82
+ // Symbols in memory 'DMx_bankAC':
83
+ // Symbols in memory 'DMx_bankAD':
84
+ // Symbols in memory 'DMx_bankB':
85
+ // Symbols in memory 'DMx_bankBC':
86
+ // Symbols in memory 'DMx_bankBD':
87
+ // Symbols in memory 'DMx_bankC':
88
+ // Symbols in memory 'DMx_bankCD':
89
+ // Symbols in memory 'DMx_bankD':
90
+ // Symbols in memory 'DMx_stack':
91
+ // Symbols in memory 'PM':
92
+ _symbol _Z13kernelWrapperPPvjjjj 0x00000930
93
+ _symbol _Z24setup_conv2d_bf16_paramsILb1ELb0EEvPKjR18conv2d_bf16_paramshh 0x00000b60
94
+ _symbol _Z21convert_bf16_to_bfp16I8bfloat16Lb0EEvPT_PS0_RK13BfToBfpParams 0x00001100
95
+ _symbol _Z11conv2d_bf16ILh1EL5act_t0E8bfloat16S1_S1_N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_NS3_IS5_NS6_5asyncES9_SB_EELb0ELb0ELb1ELb0EEvRNS2_9io_bufferIT1_NS2_9direction2inET4_EERNSF_IT2_SI_T5_EERNSF_IT3_NSH_3outET6_EER18conv2d_bf16_params 0x00001210
96
+ _symbol _Z14conv2d_maxpoolRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEESF_RA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE 0x00001b80
97
+ _symbol _ZN17elementwise_unaryI8bfloat1619elementwise_sigmoidIS0_E26sigmoid_templated_params_tIS0_EE5setupER26elementwise_unary_params_tIS4_EPKv 0x00001fe0
98
+ _symbol _ZN17elementwise_unaryI8bfloat1619elementwise_sigmoidIS0_E26sigmoid_templated_params_tIS0_EE3runEPS0_S6_R26elementwise_unary_params_tIS4_E 0x00002020
99
+ _symbol _Z21superkernel_sigmoid1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE 0x000021a0
100
+ _symbol _ZN17elementwise_unaryI8bfloat1616elementwise_tanhIS0_E23tanh_templated_params_tIS0_EE5setupER26elementwise_unary_params_tIS4_EPKv 0x00002390
101
+ _symbol _ZN17elementwise_unaryI8bfloat1616elementwise_tanhIS0_E23tanh_templated_params_tIS0_EE3runEPS0_S6_R26elementwise_unary_params_tIS4_E 0x000023d0
102
+ _symbol _Z18superkernel_tanh1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE 0x000027a0
103
+ _symbol _ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE21shared_setup_backboneER27elementwise_binary_params_tIS5_EPKv 0x00002990
104
+ _symbol _ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE5setupER27elementwise_binary_params_tIS5_EPKv 0x00002a10
105
+ _symbol _ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE3runEPS0_S7_S7_R27elementwise_binary_params_tIS5_E 0x00002a80
106
+ _symbol _Z17superkernel_add1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERNS0_IS1_NS2_3outESK_EE 0x00002a90
107
+ _symbol _ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS4_E 0x00002cf0
108
+ _symbol _ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS4_EPKv 0x00002d10
109
+ _symbol _ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE3runEPS0_S6_S6_R27elementwise_binary_params_tIS4_E 0x00002da0
110
+ _symbol _Z17superkernel_mul1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERNS0_IS1_NS2_3outESK_EE 0x00002ed0
111
+ _symbol _ZN25elementwise_binary_sharedI8bfloat168sub_implIS0_E15shared_params_tIS0_EL5act_t0EE21shared_setup_backboneER27elementwise_binary_params_tIS4_EPKv 0x00003130
112
+ _symbol _ZN25elementwise_binary_sharedI8bfloat168sub_implIS0_E15shared_params_tIS0_EL5act_t0EE5setupER27elementwise_binary_params_tIS4_EPKv 0x000031b0
113
+ _symbol _ZN25elementwise_binary_sharedI8bfloat168sub_implIS0_E15shared_params_tIS0_EL5act_t0EE3runEPS0_S7_S7_R27elementwise_binary_params_tIS4_E 0x00003200
114
+ _symbol _Z17superkernel_sub1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERNS0_IS1_NS2_3outESK_EE 0x00003210
115
+ _symbol _Z23resize_bilinear_scale_2I8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_S0_EEvPS1_PfS2_jjjj 0x00003470
116
+ _symbol _ZN12mllib_graphs18resize_adf_wrapperI8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_Li1ELi0ELi2EEEvRNS2_9io_bufferIT_NS2_9direction2inET0_EERNSD_ISE_NSF_3outET1_EERA16_Kj 0x00003aa0
117
+ _symbol _Z13_b853_wrapperPPv 0x00003c80
118
+ _symbol _Z13_b896_wrapperPPv 0x00003ca0
119
+ _symbol _Z14_b1638_wrapperPPv 0x00003cd0
120
+ _symbol _Z14_b1655_wrapperPPv 0x00003cf0
121
+ _symbol _Z13_b891_wrapperPPv 0x00003d20
122
+ _symbol _Z14_b1672_wrapperPPv 0x00003d50
123
+ _symbol _Z13_b886_wrapperPPv 0x00003d70
124
+ // Symbols in memory 'PMw':
125
+ // Symbols in memory 'TM4':
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/3_3_reloadable24/Release/3_3_reloadable24.srv ADDED
The diff for this file is too large to render. See raw diff
 
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/3_3_reloadable24/Release/3_3_reloadable24.txt ADDED
The diff for this file is too large to render. See raw diff
 
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/3_3_reloadable24/scripts/3_3_reloadable24.bcf ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ _reserved DMb 0x0 0x40000
2
+
3
+ _reserved PM 0x0 0x930 //reserved for main elf
4
+
5
+ _entry_point _Z13kernelWrapperPPvjjjj
6
+ _symbol _Z13kernelWrapperPPvjjjj 0x930
7
+
8
+ _reserved DMb 0x7b280 0x800 //reserved for lcp ping-pong buffers
9
+ _reserved DMb 0x7ba80 0x40 //reserved for sync buffer
10
+ _stack DM_stack 0x7bac0 0x940 //stack for core
11
+ _reserved DMb 0x7c400 0x40 //reserved for main elf heap
12
+ //space for synopsys compiler at 0x7c440 0x880//heap
13
+ _reserved DMb 0x40000 0x3b280
14
+
15
+ _reserved DMb 0x7ccc0 0x3340
16
+ _reserved DMb 0x80000 0x80000 // And everything else the core can't see
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/3_3_reloadable24/scripts/3_3_reloadable24.prx ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ <project name="Project" processor="me">
2
+ <issinit/>
3
+ <option id="cpp.define" value="__AIENGINE__ __AIE_ARCH__=21" inherit = "1"/>
4
+ <option id="llvm.xargs" value="-fno-jump-tables -fno-discard-value-names" inherit = "1"/>
5
+ <option id="llvm.lang" value="Follow file extension"/>
6
+ <option id="bridge.cfg" value="3_3_reloadable24.bcf"/>
7
+ <option id="bridge.alibs" value=" ../Release/3_3_reloadable24.o" inherit="1" cfg="Release_LLVM"/>
8
+ <option id="cpp.include" value="&lt;XILINX_VITIS_AIETOOLS&gt;/include /app/vaiml_1.3_examples/camo/./segmentation_1_4_0_fp32_combined/vaiml_par_0/0/backend /usr/local/lib/python3.10/site-packages/include/aie_api /usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/common /usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/include/common /usr/local/lib/python3.10/dist-packages/vitis_mllib /usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/misc /usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/src/ml_adf /app/vaiml_1.3_examples/camo/segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/&lt;AIE_SRC_DIR&gt; " inherit="1"/>
9
+ <option id="project.dir" value="&lt;CONFIG&gt;/3_3_reloadable24"/>
10
+ <option id="project.name" value="3_3_reloadable24"/>
11
+ <option id="project.type" value="exe"/>
12
+ <option id="simrun.issca" value="&lt;XILINX_VITIS_AIETOOLS&gt;/bin/unwrapped/lnx64.o/aie2p/ca_udm_dbg" inherit="0"/>
13
+ </project>
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/3_3_reloadable24/src/3_3_reloadable24.cc ADDED
@@ -0,0 +1,113 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ // Automatically generated processor driver using AIEngine tool-chain
2
+
3
+ #include <stdio.h>
4
+ #include <memory>
5
+ #include <adf.h>
6
+
7
+
8
+ // Declare Kernel functions and initializers
9
+ #include "resize_adf_wrapper.cpp"
10
+ void conv2d_maxpool(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict,adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict,const unsigned int (&)[16],adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict);
11
+ void superkernel_sigmoid1d(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict,const unsigned int (&)[16],adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict);
12
+ void superkernel_sub1d(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict,const unsigned int (&)[16],adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict,adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict);
13
+ void superkernel_mul1d(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict,const unsigned int (&)[16],adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict,adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict);
14
+ void superkernel_tanh1d(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict,const unsigned int (&)[16],adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict);
15
+ void superkernel_add1d(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict,const unsigned int (&)[16],adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict,adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict);
16
+
17
+ // Declare Kernel objects and external arrays
18
+
19
+
20
+ void _b853_wrapper(void* args[]) // Type-erased adapter: casts the entries of args[] and forwards them to mllib_graphs::resize_adf_wrapper.
21
+ {
22
+ mllib_graphs::resize_adf_wrapper<bfloat16, adf::io_buffer_config<adf::extents<>>, adf::io_buffer_config<adf::extents<>>, 1, 0, 2>(
23
+ *reinterpret_cast<adf::input_buffer_conf<bfloat16, adf::bpc_sync_0d>*>(args[0]), // args[0] -> bfloat16 input buffer (bpc_sync_0d)
24
+ *reinterpret_cast<adf::output_buffer_conf<bfloat16, adf::bpc_sync_0d>*>(args[1]), // args[1] -> bfloat16 output buffer (bpc_sync_0d)
25
+ *reinterpret_cast<uint32 const(*)[16]>(args[2])); // args[2] -> const uint32[16]; contents are interpreted by the callee, not here
26
+ }
27
+
28
+ void _b896_wrapper(void* args[]) // Type-erased adapter: casts the entries of args[] and forwards them to conv2d_maxpool.
29
+ {
30
+ conv2d_maxpool(
31
+ *reinterpret_cast<adf::input_buffer_conf<bfloat16, adf::bpc_sync_0d>*>(args[0]), // args[0] -> first bfloat16 input buffer (bpc_sync_0d)
32
+ *reinterpret_cast<adf::input_buffer_conf<bfloat16, adf::bpc_sync_0d>*>(args[1]), // args[1] -> second bfloat16 input buffer (bpc_sync_0d)
33
+ *reinterpret_cast<uint32 const(*)[16]>(args[3]), // args[3] -> const uint32[16]; note args[] order differs from the callee's parameter order
34
+ *reinterpret_cast<adf::output_buffer_conf<bfloat16, adf::bpc_async_0d>*>(args[2])); // args[2] -> bfloat16 output buffer (bpc_async_0d)
35
+ }
36
+
37
+ void _b1638_wrapper(void* args[]) // Type-erased adapter: casts the entries of args[] and forwards them to superkernel_sigmoid1d.
38
+ {
39
+ superkernel_sigmoid1d(
40
+ *reinterpret_cast<adf::input_buffer_conf<bfloat16, adf::bpc_sync_0d>*>(args[0]), // args[0] -> bfloat16 input buffer (bpc_sync_0d)
41
+ *reinterpret_cast<uint32 const(*)[16]>(args[2]), // args[2] -> const uint32[16]; note args[] order differs from the callee's parameter order
42
+ *reinterpret_cast<adf::output_buffer_conf<bfloat16, adf::bpc_async_0d>*>(args[1])); // args[1] -> bfloat16 output buffer (bpc_async_0d)
43
+ }
44
+
45
+ void _b1655_wrapper(void* args[]) // Type-erased adapter: casts the entries of args[] and forwards them to superkernel_sub1d.
46
+ {
47
+ superkernel_sub1d(
48
+ *reinterpret_cast<adf::input_buffer_conf<bfloat16, adf::bpc_sync_0d>*>(args[0]), // args[0] -> bfloat16 input buffer (bpc_sync_0d)
49
+ *reinterpret_cast<uint32 const(*)[16]>(args[3]), // args[3] -> const uint32[16]; note args[] order differs from the callee's parameter order
50
+ *reinterpret_cast<adf::input_buffer_conf<bfloat16, adf::bpc_async_0d>*>(args[1]), // args[1] -> bfloat16 input buffer (bpc_async_0d)
51
+ *reinterpret_cast<adf::output_buffer_conf<bfloat16, adf::bpc_async_0d>*>(args[2])); // args[2] -> bfloat16 output buffer (bpc_async_0d)
52
+ }
53
+
54
+ void _b891_wrapper(void* args[]) // Type-erased adapter: casts the entries of args[] and forwards them to superkernel_mul1d.
55
+ {
56
+ superkernel_mul1d(
57
+ *reinterpret_cast<adf::input_buffer_conf<bfloat16, adf::bpc_sync_0d>*>(args[0]), // args[0] -> bfloat16 input buffer (bpc_sync_0d)
58
+ *reinterpret_cast<uint32 const(*)[16]>(args[3]), // args[3] -> const uint32[16]; note args[] order differs from the callee's parameter order
59
+ *reinterpret_cast<adf::input_buffer_conf<bfloat16, adf::bpc_async_0d>*>(args[1]), // args[1] -> bfloat16 input buffer (bpc_async_0d)
60
+ *reinterpret_cast<adf::output_buffer_conf<bfloat16, adf::bpc_async_0d>*>(args[2])); // args[2] -> bfloat16 output buffer (bpc_async_0d)
61
+ }
62
+
63
+ void _b1672_wrapper(void* args[]) // Type-erased adapter: casts the entries of args[] and forwards them to superkernel_tanh1d.
64
+ {
65
+ superkernel_tanh1d(
66
+ *reinterpret_cast<adf::input_buffer_conf<bfloat16, adf::bpc_sync_0d>*>(args[0]), // args[0] -> bfloat16 input buffer (bpc_sync_0d)
67
+ *reinterpret_cast<uint32 const(*)[16]>(args[2]), // args[2] -> const uint32[16]; note args[] order differs from the callee's parameter order
68
+ *reinterpret_cast<adf::output_buffer_conf<bfloat16, adf::bpc_async_0d>*>(args[1])); // args[1] -> bfloat16 output buffer (bpc_async_0d)
69
+ }
70
+
71
+ void _b886_wrapper(void* args[]) // Type-erased adapter: casts the entries of args[] and forwards them to superkernel_add1d.
72
+ {
73
+ superkernel_add1d(
74
+ *reinterpret_cast<adf::input_buffer_conf<bfloat16, adf::bpc_sync_0d>*>(args[0]), // args[0] -> bfloat16 input buffer (bpc_sync_0d)
75
+ *reinterpret_cast<uint32 const(*)[16]>(args[3]), // args[3] -> const uint32[16]; note args[] order differs from the callee's parameter order
76
+ *reinterpret_cast<adf::input_buffer_conf<bfloat16, adf::bpc_async_0d>*>(args[1]), // args[1] -> bfloat16 input buffer (bpc_async_0d)
77
+ *reinterpret_cast<adf::output_buffer_conf<bfloat16, adf::bpc_async_0d>*>(args[2])); // args[2] -> bfloat16 output buffer (bpc_async_0d)
78
+ }
79
+
80
+ using UniformKernelFunc = void (*)(void **); // common signature shared by every _bNNN_wrapper in this file
81
+
82
+ static UniformKernelFunc g_uniformKernelFuncs[7] = { // dispatch table; kernelWrapper indexes it with kernelId
83
+ _b853_wrapper, // [0] forwards to mllib_graphs::resize_adf_wrapper
84
+ _b896_wrapper, // [1] forwards to conv2d_maxpool
85
+ _b1638_wrapper, // [2] forwards to superkernel_sigmoid1d
86
+ _b1655_wrapper, // [3] forwards to superkernel_sub1d
87
+ _b891_wrapper, // [4] forwards to superkernel_mul1d
88
+ _b1672_wrapper, // [5] forwards to superkernel_tanh1d
89
+ _b886_wrapper // [6] forwards to superkernel_add1d
90
+ };
91
+
92
+ __attribute__((always_inline)) void kernelWrapper(void* args[], uint32 kernelId, uint32 numSyncIn, uint32 numAsyncIn, uint32 numSyncOut) // Calls acquire on selected args[] entries, dispatches kernel #kernelId with args, then calls release on the same entries.
93
+ {
94
+ uint32 idx = 0; // cursor into args[]
95
+ reinterpret_cast<adf::_io_buffer_light_weight_generic*>(args[idx])->acquire<adf::direction::in>(numSyncIn > 0); // called unconditionally; the bool is presumably an enable flag (no-op when false) - TODO confirm against the adf runtime
96
+ idx += (numSyncIn > 0) ? 1 : 0; // advance only if a first sync input exists
97
+ reinterpret_cast<adf::_io_buffer_light_weight_generic*>(args[idx])->acquire<adf::direction::in>(numSyncIn > 1); // same pattern for a second sync input
98
+ idx += (numSyncIn > 1) ? 1 : 0; // at most two sync inputs are walked here
99
+ idx += numAsyncIn; // step over numAsyncIn entries without calling acquire on them
100
+ reinterpret_cast<adf::_io_buffer_light_weight_generic*>(args[idx])->acquire<adf::direction::out>(numSyncOut > 0); // same pattern for one sync output
101
+ idx += (numSyncOut > 0) ? 1 : 0; // NOTE(review): value is never read; idx is reset to 0 below
102
+
103
+ (*(g_uniformKernelFuncs[kernelId]))(args); // NOTE(review): kernelId is not range-checked against the 7-entry table
104
+
105
+ idx = 0; // repeat the identical walk over args[], this time calling release
106
+ reinterpret_cast<adf::_io_buffer_light_weight_generic*>(args[idx])->release<adf::direction::in>(numSyncIn > 0);
107
+ idx += (numSyncIn > 0) ? 1 : 0;
108
+ reinterpret_cast<adf::_io_buffer_light_weight_generic*>(args[idx])->release<adf::direction::in>(numSyncIn > 1);
109
+ idx += (numSyncIn > 1) ? 1 : 0;
110
+ idx += numAsyncIn; // step over numAsyncIn entries without calling release on them
111
+ reinterpret_cast<adf::_io_buffer_light_weight_generic*>(args[idx])->release<adf::direction::out>(numSyncOut > 0);
112
+ idx += (numSyncOut > 0) ? 1 : 0; // NOTE(review): value is never read; function ends here
113
+ }
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/3_3_reloadable25/Release/3_3_reloadable25.calltree ADDED
@@ -0,0 +1,48 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+
2
+ // File generated by bridge version V-2024.06#84922c0d9f#241219, Fri Mar 21 04:04:39 2025
3
+ // Copyright 2014-2024 Synopsys, Inc. All rights reserved.
4
+ // bridge -o../Release/0_0_reloadable25 ../Release/0_0_reloadable25.o -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/isg -g -I/usr/local/lib/python3.10/dist-packages/include -I/app/vaiml_1.3_examples/camo/./segmentation_1_4_0_fp32_combined/vaiml_par_0/0/backend -I/usr/local/lib/python3.10/site-packages/include/aie_api -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/common -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/include/common -I/usr/local/lib/python3.10/dist-packages/vitis_mllib -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/misc -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/src/ml_adf -I/app/vaiml_1.3_examples/camo/segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/. -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libcxx-lite/include -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libs/libcxx-9.0.0/include-lite -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime/include -D__AIENGINE__ -D__AIE_ARCH__=21 -DDEPLOYMENT_ELF=1 -D__LOCK_FENCE_MODE__=0 -D__IO_BUFFER_FORCE_LIGHT_WEIGHT__ -DAIE_API_EMULATE_BFLOAT16_MMUL_WITH_BFP16=1 -DAIE_OPTION_SCALAR_FLOAT_ON_VECTOR -D__tct_tgt__=241219 -c0_0_reloadable25.bcf -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/softfloat/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libcxx-lite/lib/Release_LLVM -lme -lc -lm -lc++lite -lsoftfloat -S -export-locals -iconfig extra_memories.bcf -yTM -m -fC -fS -fH +m -T +work ../Release/chesswork7302 -pme
5
+
6
+
7
+ // Release: ipp V-2024.06-TGT-241219
8
+
9
+ _Z13kernelWrapperPPvjjjj
10
+ _Z13_b806_wrapperPPv (referenced text)
11
+ _ZN12mllib_graphs17slice_adf_wrapperILi1E8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_EEvRNS2_9io_bufferIT0_NS2_9direction2inET1_EERNSD_ISE_NSF_3outET2_EERA7_Kj
12
+ _Z11slice_hcwc8I8bfloat16EvPT_S2_R18slice_hcwc8_params
13
+ _Z13_b906_wrapperPPv (referenced text)
14
+ _Z18superkernel_clip1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE
15
+ _ZN17elementwise_unaryI8bfloat1616elementwise_clipIS0_E20clip_internal_paramsIS0_EE5setupER26elementwise_unary_params_tIS4_EPKv
16
+ _ZN17elementwise_unaryI8bfloat1616elementwise_clipIS0_E20clip_internal_paramsIS0_EE3runEPS0_S6_R26elementwise_unary_params_tIS4_E
17
+ _Z13_b886_wrapperPPv (referenced text)
18
+ _Z17superkernel_add1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERNS0_IS1_NS2_3outESK_EE
19
+ _ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE5setupER27elementwise_binary_params_tIS5_EPKv
20
+ _ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE21shared_setup_backboneER27elementwise_binary_params_tIS5_EPKv
21
+ _ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE3runEPS0_S7_S7_R27elementwise_binary_params_tIS5_E
22
+ _ZL19shared_run_backboneI8bfloat16L5act_t0EEKvPT_S4_S4_R27elementwise_binary_params_tI15shared_params_tIS3_EE
23
+
24
+
25
+ Call tree stack and functions sizes:
26
+
27
+ stack stack stack call func func function name
28
+ desc level level desc
29
+ ----- ----- ----- ----- ----- ----- --------------------------------------------------------------
30
+ 64 256 0 0 408 4160 _Z13kernelWrapperPPvjjjj
31
+ 0 192 1 1 32 1488 _Z13_b806_wrapperPPv
32
+ 192 192 1 2 674 1456 _ZN12mllib_graphs17slice_adf_wrapperILi1E8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_EEvRNS2_9io_bufferIT0_NS2_9direction2inET1_EERNSD_ISE_NSF_3outET2_EERA7_Kj <tail call>
33
+ 0 0 2 3 782 782 _Z11slice_hcwc8I8bfloat16EvPT_S2_R18slice_hcwc8_params
34
+ 0 64 1 1 32 862 _Z13_b906_wrapperPPv
35
+ 64 64 1 2 488 830 _Z18superkernel_clip1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE <tail call>
36
+ 0 0 2 3 100 100 _ZN17elementwise_unaryI8bfloat1616elementwise_clipIS0_E20clip_internal_paramsIS0_EE5setupER26elementwise_unary_params_tIS4_EPKv
37
+ 0 0 2 3 242 242 _ZN17elementwise_unaryI8bfloat1616elementwise_clipIS0_E20clip_internal_paramsIS0_EE3runEPS0_S6_R26elementwise_unary_params_tIS4_E
38
+ 0 192 1 1 36 1402 _Z13_b886_wrapperPPv
39
+ 64 192 1 2 602 1366 _Z17superkernel_add1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERNS0_IS1_NS2_3outESK_EE <tail call>
40
+ 64 64 2 3 98 214 _ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE5setupER27elementwise_binary_params_tIS5_EPKv
41
+ 0 0 3 4 116 116 _ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE21shared_setup_backboneER27elementwise_binary_params_tIS5_EPKv
42
+ 0 128 2 3 16 550 _ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE3runEPS0_S7_S7_R27elementwise_binary_params_tIS5_E
43
+ 128 128 2 4 534 534 _ZL19shared_run_backboneI8bfloat16L5act_t0EEKvPT_S4_S4_R27elementwise_binary_params_tI15shared_params_tIS3_EE <tail call>
44
+
45
+
46
+ Maximum call level : 4
47
+ Maximum stack level: 3
48
+ Maximum stack size : 256
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/3_3_reloadable25/Release/3_3_reloadable25.cmic2 ADDED
The diff for this file is too large to render. See raw diff
 
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/3_3_reloadable25/Release/3_3_reloadable25.cmico ADDED
@@ -0,0 +1 @@
 
 
1
+ +Mdec
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/3_3_reloadable25/Release/3_3_reloadable25.lst ADDED
The diff for this file is too large to render. See raw diff
 
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/3_3_reloadable25/Release/3_3_reloadable25.map ADDED
@@ -0,0 +1,161 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+
2
+ // File generated by bridge version V-2024.06#84922c0d9f#241219, Fri Mar 21 04:04:39 2025
3
+ // Copyright 2014-2024 Synopsys, Inc. All rights reserved.
4
+ // bridge -o../Release/0_0_reloadable25 ../Release/0_0_reloadable25.o -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/isg -g -I/usr/local/lib/python3.10/dist-packages/include -I/app/vaiml_1.3_examples/camo/./segmentation_1_4_0_fp32_combined/vaiml_par_0/0/backend -I/usr/local/lib/python3.10/site-packages/include/aie_api -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/common -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/include/common -I/usr/local/lib/python3.10/dist-packages/vitis_mllib -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/misc -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/src/ml_adf -I/app/vaiml_1.3_examples/camo/segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/. -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libcxx-lite/include -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libs/libcxx-9.0.0/include-lite -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime/include -D__AIENGINE__ -D__AIE_ARCH__=21 -DDEPLOYMENT_ELF=1 -D__LOCK_FENCE_MODE__=0 -D__IO_BUFFER_FORCE_LIGHT_WEIGHT__ -DAIE_API_EMULATE_BFLOAT16_MMUL_WITH_BFP16=1 -DAIE_OPTION_SCALAR_FLOAT_ON_VECTOR -D__tct_tgt__=241219 -c0_0_reloadable25.bcf -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/softfloat/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libcxx-lite/lib/Release_LLVM -lme -lc -lm -lc++lite -lsoftfloat -S -export-locals -iconfig extra_memories.bcf -yTM -m -fC -fS -fH +m -T +work ../Release/chesswork7302 -pme
5
+
6
+ // Release: ipp V-2024.06-TGT-241219
7
+
8
+ Memory map for memory 'DM_stack':
9
+
10
+ Size = 1048576
11
+ Width = 8 bits
12
+ Offset = 0
13
+ Used = 2368
14
+
15
+ 0x0007bac0..0x0007c3ff ( 2368 items) : Stack
16
+
17
+ Memory map for memory 'DMb':
18
+
19
+ Size = 1048576
20
+ Width = 8 bits
21
+ Offset = 0
22
+ Used = 2533
23
+
24
+ 0x00000000..0x0007babf ( 506560 items) : Reserved
25
+ 0x0007bac0..0x0007c3ff ( 2368 items) : Stack
26
+ 0x0007c400..0x0007c43f ( 64 items) : Reserved
27
+ 0x0007c440..0x0007c443 ( 4 items) : ../Release/0_0_reloadable25.o::_ZL9curr_iter (Data, Local, .bss.DMb.4)
28
+ 0x0007c444..0x0007c447 ( 4 items) : ../Release/0_0_reloadable25.o::_ZL8core_row (Data, Local, .bss.DMb.4)
29
+ 0x0007c448..0x0007c44b ( 4 items) : ../Release/0_0_reloadable25.o::_ZL11ifm1_offset (Data, Local, .bss.DMb.4)
30
+ 0x0007c44c..0x0007c44f ( 4 items) : ../Release/0_0_reloadable25.o::_ZL11ifm2_offset (Data, Local, .bss.DMb.4)
31
+ 0x0007c450..0x0007c453 ( 4 items) : ../Release/0_0_reloadable25.o::_ZL8num_iter (Data, Local, .data.DMb.4)
32
+ 0x0007c454..0x0007c457 ( 4 items) : me_defs.o(/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/Release/libme.a)::_ZN12me_primitive11control_satE (Data, Global, .bss.DMb.4)
33
+ 0x0007c458..0x0007c458 ( 1 items) : me_defs.o(/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/Release/libme.a)::_ZN12me_primitive11control_rndE (Data, Global, .bss.DMb.1)
34
+ 0x0007c480..0x0007c48b ( 12 items) : ../Release/0_0_reloadable25.o::_ZL20g_uniformKernelFuncs (Data, Local, .rodata.DMb.64)
35
+
36
+ Called functions : _Z13_b806_wrapperPPv
37
+ _Z13_b906_wrapperPPv
38
+ _Z13_b886_wrapperPPv
39
+
40
+ 0x0007c4c0..0x0007c4ff ( 64 items) : ../Release/0_0_reloadable25.o::add1d_params (Data, Global, .bss.DMb.64)
41
+ 0x0007c500..0x0007c53f ( 64 items) : ../Release/0_0_reloadable25.o::clip1d_params (Data, Global, .bss.DMb.64)
42
+ 0x0007ccc0..0x000fffff ( 537408 items) : Reserved
43
+
44
+ Memory map for memory 'PM':
45
+
46
+ Size = 1048576
47
+ Width = 8 bits
48
+ Offset = 0
49
+ Used = 4160
50
+
51
+ 0x00000000..0x0000092f ( 2352 items) : Reserved
52
+ 0x00000930..0x00000ac7 ( 408 items) : ../Release/0_0_reloadable25.o::_Z13kernelWrapperPPvjjjj (Function, Global, .text) (stack frame size = 64)
53
+
54
+ Referenced symbols: _ZL20g_uniformKernelFuncs
55
+
56
+ 0x00000ad0..0x00000b33 ( 100 items) : ../Release/0_0_reloadable25.o::_ZN17elementwise_unaryI8bfloat1616elementwise_clipIS0_E20clip_internal_paramsIS0_EE5setupER26elementwise_unary_params_tIS4_EPKv (Function, Weak, .text) (stack frame size = 0)
57
+ 0x00000b40..0x00000c31 ( 242 items) : ../Release/0_0_reloadable25.o::_ZN17elementwise_unaryI8bfloat1616elementwise_clipIS0_E20clip_internal_paramsIS0_EE3runEPS0_S6_R26elementwise_unary_params_tIS4_E (Function, Weak, .text) (stack frame size = 0)
58
+ 0x00000c40..0x00000e27 ( 488 items) : ../Release/0_0_reloadable25.o::_Z18superkernel_clip1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE (Function, Global, .text) (stack frame size = 64)
59
+
60
+ Called functions : _ZN17elementwise_unaryI8bfloat1616elementwise_clipIS0_E20clip_internal_paramsIS0_EE5setupER26elementwise_unary_params_tIS4_EPKv
61
+ _ZN17elementwise_unaryI8bfloat1616elementwise_clipIS0_E20clip_internal_paramsIS0_EE3runEPS0_S6_R26elementwise_unary_params_tIS4_E
62
+
63
+ Referenced symbols: _ZL9curr_iter
64
+ _ZL8core_row
65
+ clip1d_params
66
+ _ZN12me_primitive11control_rndE
67
+ _ZN12me_primitive11control_satE
68
+ _ZL11ifm1_offset
69
+ _ZL8num_iter
70
+
71
+ 0x00000e30..0x00001045 ( 534 items) : ../Release/0_0_reloadable25.o::_ZL19shared_run_backboneI8bfloat16L5act_t0EEKvPT_S4_S4_R27elementwise_binary_params_tI15shared_params_tIS3_EE (Function, Local, .text) (stack frame size = 128)
72
+
73
+ Referenced symbols: _ZN12me_primitive11control_rndE
74
+
75
+ 0x00001050..0x000010c3 ( 116 items) : ../Release/0_0_reloadable25.o::_ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE21shared_setup_backboneER27elementwise_binary_params_tIS5_EPKv (Function, Weak, .text) (stack frame size = 0)
76
+ 0x000010d0..0x00001131 ( 98 items) : ../Release/0_0_reloadable25.o::_ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE5setupER27elementwise_binary_params_tIS5_EPKv (Function, Weak, .text) (stack frame size = 64)
77
+
78
+ Called functions : _ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE21shared_setup_backboneER27elementwise_binary_params_tIS5_EPKv
79
+
80
+ 0x00001140..0x0000114f ( 16 items) : ../Release/0_0_reloadable25.o::_ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE3runEPS0_S7_S7_R27elementwise_binary_params_tIS5_E (Function, Weak, .text) (stack frame size = 0)
81
+
82
+ Called functions : _ZL19shared_run_backboneI8bfloat16L5act_t0EEKvPT_S4_S4_R27elementwise_binary_params_tI15shared_params_tIS3_EE
83
+
84
+ 0x00001150..0x000013a9 ( 602 items) : ../Release/0_0_reloadable25.o::_Z17superkernel_add1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERNS0_IS1_NS2_3outESK_EE (Function, Global, .text) (stack frame size = 64)
85
+
86
+ Called functions : _ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE5setupER27elementwise_binary_params_tIS5_EPKv
87
+ _ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE3runEPS0_S7_S7_R27elementwise_binary_params_tIS5_E
88
+
89
+ Referenced symbols: _ZL9curr_iter
90
+ _ZL8core_row
91
+ add1d_params
92
+ _ZN12me_primitive11control_rndE
93
+ _ZN12me_primitive11control_satE
94
+ _ZL11ifm1_offset
95
+ _ZL11ifm2_offset
96
+ _ZL8num_iter
97
+
98
+ 0x000013b0..0x000016bd ( 782 items) : ../Release/0_0_reloadable25.o::_Z11slice_hcwc8I8bfloat16EvPT_S2_R18slice_hcwc8_params (Function, Weak, .text) (stack frame size = 0)
99
+ 0x000016c0..0x00001961 ( 674 items) : ../Release/0_0_reloadable25.o::_ZN12mllib_graphs17slice_adf_wrapperILi1E8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_EEvRNS2_9io_bufferIT0_NS2_9direction2inET1_EERNSD_ISE_NSF_3outET2_EERA7_Kj (Function, Weak, .text) (stack frame size = 192)
100
+
101
+ Called functions : _Z11slice_hcwc8I8bfloat16EvPT_S2_R18slice_hcwc8_params
102
+
103
+ 0x00001970..0x0000198f ( 32 items) : ../Release/0_0_reloadable25.o::_Z13_b806_wrapperPPv (Function, Global, .text) (stack frame size = 0)
104
+
105
+ Called functions : _ZN12mllib_graphs17slice_adf_wrapperILi1E8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_EEvRNS2_9io_bufferIT0_NS2_9direction2inET1_EERNSD_ISE_NSF_3outET2_EERA7_Kj
106
+
107
+ 0x00001990..0x000019af ( 32 items) : ../Release/0_0_reloadable25.o::_Z13_b906_wrapperPPv (Function, Global, .text) (stack frame size = 0)
108
+
109
+ Called functions : _Z18superkernel_clip1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE
110
+
111
+ 0x000019b0..0x000019d3 ( 36 items) : ../Release/0_0_reloadable25.o::_Z13_b886_wrapperPPv (Function, Global, .text) (stack frame size = 0)
112
+
113
+ Called functions : _Z17superkernel_add1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERNS0_IS1_NS2_3outESK_EE
114
+
115
+
116
+ External symbols:
117
+
118
+ __dso_handle = 0x0
119
+ _ctors_end = 0x0
120
+ _ctors_start = 0x0
121
+ _dtors_end = 0x0
122
+ _dtors_start = 0x0
123
+ _pc_end = 0x19d4
124
+ _pc_start = 0x930
125
+ _sp_end_DM_stack = 0x7c400
126
+ _sp_start_DM_stack = 0x7bac0
127
+
128
+ Section summary for memory 'DM_stack':
129
+
130
+ .stack File
131
+ ---------- ----------
132
+ 2368
133
+ ---------- ----------
134
+ 2368 Total
135
+
136
+ Section summary for memory 'DMb':
137
+
138
+ .bss .data .rodata File
139
+ ---------- ---------- ---------- ----------
140
+ 144 4 12 ../Release/0_0_reloadable25.o
141
+ 5 0 0 me_defs.o(/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/Release/libme.a)
142
+ ---------- ---------- ---------- ----------
143
+ 149 4 12 Total
144
+
145
+ Section summary for memory 'PM':
146
+
147
+ .text File
148
+ ---------- ----------
149
+ 4160 ../Release/0_0_reloadable25.o
150
+ ---------- ----------
151
+ 4160 Total
152
+
153
+ File summary:
154
+
155
+ ../Release/0_0_reloadable25.o
156
+ DMb 160
157
+ PM 4160
158
+
159
+ me_defs.o(/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/Release/libme.a)
160
+ DMb 5
161
+
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/3_3_reloadable25/Release/3_3_reloadable25.sdr ADDED
@@ -0,0 +1,100 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+
2
+ // File generated by bridge version V-2024.06#84922c0d9f#241219, Fri Mar 21 04:04:39 2025
3
+ // Copyright 2014-2024 Synopsys, Inc. All rights reserved.
4
+ // bridge -o../Release/0_0_reloadable25 ../Release/0_0_reloadable25.o -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/isg -g -I/usr/local/lib/python3.10/dist-packages/include -I/app/vaiml_1.3_examples/camo/./segmentation_1_4_0_fp32_combined/vaiml_par_0/0/backend -I/usr/local/lib/python3.10/site-packages/include/aie_api -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/common -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/include/common -I/usr/local/lib/python3.10/dist-packages/vitis_mllib -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/misc -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/src/ml_adf -I/app/vaiml_1.3_examples/camo/segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/. -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libcxx-lite/include -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libs/libcxx-9.0.0/include-lite -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime/include -D__AIENGINE__ -D__AIE_ARCH__=21 -DDEPLOYMENT_ELF=1 -D__LOCK_FENCE_MODE__=0 -D__IO_BUFFER_FORCE_LIGHT_WEIGHT__ -DAIE_API_EMULATE_BFLOAT16_MMUL_WITH_BFP16=1 -DAIE_OPTION_SCALAR_FLOAT_ON_VECTOR -D__tct_tgt__=241219 -c0_0_reloadable25.bcf -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/softfloat/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libcxx-lite/lib/Release_LLVM -lme -lc -lm -lc++lite -lsoftfloat -S -export-locals -iconfig extra_memories.bcf -yTM -m -fC -fS -fH +m -T +work ../Release/chesswork7302 -pme
5
+
6
+ // Release: ipp V-2024.06-TGT-241219
7
+
8
+ // Symbols in memory 'DM_bankA':
9
+ // Symbols in memory 'DM_bankAB':
10
+ // Symbols in memory 'DM_bankAC':
11
+ // Symbols in memory 'DM_bankAD':
12
+ // Symbols in memory 'DM_bankB':
13
+ // Symbols in memory 'DM_bankBC':
14
+ // Symbols in memory 'DM_bankBD':
15
+ // Symbols in memory 'DM_bankC':
16
+ // Symbols in memory 'DM_bankCD':
17
+ // Symbols in memory 'DM_bankD':
18
+ // Symbols in memory 'DM_stack':
19
+ // Symbols in memory 'DM_test':
20
+ // Symbols in memory 'DMb':
21
+ _symbol _ZN12me_primitive11control_satE 0x0007c454
22
+ _symbol _ZN12me_primitive11control_rndE 0x0007c458
23
+ _symbol add1d_params 0x0007c4c0
24
+ _symbol clip1d_params 0x0007c500
25
+ // Symbols in memory 'DMh':
26
+ // Symbols in memory 'DMh_bankA':
27
+ // Symbols in memory 'DMh_bankAB':
28
+ // Symbols in memory 'DMh_bankAC':
29
+ // Symbols in memory 'DMh_bankAD':
30
+ // Symbols in memory 'DMh_bankB':
31
+ // Symbols in memory 'DMh_bankBC':
32
+ // Symbols in memory 'DMh_bankBD':
33
+ // Symbols in memory 'DMh_bankC':
34
+ // Symbols in memory 'DMh_bankCD':
35
+ // Symbols in memory 'DMh_bankD':
36
+ // Symbols in memory 'DMh_stack':
37
+ // Symbols in memory 'DMs':
38
+ // Symbols in memory 'DMs_bankA':
39
+ // Symbols in memory 'DMs_bankAB':
40
+ // Symbols in memory 'DMs_bankAC':
41
+ // Symbols in memory 'DMs_bankAD':
42
+ // Symbols in memory 'DMs_bankB':
43
+ // Symbols in memory 'DMs_bankBC':
44
+ // Symbols in memory 'DMs_bankBD':
45
+ // Symbols in memory 'DMs_bankC':
46
+ // Symbols in memory 'DMs_bankCD':
47
+ // Symbols in memory 'DMs_bankD':
48
+ // Symbols in memory 'DMs_stack':
49
+ // Symbols in memory 'DMv':
50
+ // Symbols in memory 'DMv_bankA':
51
+ // Symbols in memory 'DMv_bankAB':
52
+ // Symbols in memory 'DMv_bankAC':
53
+ // Symbols in memory 'DMv_bankAD':
54
+ // Symbols in memory 'DMv_bankB':
55
+ // Symbols in memory 'DMv_bankBC':
56
+ // Symbols in memory 'DMv_bankBD':
57
+ // Symbols in memory 'DMv_bankC':
58
+ // Symbols in memory 'DMv_bankCD':
59
+ // Symbols in memory 'DMv_bankD':
60
+ // Symbols in memory 'DMv_stack':
61
+ // Symbols in memory 'DMw':
62
+ // Symbols in memory 'DMw_bankA':
63
+ // Symbols in memory 'DMw_bankAB':
64
+ // Symbols in memory 'DMw_bankAC':
65
+ // Symbols in memory 'DMw_bankAD':
66
+ // Symbols in memory 'DMw_bankB':
67
+ // Symbols in memory 'DMw_bankBC':
68
+ // Symbols in memory 'DMw_bankBD':
69
+ // Symbols in memory 'DMw_bankC':
70
+ // Symbols in memory 'DMw_bankCD':
71
+ // Symbols in memory 'DMw_bankD':
72
+ // Symbols in memory 'DMw_stack':
73
+ // Symbols in memory 'DMx':
74
+ // Symbols in memory 'DMx_bankA':
75
+ // Symbols in memory 'DMx_bankAB':
76
+ // Symbols in memory 'DMx_bankAC':
77
+ // Symbols in memory 'DMx_bankAD':
78
+ // Symbols in memory 'DMx_bankB':
79
+ // Symbols in memory 'DMx_bankBC':
80
+ // Symbols in memory 'DMx_bankBD':
81
+ // Symbols in memory 'DMx_bankC':
82
+ // Symbols in memory 'DMx_bankCD':
83
+ // Symbols in memory 'DMx_bankD':
84
+ // Symbols in memory 'DMx_stack':
85
+ // Symbols in memory 'PM':
86
+ _symbol _Z13kernelWrapperPPvjjjj 0x00000930
87
+ _symbol _ZN17elementwise_unaryI8bfloat1616elementwise_clipIS0_E20clip_internal_paramsIS0_EE5setupER26elementwise_unary_params_tIS4_EPKv 0x00000ad0
88
+ _symbol _ZN17elementwise_unaryI8bfloat1616elementwise_clipIS0_E20clip_internal_paramsIS0_EE3runEPS0_S6_R26elementwise_unary_params_tIS4_E 0x00000b40
89
+ _symbol _Z18superkernel_clip1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE 0x00000c40
90
+ _symbol _ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE21shared_setup_backboneER27elementwise_binary_params_tIS5_EPKv 0x00001050
91
+ _symbol _ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE5setupER27elementwise_binary_params_tIS5_EPKv 0x000010d0
92
+ _symbol _ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE3runEPS0_S7_S7_R27elementwise_binary_params_tIS5_E 0x00001140
93
+ _symbol _Z17superkernel_add1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERNS0_IS1_NS2_3outESK_EE 0x00001150
94
+ _symbol _Z11slice_hcwc8I8bfloat16EvPT_S2_R18slice_hcwc8_params 0x000013b0
95
+ _symbol _ZN12mllib_graphs17slice_adf_wrapperILi1E8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_EEvRNS2_9io_bufferIT0_NS2_9direction2inET1_EERNSD_ISE_NSF_3outET2_EERA7_Kj 0x000016c0
96
+ _symbol _Z13_b806_wrapperPPv 0x00001970
97
+ _symbol _Z13_b906_wrapperPPv 0x00001990
98
+ _symbol _Z13_b886_wrapperPPv 0x000019b0
99
+ // Symbols in memory 'PMw':
100
+ // Symbols in memory 'TM4':
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/3_3_reloadable25/Release/3_3_reloadable25.srv ADDED
The diff for this file is too large to render. See raw diff
 
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/3_3_reloadable25/Release/3_3_reloadable25.txt ADDED
The diff for this file is too large to render. See raw diff
 
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/3_3_reloadable25/scripts/3_3_reloadable25.bcf ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ _reserved DMb 0x0 0x40000
2
+
3
+ _reserved PM 0x0 0x930 //reserved for main elf
4
+
5
+ _entry_point _Z13kernelWrapperPPvjjjj
6
+ _symbol _Z13kernelWrapperPPvjjjj 0x930
7
+
8
+ _reserved DMb 0x7b280 0x800 //reserved for lcp ping-pong buffers
9
+ _reserved DMb 0x7ba80 0x40 //reserved for sync buffer
10
+ _stack DM_stack 0x7bac0 0x940 //stack for core
11
+ _reserved DMb 0x7c400 0x40 //reserved for main elf heap
12
+ //space for synopsys compiler at 0x7c440 0x880//heap
13
+ _reserved DMb 0x40000 0x3b280
14
+
15
+ _reserved DMb 0x7ccc0 0x3340
16
+ _reserved DMb 0x80000 0x80000 // And everything else the core can't see
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/3_3_reloadable25/scripts/3_3_reloadable25.prx ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ <project name="Project" processor="me">
2
+ <issinit/>
3
+ <option id="cpp.define" value="__AIENGINE__ __AIE_ARCH__=21" inherit = "1"/>
4
+ <option id="llvm.xargs" value="-fno-jump-tables -fno-discard-value-names" inherit = "1"/>
5
+ <option id="llvm.lang" value="Follow file extension"/>
6
+ <option id="bridge.cfg" value="3_3_reloadable25.bcf"/>
7
+ <option id="bridge.alibs" value=" ../Release/3_3_reloadable25.o" inherit="1" cfg="Release_LLVM"/>
8
+ <option id="cpp.include" value="&lt;XILINX_VITIS_AIETOOLS&gt;/include /app/vaiml_1.3_examples/camo/./segmentation_1_4_0_fp32_combined/vaiml_par_0/0/backend /usr/local/lib/python3.10/site-packages/include/aie_api /usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/common /usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/include/common /usr/local/lib/python3.10/dist-packages/vitis_mllib /usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/misc /usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/src/ml_adf /app/vaiml_1.3_examples/camo/segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/&lt;AIE_SRC_DIR&gt; " inherit="1"/>
9
+ <option id="project.dir" value="&lt;CONFIG&gt;/3_3_reloadable25"/>
10
+ <option id="project.name" value="3_3_reloadable25"/>
11
+ <option id="project.type" value="exe"/>
12
+ <option id="simrun.issca" value="&lt;XILINX_VITIS_AIETOOLS&gt;/bin/unwrapped/lnx64.o/aie2p/ca_udm_dbg" inherit="0"/>
13
+ </project>
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/3_3_reloadable25/src/3_3_reloadable25.cc ADDED
@@ -0,0 +1,66 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ // Automatically generated processor driver using AIEngine tool-chain
2
+
3
+ #include <stdio.h>
4
+ #include <memory>
5
+ #include <adf.h>
6
+
7
+
8
+ // Declare Kernel functions and initializers
9
+ #include "slice_adf_wrapper.cpp"
10
+ void superkernel_clip1d(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict,const unsigned int (&)[16],adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict);
11
+ void superkernel_add1d(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict,const unsigned int (&)[16],adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict,adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict);
12
+
13
+ // Declare Kernel objects and external arrays
14
+
15
+
16
+ void _b806_wrapper(void* args[])
17
+ {
18
+ mllib_graphs::slice_adf_wrapper<1, bfloat16, adf::io_buffer_config<adf::extents<>>, adf::io_buffer_config<adf::extents<>>>(
19
+ *reinterpret_cast<adf::input_buffer_conf<bfloat16, adf::bpc_sync_0d>*>(args[0]),
20
+ *reinterpret_cast<adf::output_buffer_conf<bfloat16, adf::bpc_sync_0d>*>(args[1]),
21
+ *reinterpret_cast<uint32 const(*)[7]>(args[2]));
22
+ }
23
+
24
+ void _b906_wrapper(void* args[])
25
+ {
26
+ superkernel_clip1d(
27
+ *reinterpret_cast<adf::input_buffer_conf<bfloat16, adf::bpc_sync_0d>*>(args[0]),
28
+ *reinterpret_cast<uint32 const(*)[16]>(args[2]),
29
+ *reinterpret_cast<adf::output_buffer_conf<bfloat16, adf::bpc_async_0d>*>(args[1]));
30
+ }
31
+
32
+ void _b886_wrapper(void* args[])
33
+ {
34
+ superkernel_add1d(
35
+ *reinterpret_cast<adf::input_buffer_conf<bfloat16, adf::bpc_sync_0d>*>(args[0]),
36
+ *reinterpret_cast<uint32 const(*)[16]>(args[3]),
37
+ *reinterpret_cast<adf::input_buffer_conf<bfloat16, adf::bpc_async_0d>*>(args[1]),
38
+ *reinterpret_cast<adf::output_buffer_conf<bfloat16, adf::bpc_async_0d>*>(args[2]));
39
+ }
40
+
41
+ using UniformKernelFunc = void (*)(void **);
42
+
43
+ static UniformKernelFunc g_uniformKernelFuncs[3] = {
44
+ _b806_wrapper,
45
+ _b906_wrapper,
46
+ _b886_wrapper
47
+ };
48
+
49
+ __attribute__((always_inline)) void kernelWrapper(void* args[], uint32 kernelId, uint32 numSyncIn, uint32 numAsyncIn, uint32 numSyncOut)
50
+ {
51
+ uint32 idx = 0;
52
+ reinterpret_cast<adf::_io_buffer_light_weight_generic*>(args[idx])->acquire<adf::direction::in>(numSyncIn > 0);
53
+ idx += (numSyncIn > 0) ? 1 : 0;
54
+ idx += numAsyncIn;
55
+ reinterpret_cast<adf::_io_buffer_light_weight_generic*>(args[idx])->acquire<adf::direction::out>(numSyncOut > 0);
56
+ idx += (numSyncOut > 0) ? 1 : 0;
57
+
58
+ (*(g_uniformKernelFuncs[kernelId]))(args);
59
+
60
+ idx = 0;
61
+ reinterpret_cast<adf::_io_buffer_light_weight_generic*>(args[idx])->release<adf::direction::in>(numSyncIn > 0);
62
+ idx += (numSyncIn > 0) ? 1 : 0;
63
+ idx += numAsyncIn;
64
+ reinterpret_cast<adf::_io_buffer_light_weight_generic*>(args[idx])->release<adf::direction::out>(numSyncOut > 0);
65
+ idx += (numSyncOut > 0) ? 1 : 0;
66
+ }
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/3_3_reloadable3/Release/3_3_reloadable3.calltree ADDED
@@ -0,0 +1,88 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+
2
+ // File generated by bridge version V-2024.06#84922c0d9f#241219, Fri Mar 21 03:48:01 2025
3
+ // Copyright 2014-2024 Synopsys, Inc. All rights reserved.
4
+ // bridge -o../Release/0_0_reloadable3 ../Release/0_0_reloadable3.o -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/isg -g -I/usr/local/lib/python3.10/dist-packages/include -I/app/vaiml_1.3_examples/camo/./segmentation_1_4_0_fp32_combined/vaiml_par_0/0/backend -I/usr/local/lib/python3.10/site-packages/include/aie_api -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/common -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/include/common -I/usr/local/lib/python3.10/dist-packages/vitis_mllib -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/misc -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/src/ml_adf -I/app/vaiml_1.3_examples/camo/segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/. -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libcxx-lite/include -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libs/libcxx-9.0.0/include-lite -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime/include -D__AIENGINE__ -D__AIE_ARCH__=21 -DDEPLOYMENT_ELF=1 -D__LOCK_FENCE_MODE__=0 -D__IO_BUFFER_FORCE_LIGHT_WEIGHT__ -DAIE_API_EMULATE_BFLOAT16_MMUL_WITH_BFP16=1 -DAIE_OPTION_SCALAR_FLOAT_ON_VECTOR -D__tct_tgt__=241219 -c0_0_reloadable3.bcf -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/softfloat/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libcxx-lite/lib/Release_LLVM -lme -lc -lm -lc++lite -lsoftfloat -S -export-locals -iconfig extra_memories.bcf -yTM -m -fC -fS -fH +m -T +work ../Release/chesswork3342 -pme
5
+
6
+
7
+ // Release: ipp V-2024.06-TGT-241219
8
+
9
+ _Z13kernelWrapperPPvjjjj
10
+ _Z13_b896_wrapperPPv (referenced text)
11
+ _Z14conv2d_maxpoolRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEESF_RA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE
12
+ _Z24setup_conv2d_bf16_paramsILb1ELb0EEvPKjR18conv2d_bf16_paramshh
13
+ _Z11conv2d_bf16ILh1EL5act_t0E8bfloat16S1_S1_N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_NS3_IS5_NS6_5asyncES9_SB_EELb0ELb0ELb1ELb0EEvRNS2_9io_bufferIT1_NS2_9direction2inET4_EERNSF_IT2_SI_T5_EERNSF_IT3_NSH_3outET6_EER18conv2d_bf16_params
14
+ _Z21convert_bf16_to_bfp16I8bfloat16Lb0EEvPT_PS0_RK13BfToBfpParams
15
+ _Z13_b901_wrapperPPv (referenced text)
16
+ _Z40superkernel_add1d_attribute_broadcastingRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE
17
+ _ZN31elementwise_binary_broadcastingI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_EE5setupER27elementwise_binary_params_tIS5_EPKv
18
+ _ZN18elementwise_binaryIJ8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS5_EPKv
19
+ _ZN18elementwise_binaryIJ8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS5_E
20
+ _ZN31elementwise_binary_broadcastingI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_EE5setupER27elementwise_binary_params_tIS5_E
21
+ _ZN41elementwise_binary_attribute_broadcastingI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_EE3runEPS0_S7_R27elementwise_binary_params_tIS5_E
22
+ _ZN31elementwise_binary_broadcastingI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_EE3runEPS0_S7_S7_R27elementwise_binary_params_tIS5_E
23
+ _Z13_b906_wrapperPPv (referenced text)
24
+ _Z18superkernel_clip1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE
25
+ _ZN17elementwise_unaryI8bfloat1616elementwise_clipIS0_E20clip_internal_paramsIS0_EE5setupER26elementwise_unary_params_tIS4_EPKv
26
+ _ZN17elementwise_unaryI8bfloat1616elementwise_clipIS0_E20clip_internal_paramsIS0_EE3runEPS0_S6_R26elementwise_unary_params_tIS4_E
27
+ _Z13_b881_wrapperPPv (referenced text)
28
+ _Z40superkernel_mul1d_attribute_broadcastingRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE
29
+ _ZN25elementwise_binary_sharedI8bfloat1626mul_impl_broadcasting_attrIS0_E15shared_params_tIS0_EL5act_t0EE5setupER27elementwise_binary_params_tIS4_EPKv
30
+ _ZN25elementwise_binary_sharedI8bfloat1626mul_impl_broadcasting_attrIS0_E15shared_params_tIS0_EL5act_t0EE21shared_setup_backboneER27elementwise_binary_params_tIS4_EPKv
31
+ _ZN25elementwise_binary_sharedI8bfloat1626mul_impl_broadcasting_attrIS0_E15shared_params_tIS0_EL5act_t0EE3runEPS0_S7_R27elementwise_binary_params_tIS4_E
32
+ _ZL19shared_run_backboneI8bfloat16L5act_t0EEKvPT_S4_S4_R27elementwise_binary_params_tI15shared_params_tIS3_EE
33
+ _Z13_b891_wrapperPPv (referenced text)
34
+ _Z17superkernel_mul1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERNS0_IS1_NS2_3outESK_EE
35
+ _ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS4_EPKv
36
+ _ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS4_E
37
+ _ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE3runEPS0_S6_S6_R27elementwise_binary_params_tIS4_E
38
+ _Z13_b919_wrapperPPv (referenced text)
39
+ _Z22superkernel_conv2d_dwcRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEESF_RA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE
40
+ _ZL27setup_conv2d_dw_params_bf16PKjR21conv2d_dw_bf16_paramsh
41
+ _ZN12me_primitive10udiv_dstepEjjRjS0_
42
+ _Z9conv2d_dwILh1E8bfloat16S0_S0_N3adf16io_buffer_configINS1_7extentsIJEEENS1_7locking4syncENS1_10addressing6linearENS1_6marginILj0EEEEESB_NS2_IS4_NS5_5asyncES8_SA_EEQsr3stdE9is_same_vIT0_S0_EEvRNS1_9io_bufferISE_NS1_9direction2inET3_EERNSF_IT1_SH_T4_EERNSF_IT2_NSG_3outET5_EER21conv2d_dw_bf16_params
43
+
44
+
45
+ Call tree stack and functions sizes:
46
+
47
+ stack stack stack call func func function name
48
+ desc level level desc
49
+ ----- ----- ----- ----- ----- ----- --------------------------------------------------------------
50
+ 64 320 0 0 390 11754 _Z13kernelWrapperPPvjjjj
51
+ 0 192 1 1 36 4714 _Z13_b896_wrapperPPv
52
+ 64 192 1 2 568 4678 _Z14conv2d_maxpoolRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEESF_RA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE <tail call>
53
+ 64 64 2 3 1430 1430 _Z24setup_conv2d_bf16_paramsILb1ELb0EEvPKjR18conv2d_bf16_paramshh
54
+ 128 128 2 3 2410 2680 _Z11conv2d_bf16ILh1EL5act_t0E8bfloat16S1_S1_N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_NS3_IS5_NS6_5asyncES9_SB_EELb0ELb0ELb1ELb0EEvRNS2_9io_bufferIT1_NS2_9direction2inET4_EERNSF_IT2_SI_T5_EERNSF_IT3_NSH_3outET6_EER18conv2d_bf16_params
55
+ 0 0 3 4 270 270 _Z21convert_bf16_to_bfp16I8bfloat16Lb0EEvPT_PS0_RK13BfToBfpParams
56
+ 0 192 1 1 32 1252 _Z13_b901_wrapperPPv
57
+ 64 192 1 2 488 1220 _Z40superkernel_add1d_attribute_broadcastingRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE <tail call>
58
+ 64 128 2 3 62 304 _ZN31elementwise_binary_broadcastingI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_EE5setupER27elementwise_binary_params_tIS5_EPKv
59
+ 64 64 3 4 162 186 _ZN18elementwise_binaryIJ8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS5_EPKv
60
+ 0 0 4 5 24 24 _ZN18elementwise_binaryIJ8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS5_E
61
+ 0 0 2 4 56 56 _ZN31elementwise_binary_broadcastingI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_EE5setupER27elementwise_binary_params_tIS5_E <tail call>
62
+ 128 128 2 3 114 428 _ZN41elementwise_binary_attribute_broadcastingI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_EE3runEPS0_S7_R27elementwise_binary_params_tIS5_E
63
+ 0 0 3 4 314 314 _ZN31elementwise_binary_broadcastingI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_EE3runEPS0_S7_S7_R27elementwise_binary_params_tIS5_E
64
+ 0 64 1 1 32 862 _Z13_b906_wrapperPPv
65
+ 64 64 1 2 488 830 _Z18superkernel_clip1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE <tail call>
66
+ 0 0 2 3 100 100 _ZN17elementwise_unaryI8bfloat1616elementwise_clipIS0_E20clip_internal_paramsIS0_EE5setupER26elementwise_unary_params_tIS4_EPKv
67
+ 0 0 2 3 242 242 _ZN17elementwise_unaryI8bfloat1616elementwise_clipIS0_E20clip_internal_paramsIS0_EE3runEPS0_S6_R26elementwise_unary_params_tIS4_E
68
+ 0 256 1 1 32 1394 _Z13_b881_wrapperPPv
69
+ 64 256 1 2 488 1362 _Z40superkernel_mul1d_attribute_broadcastingRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE <tail call>
70
+ 64 64 2 3 74 190 _ZN25elementwise_binary_sharedI8bfloat1626mul_impl_broadcasting_attrIS0_E15shared_params_tIS0_EL5act_t0EE5setupER27elementwise_binary_params_tIS4_EPKv
71
+ 0 0 3 4 116 116 _ZN25elementwise_binary_sharedI8bfloat1626mul_impl_broadcasting_attrIS0_E15shared_params_tIS0_EL5act_t0EE21shared_setup_backboneER27elementwise_binary_params_tIS4_EPKv
72
+ 64 192 2 3 150 684 _ZN25elementwise_binary_sharedI8bfloat1626mul_impl_broadcasting_attrIS0_E15shared_params_tIS0_EL5act_t0EE3runEPS0_S7_R27elementwise_binary_params_tIS4_E
73
+ 128 128 3 4 534 534 _ZL19shared_run_backboneI8bfloat16L5act_t0EEKvPT_S4_S4_R27elementwise_binary_params_tI15shared_params_tIS3_EE
74
+ 0 128 1 1 36 1092 _Z13_b891_wrapperPPv
75
+ 64 128 1 2 602 1056 _Z17superkernel_mul1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERNS0_IS1_NS2_3outESK_EE <tail call>
76
+ 64 64 2 3 138 162 _ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS4_EPKv
77
+ 0 0 3 4 24 24 _ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS4_E
78
+ 0 0 2 3 292 292 _ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE3runEPS0_S6_S6_R27elementwise_binary_params_tIS4_E
79
+ 0 192 1 1 36 2050 _Z13_b919_wrapperPPv
80
+ 128 192 1 2 478 2014 _Z22superkernel_conv2d_dwcRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEESF_RA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE <tail call>
81
+ 64 64 2 3 672 814 _ZL27setup_conv2d_dw_params_bf16PKjR21conv2d_dw_bf16_paramsh
82
+ 0 0 3 4 142 142 _ZN12me_primitive10udiv_dstepEjjRjS0_
83
+ 0 0 2 3 722 722 _Z9conv2d_dwILh1E8bfloat16S0_S0_N3adf16io_buffer_configINS1_7extentsIJEEENS1_7locking4syncENS1_10addressing6linearENS1_6marginILj0EEEEESB_NS2_IS4_NS5_5asyncES8_SA_EEQsr3stdE9is_same_vIT0_S0_EEvRNS1_9io_bufferISE_NS1_9direction2inET3_EERNSF_IT1_SH_T4_EERNSF_IT2_NSG_3outET5_EER21conv2d_dw_bf16_params
84
+
85
+
86
+ Maximum call level : 5
87
+ Maximum stack level: 4
88
+ Maximum stack size : 320
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/3_3_reloadable3/Release/3_3_reloadable3.cmic2 ADDED
The diff for this file is too large to render. See raw diff
 
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/3_3_reloadable3/Release/3_3_reloadable3.cmico ADDED
@@ -0,0 +1 @@
 
 
1
+ +Mdec
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/3_3_reloadable3/Release/3_3_reloadable3.lst ADDED
The diff for this file is too large to render. See raw diff
 
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/3_3_reloadable3/Release/3_3_reloadable3.map ADDED
@@ -0,0 +1,287 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+
2
+ // File generated by bridge version V-2024.06#84922c0d9f#241219, Fri Mar 21 03:48:02 2025
3
+ // Copyright 2014-2024 Synopsys, Inc. All rights reserved.
4
+ // bridge -o../Release/0_0_reloadable3 ../Release/0_0_reloadable3.o -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/isg -g -I/usr/local/lib/python3.10/dist-packages/include -I/app/vaiml_1.3_examples/camo/./segmentation_1_4_0_fp32_combined/vaiml_par_0/0/backend -I/usr/local/lib/python3.10/site-packages/include/aie_api -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/common -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/include/common -I/usr/local/lib/python3.10/dist-packages/vitis_mllib -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/misc -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/src/ml_adf -I/app/vaiml_1.3_examples/camo/segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/. -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libcxx-lite/include -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libs/libcxx-9.0.0/include-lite -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime/include -D__AIENGINE__ -D__AIE_ARCH__=21 -DDEPLOYMENT_ELF=1 -D__LOCK_FENCE_MODE__=0 -D__IO_BUFFER_FORCE_LIGHT_WEIGHT__ -DAIE_API_EMULATE_BFLOAT16_MMUL_WITH_BFP16=1 -DAIE_OPTION_SCALAR_FLOAT_ON_VECTOR -D__tct_tgt__=241219 -c0_0_reloadable3.bcf -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/softfloat/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libcxx-lite/lib/Release_LLVM -lme -lc -lm -lc++lite -lsoftfloat -S -export-locals -iconfig extra_memories.bcf -yTM -m -fC -fS -fH +m -T +work ../Release/chesswork3342 -pme
5
+
6
+ // Release: ipp V-2024.06-TGT-241219
7
+
8
+ Memory map for memory 'DM_stack':
9
+
10
+ Size = 1048576
11
+ Width = 8 bits
12
+ Offset = 0
13
+ Used = 2368
14
+
15
+ 0x0007bac0..0x0007c3ff ( 2368 items) : Stack
16
+
17
+ Memory map for memory 'DMb':
18
+
19
+ Size = 1048576
20
+ Width = 8 bits
21
+ Offset = 0
22
+ Used = 3393
23
+
24
+ 0x00000000..0x0007babf ( 506560 items) : Reserved
25
+ 0x0007bac0..0x0007c3ff ( 2368 items) : Stack
26
+ 0x0007c400..0x0007c43f ( 64 items) : Reserved
27
+ 0x0007c440..0x0007c443 ( 4 items) : ../Release/0_0_reloadable3.o::_ZL9curr_iter (Data, Local, .bss.DMb.4)
28
+ 0x0007c444..0x0007c447 ( 4 items) : ../Release/0_0_reloadable3.o::_ZL14num_depth_iter (Data, Local, .bss.DMb.4)
29
+ 0x0007c448..0x0007c44b ( 4 items) : ../Release/0_0_reloadable3.o::_ZL10depth_iter (Data, Local, .bss.DMb.4)
30
+ 0x0007c44c..0x0007c44f ( 4 items) : ../Release/0_0_reloadable3.o::_ZL11total_iters (Data, Local, .bss.DMb.4)
31
+ 0x0007c450..0x0007c453 ( 4 items) : ../Release/0_0_reloadable3.o::_ZL8core_row (Data, Local, .bss.DMb.4)
32
+ 0x0007c454..0x0007c457 ( 4 items) : ../Release/0_0_reloadable3.o::_ZL11ifm1_offset (Data, Local, .bss.DMb.4)
33
+ 0x0007c458..0x0007c45b ( 4 items) : ../Release/0_0_reloadable3.o::_ZL10ifmsv_size (Data, Local, .bss.DMb.4)
34
+ 0x0007c45c..0x0007c45f ( 4 items) : ../Release/0_0_reloadable3.o::_ZL11ifm2_offset (Data, Local, .bss.DMb.4)
35
+ 0x0007c460..0x0007c463 ( 4 items) : ../Release/0_0_reloadable3.o::_ZL8num_iter (Data, Local, .data.DMb.4)
36
+ 0x0007c464..0x0007c467 ( 4 items) : me_defs.o(/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/Release/libme.a)::_ZN12me_primitive11control_satE (Data, Global, .bss.DMb.4)
37
+ 0x0007c468..0x0007c468 ( 1 items) : me_defs.o(/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/Release/libme.a)::_ZN12me_primitive11control_rndE (Data, Global, .bss.DMb.1)
38
+ 0x0007c480..0x0007c497 ( 24 items) : ../Release/0_0_reloadable3.o::_ZL20g_uniformKernelFuncs (Data, Local, .rodata.DMb.64)
39
+
40
+ Called functions : _Z13_b896_wrapperPPv
41
+ _Z13_b901_wrapperPPv
42
+ _Z13_b906_wrapperPPv
43
+ _Z13_b881_wrapperPPv
44
+ _Z13_b891_wrapperPPv
45
+ _Z13_b919_wrapperPPv
46
+
47
+ 0x0007c4c0..0x0007c4ff ( 64 items) : ../Release/0_0_reloadable3.o::add1d_attribute_broadcasting_params (Data, Global, .bss.DMb.64)
48
+ 0x0007c500..0x0007c53f ( 64 items) : ../Release/0_0_reloadable3.o::mul1d_attribute_broadcasting_params (Data, Global, .bss.DMb.64)
49
+ 0x0007c540..0x0007c57f ( 64 items) : ../Release/0_0_reloadable3.o::mul1d_params (Data, Global, .bss.DMb.64)
50
+ 0x0007c580..0x0007c5bf ( 64 items) : ../Release/0_0_reloadable3.o::clip1d_params (Data, Global, .bss.DMb.64)
51
+ 0x0007c5c0..0x0007c77f ( 448 items) : ../Release/0_0_reloadable3.o::conv2d_params (Data, Global, .bss.DMb.64)
52
+ 0x0007c780..0x0007c87f ( 256 items) : ../Release/0_0_reloadable3.o::conv2d_dw_params (Data, Global, .bss.DMb.64)
53
+ 0x0007ccc0..0x000fffff ( 537408 items) : Reserved
54
+
55
+ Memory map for memory 'PM':
56
+
57
+ Size = 1048576
58
+ Width = 8 bits
59
+ Offset = 0
60
+ Used = 11754
61
+
62
+ 0x00000000..0x0000092f ( 2352 items) : Reserved
63
+ 0x00000930..0x00000ab5 ( 390 items) : ../Release/0_0_reloadable3.o::_Z13kernelWrapperPPvjjjj (Function, Global, .text) (stack frame size = 64)
64
+
65
+ Referenced symbols: _ZL20g_uniformKernelFuncs
66
+
67
+ 0x00000ac0..0x00001055 ( 1430 items) : ../Release/0_0_reloadable3.o::_Z24setup_conv2d_bf16_paramsILb1ELb0EEvPKjR18conv2d_bf16_paramshh (Function, Weak, .text) (stack frame size = 64)
68
+ 0x00001060..0x0000116d ( 270 items) : ../Release/0_0_reloadable3.o::_Z21convert_bf16_to_bfp16I8bfloat16Lb0EEvPT_PS0_RK13BfToBfpParams (Function, Weak, .text) (stack frame size = 0)
69
+
70
+ Referenced symbols: _ZN12me_primitive11control_rndE
71
+
72
+ 0x00001170..0x00001ad9 ( 2410 items) : ../Release/0_0_reloadable3.o::_Z11conv2d_bf16ILh1EL5act_t0E8bfloat16S1_S1_N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_NS3_IS5_NS6_5asyncES9_SB_EELb0ELb0ELb1ELb0EEvRNS2_9io_bufferIT1_NS2_9direction2inET4_EERNSF_IT2_SI_T5_EERNSF_IT3_NSH_3outET6_EER18conv2d_bf16_params (Function, Weak, .text) (stack frame size = 128)
73
+
74
+ Called functions : _Z21convert_bf16_to_bfp16I8bfloat16Lb0EEvPT_PS0_RK13BfToBfpParams
75
+
76
+ Referenced symbols: _ZN12me_primitive11control_rndE
77
+
78
+ 0x00001ae0..0x00001d17 ( 568 items) : ../Release/0_0_reloadable3.o::_Z14conv2d_maxpoolRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEESF_RA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE (Function, Global, .text) (stack frame size = 64)
79
+
80
+ Called functions : _Z24setup_conv2d_bf16_paramsILb1ELb0EEvPKjR18conv2d_bf16_paramshh
81
+ _Z11conv2d_bf16ILh1EL5act_t0E8bfloat16S1_S1_N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_NS3_IS5_NS6_5asyncES9_SB_EELb0ELb0ELb1ELb0EEvRNS2_9io_bufferIT1_NS2_9direction2inET4_EERNSF_IT2_SI_T5_EERNSF_IT3_NSH_3outET6_EER18conv2d_bf16_params
82
+
83
+ Referenced symbols: _ZL9curr_iter
84
+ conv2d_params
85
+ _ZN12me_primitive11control_rndE
86
+ _ZN12me_primitive11control_satE
87
+ _ZL14num_depth_iter
88
+ _ZL8num_iter
89
+ _ZL10depth_iter
90
+ _ZL11total_iters
91
+
92
+ 0x00001d20..0x00001d37 ( 24 items) : ../Release/0_0_reloadable3.o::_ZN18elementwise_binaryIJ8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS5_E (Function, Weak, .text) (stack frame size = 0)
93
+ 0x00001d40..0x00001de1 ( 162 items) : ../Release/0_0_reloadable3.o::_ZN18elementwise_binaryIJ8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS5_EPKv (Function, Weak, .text) (stack frame size = 64)
94
+
95
+ Called functions : _ZN18elementwise_binaryIJ8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS5_E
96
+
97
+ 0x00001df0..0x00001e27 ( 56 items) : ../Release/0_0_reloadable3.o::_ZN31elementwise_binary_broadcastingI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_EE5setupER27elementwise_binary_params_tIS5_E (Function, Weak, .text) (stack frame size = 0)
98
+ 0x00001e30..0x00001e6d ( 62 items) : ../Release/0_0_reloadable3.o::_ZN31elementwise_binary_broadcastingI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_EE5setupER27elementwise_binary_params_tIS5_EPKv (Function, Weak, .text) (stack frame size = 64)
99
+
100
+ Called functions : _ZN18elementwise_binaryIJ8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS5_EPKv
101
+ _ZN31elementwise_binary_broadcastingI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_EE5setupER27elementwise_binary_params_tIS5_E
102
+
103
+ 0x00001e70..0x00001fa9 ( 314 items) : ../Release/0_0_reloadable3.o::_ZN31elementwise_binary_broadcastingI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_EE3runEPS0_S7_S7_R27elementwise_binary_params_tIS5_E (Function, Weak, .text) (stack frame size = 0)
104
+
105
+ Referenced symbols: _ZN12me_primitive11control_rndE
106
+
107
+ 0x00001fb0..0x00002021 ( 114 items) : ../Release/0_0_reloadable3.o::_ZN41elementwise_binary_attribute_broadcastingI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_EE3runEPS0_S7_R27elementwise_binary_params_tIS5_E (Function, Weak, .text) (stack frame size = 128)
108
+
109
+ Called functions : _ZN31elementwise_binary_broadcastingI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_EE3runEPS0_S7_S7_R27elementwise_binary_params_tIS5_E
110
+
111
+ 0x00002030..0x00002217 ( 488 items) : ../Release/0_0_reloadable3.o::_Z40superkernel_add1d_attribute_broadcastingRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE (Function, Global, .text) (stack frame size = 64)
112
+
113
+ Called functions : _ZN31elementwise_binary_broadcastingI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_EE5setupER27elementwise_binary_params_tIS5_EPKv
114
+ _ZN41elementwise_binary_attribute_broadcastingI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_EE3runEPS0_S7_R27elementwise_binary_params_tIS5_E
115
+
116
+ Referenced symbols: _ZL9curr_iter
117
+ _ZL8core_row
118
+ add1d_attribute_broadcasting_params
119
+ _ZN12me_primitive11control_rndE
120
+ _ZN12me_primitive11control_satE
121
+ _ZL11ifm1_offset
122
+ _ZL8num_iter
123
+
124
+ 0x00002220..0x00002283 ( 100 items) : ../Release/0_0_reloadable3.o::_ZN17elementwise_unaryI8bfloat1616elementwise_clipIS0_E20clip_internal_paramsIS0_EE5setupER26elementwise_unary_params_tIS4_EPKv (Function, Weak, .text) (stack frame size = 0)
125
+ 0x00002290..0x00002381 ( 242 items) : ../Release/0_0_reloadable3.o::_ZN17elementwise_unaryI8bfloat1616elementwise_clipIS0_E20clip_internal_paramsIS0_EE3runEPS0_S6_R26elementwise_unary_params_tIS4_E (Function, Weak, .text) (stack frame size = 0)
126
+ 0x00002390..0x00002577 ( 488 items) : ../Release/0_0_reloadable3.o::_Z18superkernel_clip1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE (Function, Global, .text) (stack frame size = 64)
127
+
128
+ Called functions : _ZN17elementwise_unaryI8bfloat1616elementwise_clipIS0_E20clip_internal_paramsIS0_EE5setupER26elementwise_unary_params_tIS4_EPKv
129
+ _ZN17elementwise_unaryI8bfloat1616elementwise_clipIS0_E20clip_internal_paramsIS0_EE3runEPS0_S6_R26elementwise_unary_params_tIS4_E
130
+
131
+ Referenced symbols: _ZL9curr_iter
132
+ _ZL8core_row
133
+ clip1d_params
134
+ _ZN12me_primitive11control_rndE
135
+ _ZN12me_primitive11control_satE
136
+ _ZL11ifm1_offset
137
+ _ZL8num_iter
138
+
139
+ 0x00002580..0x000025f3 ( 116 items) : ../Release/0_0_reloadable3.o::_ZN25elementwise_binary_sharedI8bfloat1626mul_impl_broadcasting_attrIS0_E15shared_params_tIS0_EL5act_t0EE21shared_setup_backboneER27elementwise_binary_params_tIS4_EPKv (Function, Weak, .text) (stack frame size = 0)
140
+ 0x00002600..0x00002649 ( 74 items) : ../Release/0_0_reloadable3.o::_ZN25elementwise_binary_sharedI8bfloat1626mul_impl_broadcasting_attrIS0_E15shared_params_tIS0_EL5act_t0EE5setupER27elementwise_binary_params_tIS4_EPKv (Function, Weak, .text) (stack frame size = 64)
141
+
142
+ Called functions : _ZN25elementwise_binary_sharedI8bfloat1626mul_impl_broadcasting_attrIS0_E15shared_params_tIS0_EL5act_t0EE21shared_setup_backboneER27elementwise_binary_params_tIS4_EPKv
143
+
144
+ 0x00002650..0x00002865 ( 534 items) : ../Release/0_0_reloadable3.o::_ZL19shared_run_backboneI8bfloat16L5act_t0EEKvPT_S4_S4_R27elementwise_binary_params_tI15shared_params_tIS3_EE (Function, Local, .text) (stack frame size = 128)
145
+
146
+ Referenced symbols: _ZN12me_primitive11control_rndE
147
+
148
+ 0x00002870..0x00002905 ( 150 items) : ../Release/0_0_reloadable3.o::_ZN25elementwise_binary_sharedI8bfloat1626mul_impl_broadcasting_attrIS0_E15shared_params_tIS0_EL5act_t0EE3runEPS0_S7_R27elementwise_binary_params_tIS4_E (Function, Weak, .text) (stack frame size = 64)
149
+
150
+ Called functions : _ZL19shared_run_backboneI8bfloat16L5act_t0EEKvPT_S4_S4_R27elementwise_binary_params_tI15shared_params_tIS3_EE
151
+
152
+ 0x00002910..0x00002af7 ( 488 items) : ../Release/0_0_reloadable3.o::_Z40superkernel_mul1d_attribute_broadcastingRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE (Function, Global, .text) (stack frame size = 64)
153
+
154
+ Called functions : _ZN25elementwise_binary_sharedI8bfloat1626mul_impl_broadcasting_attrIS0_E15shared_params_tIS0_EL5act_t0EE5setupER27elementwise_binary_params_tIS4_EPKv
155
+ _ZN25elementwise_binary_sharedI8bfloat1626mul_impl_broadcasting_attrIS0_E15shared_params_tIS0_EL5act_t0EE3runEPS0_S7_R27elementwise_binary_params_tIS4_E
156
+
157
+ Referenced symbols: _ZL9curr_iter
158
+ _ZL8core_row
159
+ mul1d_attribute_broadcasting_params
160
+ _ZN12me_primitive11control_rndE
161
+ _ZN12me_primitive11control_satE
162
+ _ZL11ifm1_offset
163
+ _ZL8num_iter
164
+
165
+ 0x00002b00..0x00002b17 ( 24 items) : ../Release/0_0_reloadable3.o::_ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS4_E (Function, Weak, .text) (stack frame size = 0)
166
+ 0x00002b20..0x00002ba9 ( 138 items) : ../Release/0_0_reloadable3.o::_ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS4_EPKv (Function, Weak, .text) (stack frame size = 64)
167
+
168
+ Called functions : _ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS4_E
169
+
170
+ 0x00002bb0..0x00002cd3 ( 292 items) : ../Release/0_0_reloadable3.o::_ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE3runEPS0_S6_S6_R27elementwise_binary_params_tIS4_E (Function, Weak, .text) (stack frame size = 0)
171
+
172
+ Referenced symbols: _ZN12me_primitive11control_rndE
173
+
174
+ 0x00002ce0..0x00002f39 ( 602 items) : ../Release/0_0_reloadable3.o::_Z17superkernel_mul1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERNS0_IS1_NS2_3outESK_EE (Function, Global, .text) (stack frame size = 64)
175
+
176
+ Called functions : _ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS4_EPKv
177
+ _ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE3runEPS0_S6_S6_R27elementwise_binary_params_tIS4_E
178
+
179
+ Referenced symbols: _ZL9curr_iter
180
+ _ZL8core_row
181
+ mul1d_params
182
+ _ZN12me_primitive11control_rndE
183
+ _ZN12me_primitive11control_satE
184
+ _ZL11ifm1_offset
185
+ _ZL11ifm2_offset
186
+ _ZL8num_iter
187
+
188
+ 0x00002f40..0x000031df ( 672 items) : ../Release/0_0_reloadable3.o::_ZL27setup_conv2d_dw_params_bf16PKjR21conv2d_dw_bf16_paramsh (Function, Local, .text) (stack frame size = 64)
189
+
190
+ Called functions : _ZN12me_primitive10udiv_dstepEjjRjS0_
191
+
192
+ Referenced symbols: conv2d_dw_params
193
+ _ZN12me_primitive11control_rndE
194
+
195
+ 0x000031e0..0x000034b1 ( 722 items) : ../Release/0_0_reloadable3.o::_Z9conv2d_dwILh1E8bfloat16S0_S0_N3adf16io_buffer_configINS1_7extentsIJEEENS1_7locking4syncENS1_10addressing6linearENS1_6marginILj0EEEEESB_NS2_IS4_NS5_5asyncES8_SA_EEQsr3stdE9is_same_vIT0_S0_EEvRNS1_9io_bufferISE_NS1_9direction2inET3_EERNSF_IT1_SH_T4_EERNSF_IT2_NSG_3outET5_EER21conv2d_dw_bf16_params (Function, Weak, .text) (stack frame size = 0)
196
+
197
+ Referenced symbols: _ZN12me_primitive11control_rndE
198
+
199
+ 0x000034c0..0x0000369d ( 478 items) : ../Release/0_0_reloadable3.o::_Z22superkernel_conv2d_dwcRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEESF_RA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE (Function, Global, .text) (stack frame size = 128)
200
+
201
+ Called functions : _ZL27setup_conv2d_dw_params_bf16PKjR21conv2d_dw_bf16_paramsh
202
+ _Z9conv2d_dwILh1E8bfloat16S0_S0_N3adf16io_buffer_configINS1_7extentsIJEEENS1_7locking4syncENS1_10addressing6linearENS1_6marginILj0EEEEESB_NS2_IS4_NS5_5asyncES8_SA_EEQsr3stdE9is_same_vIT0_S0_EEvRNS1_9io_bufferISE_NS1_9direction2inET3_EERNSF_IT1_SH_T4_EERNSF_IT2_NSG_3outET5_EER21conv2d_dw_bf16_params
203
+
204
+ Referenced symbols: _ZL9curr_iter
205
+ _ZL8core_row
206
+ _ZN12me_primitive11control_rndE
207
+ _ZN12me_primitive11control_satE
208
+ _ZL8num_iter
209
+ _ZL10ifmsv_size
210
+ conv2d_dw_params
211
+
212
+ 0x000036a0..0x000036c3 ( 36 items) : ../Release/0_0_reloadable3.o::_Z13_b896_wrapperPPv (Function, Global, .text) (stack frame size = 0)
213
+
214
+ Called functions : _Z14conv2d_maxpoolRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEESF_RA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE
215
+
216
+ 0x000036d0..0x000036ef ( 32 items) : ../Release/0_0_reloadable3.o::_Z13_b901_wrapperPPv (Function, Global, .text) (stack frame size = 0)
217
+
218
+ Called functions : _Z40superkernel_add1d_attribute_broadcastingRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE
219
+
220
+ 0x000036f0..0x0000370f ( 32 items) : ../Release/0_0_reloadable3.o::_Z13_b906_wrapperPPv (Function, Global, .text) (stack frame size = 0)
221
+
222
+ Called functions : _Z18superkernel_clip1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE
223
+
224
+ 0x00003710..0x0000372f ( 32 items) : ../Release/0_0_reloadable3.o::_Z13_b881_wrapperPPv (Function, Global, .text) (stack frame size = 0)
225
+
226
+ Called functions : _Z40superkernel_mul1d_attribute_broadcastingRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE
227
+
228
+ 0x00003730..0x00003753 ( 36 items) : ../Release/0_0_reloadable3.o::_Z13_b891_wrapperPPv (Function, Global, .text) (stack frame size = 0)
229
+
230
+ Called functions : _Z17superkernel_mul1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERNS0_IS1_NS2_3outESK_EE
231
+
232
+ 0x00003760..0x00003783 ( 36 items) : ../Release/0_0_reloadable3.o::_Z13_b919_wrapperPPv (Function, Global, .text) (stack frame size = 0)
233
+
234
+ Called functions : _Z22superkernel_conv2d_dwcRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEESF_RA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE
235
+
236
+ 0x00003790..0x0000381d ( 142 items) : me_div.o(/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/Release/libme.a)::_ZN12me_primitive10udiv_dstepEjjRjS0_ (Function, Global, .text) (stack frame size = 0)
237
+
238
+ External symbols:
239
+
240
+ __dso_handle = 0x0
241
+ _ctors_end = 0x0
242
+ _ctors_start = 0x0
243
+ _dtors_end = 0x0
244
+ _dtors_start = 0x0
245
+ _pc_end = 0x381e
246
+ _pc_start = 0x930
247
+ _sp_end_DM_stack = 0x7c400
248
+ _sp_start_DM_stack = 0x7bac0
249
+
250
+ Section summary for memory 'DM_stack':
251
+
252
+ .stack File
253
+ ---------- ----------
254
+ 2368
255
+ ---------- ----------
256
+ 2368 Total
257
+
258
+ Section summary for memory 'DMb':
259
+
260
+ .bss .data .rodata File
261
+ ---------- ---------- ---------- ----------
262
+ 992 4 24 ../Release/0_0_reloadable3.o
263
+ 5 0 0 me_defs.o(/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/Release/libme.a)
264
+ ---------- ---------- ---------- ----------
265
+ 997 4 24 Total
266
+
267
+ Section summary for memory 'PM':
268
+
269
+ .text File
270
+ ---------- ----------
271
+ 11612 ../Release/0_0_reloadable3.o
272
+ 142 me_div.o(/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/Release/libme.a)
273
+ ---------- ----------
274
+ 11754 Total
275
+
276
+ File summary:
277
+
278
+ ../Release/0_0_reloadable3.o
279
+ DMb 1020
280
+ PM 11612
281
+
282
+ me_defs.o(/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/Release/libme.a)
283
+ DMb 5
284
+
285
+ me_div.o(/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/Release/libme.a)
286
+ PM 142
287
+
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/3_3_reloadable3/Release/3_3_reloadable3.sdr ADDED
@@ -0,0 +1,123 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+
2
+ // File generated by bridge version V-2024.06#84922c0d9f#241219, Fri Mar 21 03:48:02 2025
3
+ // Copyright 2014-2024 Synopsys, Inc. All rights reserved.
4
+ // bridge -o../Release/0_0_reloadable3 ../Release/0_0_reloadable3.o -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/isg -g -I/usr/local/lib/python3.10/dist-packages/include -I/app/vaiml_1.3_examples/camo/./segmentation_1_4_0_fp32_combined/vaiml_par_0/0/backend -I/usr/local/lib/python3.10/site-packages/include/aie_api -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/common -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/include/common -I/usr/local/lib/python3.10/dist-packages/vitis_mllib -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/misc -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/src/ml_adf -I/app/vaiml_1.3_examples/camo/segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/. -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libcxx-lite/include -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libs/libcxx-9.0.0/include-lite -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime/include -D__AIENGINE__ -D__AIE_ARCH__=21 -DDEPLOYMENT_ELF=1 -D__LOCK_FENCE_MODE__=0 -D__IO_BUFFER_FORCE_LIGHT_WEIGHT__ -DAIE_API_EMULATE_BFLOAT16_MMUL_WITH_BFP16=1 -DAIE_OPTION_SCALAR_FLOAT_ON_VECTOR -D__tct_tgt__=241219 -c0_0_reloadable3.bcf -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/softfloat/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libcxx-lite/lib/Release_LLVM -lme -lc -lm -lc++lite -lsoftfloat -S -export-locals -iconfig extra_memories.bcf -yTM -m -fC -fS -fH +m -T +work ../Release/chesswork3342 -pme
5
+
6
+ // Release: ipp V-2024.06-TGT-241219
7
+
8
+ // Symbols in memory 'DM_bankA':
9
+ // Symbols in memory 'DM_bankAB':
10
+ // Symbols in memory 'DM_bankAC':
11
+ // Symbols in memory 'DM_bankAD':
12
+ // Symbols in memory 'DM_bankB':
13
+ // Symbols in memory 'DM_bankBC':
14
+ // Symbols in memory 'DM_bankBD':
15
+ // Symbols in memory 'DM_bankC':
16
+ // Symbols in memory 'DM_bankCD':
17
+ // Symbols in memory 'DM_bankD':
18
+ // Symbols in memory 'DM_stack':
19
+ // Symbols in memory 'DM_test':
20
+ // Symbols in memory 'DMb':
21
+ _symbol _ZN12me_primitive11control_satE 0x0007c464
22
+ _symbol _ZN12me_primitive11control_rndE 0x0007c468
23
+ _symbol add1d_attribute_broadcasting_params 0x0007c4c0
24
+ _symbol mul1d_attribute_broadcasting_params 0x0007c500
25
+ _symbol mul1d_params 0x0007c540
26
+ _symbol clip1d_params 0x0007c580
27
+ _symbol conv2d_params 0x0007c5c0
28
+ _symbol conv2d_dw_params 0x0007c780
29
+ // Symbols in memory 'DMh':
30
+ // Symbols in memory 'DMh_bankA':
31
+ // Symbols in memory 'DMh_bankAB':
32
+ // Symbols in memory 'DMh_bankAC':
33
+ // Symbols in memory 'DMh_bankAD':
34
+ // Symbols in memory 'DMh_bankB':
35
+ // Symbols in memory 'DMh_bankBC':
36
+ // Symbols in memory 'DMh_bankBD':
37
+ // Symbols in memory 'DMh_bankC':
38
+ // Symbols in memory 'DMh_bankCD':
39
+ // Symbols in memory 'DMh_bankD':
40
+ // Symbols in memory 'DMh_stack':
41
+ // Symbols in memory 'DMs':
42
+ // Symbols in memory 'DMs_bankA':
43
+ // Symbols in memory 'DMs_bankAB':
44
+ // Symbols in memory 'DMs_bankAC':
45
+ // Symbols in memory 'DMs_bankAD':
46
+ // Symbols in memory 'DMs_bankB':
47
+ // Symbols in memory 'DMs_bankBC':
48
+ // Symbols in memory 'DMs_bankBD':
49
+ // Symbols in memory 'DMs_bankC':
50
+ // Symbols in memory 'DMs_bankCD':
51
+ // Symbols in memory 'DMs_bankD':
52
+ // Symbols in memory 'DMs_stack':
53
+ // Symbols in memory 'DMv':
54
+ // Symbols in memory 'DMv_bankA':
55
+ // Symbols in memory 'DMv_bankAB':
56
+ // Symbols in memory 'DMv_bankAC':
57
+ // Symbols in memory 'DMv_bankAD':
58
+ // Symbols in memory 'DMv_bankB':
59
+ // Symbols in memory 'DMv_bankBC':
60
+ // Symbols in memory 'DMv_bankBD':
61
+ // Symbols in memory 'DMv_bankC':
62
+ // Symbols in memory 'DMv_bankCD':
63
+ // Symbols in memory 'DMv_bankD':
64
+ // Symbols in memory 'DMv_stack':
65
+ // Symbols in memory 'DMw':
66
+ // Symbols in memory 'DMw_bankA':
67
+ // Symbols in memory 'DMw_bankAB':
68
+ // Symbols in memory 'DMw_bankAC':
69
+ // Symbols in memory 'DMw_bankAD':
70
+ // Symbols in memory 'DMw_bankB':
71
+ // Symbols in memory 'DMw_bankBC':
72
+ // Symbols in memory 'DMw_bankBD':
73
+ // Symbols in memory 'DMw_bankC':
74
+ // Symbols in memory 'DMw_bankCD':
75
+ // Symbols in memory 'DMw_bankD':
76
+ // Symbols in memory 'DMw_stack':
77
+ // Symbols in memory 'DMx':
78
+ // Symbols in memory 'DMx_bankA':
79
+ // Symbols in memory 'DMx_bankAB':
80
+ // Symbols in memory 'DMx_bankAC':
81
+ // Symbols in memory 'DMx_bankAD':
82
+ // Symbols in memory 'DMx_bankB':
83
+ // Symbols in memory 'DMx_bankBC':
84
+ // Symbols in memory 'DMx_bankBD':
85
+ // Symbols in memory 'DMx_bankC':
86
+ // Symbols in memory 'DMx_bankCD':
87
+ // Symbols in memory 'DMx_bankD':
88
+ // Symbols in memory 'DMx_stack':
89
+ // Symbols in memory 'PM':
90
+ _symbol _Z13kernelWrapperPPvjjjj 0x00000930
91
+ _symbol _Z24setup_conv2d_bf16_paramsILb1ELb0EEvPKjR18conv2d_bf16_paramshh 0x00000ac0
92
+ _symbol _Z21convert_bf16_to_bfp16I8bfloat16Lb0EEvPT_PS0_RK13BfToBfpParams 0x00001060
93
+ _symbol _Z11conv2d_bf16ILh1EL5act_t0E8bfloat16S1_S1_N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_NS3_IS5_NS6_5asyncES9_SB_EELb0ELb0ELb1ELb0EEvRNS2_9io_bufferIT1_NS2_9direction2inET4_EERNSF_IT2_SI_T5_EERNSF_IT3_NSH_3outET6_EER18conv2d_bf16_params 0x00001170
94
+ _symbol _Z14conv2d_maxpoolRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEESF_RA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE 0x00001ae0
95
+ _symbol _ZN18elementwise_binaryIJ8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS5_E 0x00001d20
96
+ _symbol _ZN18elementwise_binaryIJ8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS5_EPKv 0x00001d40
97
+ _symbol _ZN31elementwise_binary_broadcastingI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_EE5setupER27elementwise_binary_params_tIS5_E 0x00001df0
98
+ _symbol _ZN31elementwise_binary_broadcastingI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_EE5setupER27elementwise_binary_params_tIS5_EPKv 0x00001e30
99
+ _symbol _ZN31elementwise_binary_broadcastingI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_EE3runEPS0_S7_S7_R27elementwise_binary_params_tIS5_E 0x00001e70
100
+ _symbol _ZN41elementwise_binary_attribute_broadcastingI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_EE3runEPS0_S7_R27elementwise_binary_params_tIS5_E 0x00001fb0
101
+ _symbol _Z40superkernel_add1d_attribute_broadcastingRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE 0x00002030
102
+ _symbol _ZN17elementwise_unaryI8bfloat1616elementwise_clipIS0_E20clip_internal_paramsIS0_EE5setupER26elementwise_unary_params_tIS4_EPKv 0x00002220
103
+ _symbol _ZN17elementwise_unaryI8bfloat1616elementwise_clipIS0_E20clip_internal_paramsIS0_EE3runEPS0_S6_R26elementwise_unary_params_tIS4_E 0x00002290
104
+ _symbol _Z18superkernel_clip1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE 0x00002390
105
+ _symbol _ZN25elementwise_binary_sharedI8bfloat1626mul_impl_broadcasting_attrIS0_E15shared_params_tIS0_EL5act_t0EE21shared_setup_backboneER27elementwise_binary_params_tIS4_EPKv 0x00002580
106
+ _symbol _ZN25elementwise_binary_sharedI8bfloat1626mul_impl_broadcasting_attrIS0_E15shared_params_tIS0_EL5act_t0EE5setupER27elementwise_binary_params_tIS4_EPKv 0x00002600
107
+ _symbol _ZN25elementwise_binary_sharedI8bfloat1626mul_impl_broadcasting_attrIS0_E15shared_params_tIS0_EL5act_t0EE3runEPS0_S7_R27elementwise_binary_params_tIS4_E 0x00002870
108
+ _symbol _Z40superkernel_mul1d_attribute_broadcastingRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE 0x00002910
109
+ _symbol _ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS4_E 0x00002b00
110
+ _symbol _ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS4_EPKv 0x00002b20
111
+ _symbol _ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE3runEPS0_S6_S6_R27elementwise_binary_params_tIS4_E 0x00002bb0
112
+ _symbol _Z17superkernel_mul1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERNS0_IS1_NS2_3outESK_EE 0x00002ce0
113
+ _symbol _Z9conv2d_dwILh1E8bfloat16S0_S0_N3adf16io_buffer_configINS1_7extentsIJEEENS1_7locking4syncENS1_10addressing6linearENS1_6marginILj0EEEEESB_NS2_IS4_NS5_5asyncES8_SA_EEQsr3stdE9is_same_vIT0_S0_EEvRNS1_9io_bufferISE_NS1_9direction2inET3_EERNSF_IT1_SH_T4_EERNSF_IT2_NSG_3outET5_EER21conv2d_dw_bf16_params 0x000031e0
114
+ _symbol _Z22superkernel_conv2d_dwcRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEESF_RA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE 0x000034c0
115
+ _symbol _Z13_b896_wrapperPPv 0x000036a0
116
+ _symbol _Z13_b901_wrapperPPv 0x000036d0
117
+ _symbol _Z13_b906_wrapperPPv 0x000036f0
118
+ _symbol _Z13_b881_wrapperPPv 0x00003710
119
+ _symbol _Z13_b891_wrapperPPv 0x00003730
120
+ _symbol _Z13_b919_wrapperPPv 0x00003760
121
+ _symbol _ZN12me_primitive10udiv_dstepEjjRjS0_ 0x00003790
122
+ // Symbols in memory 'PMw':
123
+ // Symbols in memory 'TM4':
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/3_3_reloadable3/Release/3_3_reloadable3.srv ADDED
The diff for this file is too large to render. See raw diff
 
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/3_3_reloadable3/Release/3_3_reloadable3.txt ADDED
The diff for this file is too large to render. See raw diff
 
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/3_3_reloadable3/scripts/3_3_reloadable3.bcf ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ _reserved DMb 0x0 0x40000
2
+
3
+ _reserved PM 0x0 0x930 //reserved for main elf
4
+
5
+ _entry_point _Z13kernelWrapperPPvjjjj
6
+ _symbol _Z13kernelWrapperPPvjjjj 0x930
7
+
8
+ _reserved DMb 0x7b280 0x800 //reserved for lcp ping-pong buffers
9
+ _reserved DMb 0x7ba80 0x40 //reserved for sync buffer
10
+ _stack DM_stack 0x7bac0 0x940 //stack for core
11
+ _reserved DMb 0x7c400 0x40 //reserved for main elf heap
12
+ //space for synopsys compiler at 0x7c440 0x880//heap
13
+ _reserved DMb 0x40000 0x3b280
14
+
15
+ _reserved DMb 0x7ccc0 0x3340
16
+ _reserved DMb 0x80000 0x80000 // And everything else the core can't see
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/3_3_reloadable3/scripts/3_3_reloadable3.prx ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ <project name="Project" processor="me">
2
+ <issinit/>
3
+ <option id="cpp.define" value="__AIENGINE__ __AIE_ARCH__=21" inherit = "1"/>
4
+ <option id="llvm.xargs" value="-fno-jump-tables -fno-discard-value-names" inherit = "1"/>
5
+ <option id="llvm.lang" value="Follow file extension"/>
6
+ <option id="bridge.cfg" value="3_3_reloadable3.bcf"/>
7
+ <option id="bridge.alibs" value=" ../Release/3_3_reloadable3.o" inherit="1" cfg="Release_LLVM"/>
8
+ <option id="cpp.include" value="&lt;XILINX_VITIS_AIETOOLS&gt;/include /app/vaiml_1.3_examples/camo/./segmentation_1_4_0_fp32_combined/vaiml_par_0/0/backend /usr/local/lib/python3.10/site-packages/include/aie_api /usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/common /usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/include/common /usr/local/lib/python3.10/dist-packages/vitis_mllib /usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/misc /usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/src/ml_adf /app/vaiml_1.3_examples/camo/segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/&lt;AIE_SRC_DIR&gt; " inherit="1"/>
9
+ <option id="project.dir" value="&lt;CONFIG&gt;/3_3_reloadable3"/>
10
+ <option id="project.name" value="3_3_reloadable3"/>
11
+ <option id="project.type" value="exe"/>
12
+ <option id="simrun.issca" value="&lt;XILINX_VITIS_AIETOOLS&gt;/bin/unwrapped/lnx64.o/aie2p/ca_udm_dbg" inherit="0"/>
13
+ </project>
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/3_3_reloadable3/src/3_3_reloadable3.cc ADDED
@@ -0,0 +1,98 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ // Automatically generated processor driver using AIEngine tool-chain
2
+
3
+ #include <stdio.h>
4
+ #include <memory>
5
+ #include <adf.h>
6
+
7
+
8
+ // Declare Kernel functions and initializers
9
+ void conv2d_maxpool(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict,adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict,const unsigned int (&)[16],adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict);
10
+ void superkernel_add1d_attribute_broadcasting(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict,const unsigned int (&)[16],adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict);
11
+ void superkernel_clip1d(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict,const unsigned int (&)[16],adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict);
12
+ void superkernel_mul1d_attribute_broadcasting(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict,const unsigned int (&)[16],adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict);
13
+ void superkernel_mul1d(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict,const unsigned int (&)[16],adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict,adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict);
14
+ void superkernel_conv2d_dwc(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict,adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict,const unsigned int (&)[16],adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict);
15
+
16
+ // Declare Kernel objects and external arrays
17
+
18
+
19
+ void _b896_wrapper(void* args[])
20
+ {
21
+ conv2d_maxpool(
22
+ *reinterpret_cast<adf::input_buffer_conf<bfloat16, adf::bpc_sync_0d>*>(args[0]),
23
+ *reinterpret_cast<adf::input_buffer_conf<bfloat16, adf::bpc_sync_0d>*>(args[1]),
24
+ *reinterpret_cast<uint32 const(*)[16]>(args[3]),
25
+ *reinterpret_cast<adf::output_buffer_conf<bfloat16, adf::bpc_async_0d>*>(args[2]));
26
+ }
27
+
28
+ void _b901_wrapper(void* args[])
29
+ {
30
+ superkernel_add1d_attribute_broadcasting(
31
+ *reinterpret_cast<adf::input_buffer_conf<bfloat16, adf::bpc_sync_0d>*>(args[0]),
32
+ *reinterpret_cast<uint32 const(*)[16]>(args[2]),
33
+ *reinterpret_cast<adf::output_buffer_conf<bfloat16, adf::bpc_async_0d>*>(args[1]));
34
+ }
35
+
36
+ void _b906_wrapper(void* args[])
37
+ {
38
+ superkernel_clip1d(
39
+ *reinterpret_cast<adf::input_buffer_conf<bfloat16, adf::bpc_sync_0d>*>(args[0]),
40
+ *reinterpret_cast<uint32 const(*)[16]>(args[2]),
41
+ *reinterpret_cast<adf::output_buffer_conf<bfloat16, adf::bpc_async_0d>*>(args[1]));
42
+ }
43
+
44
+ void _b881_wrapper(void* args[])
45
+ {
46
+ superkernel_mul1d_attribute_broadcasting(
47
+ *reinterpret_cast<adf::input_buffer_conf<bfloat16, adf::bpc_sync_0d>*>(args[0]),
48
+ *reinterpret_cast<uint32 const(*)[16]>(args[2]),
49
+ *reinterpret_cast<adf::output_buffer_conf<bfloat16, adf::bpc_async_0d>*>(args[1]));
50
+ }
51
+
52
+ void _b891_wrapper(void* args[])
53
+ {
54
+ superkernel_mul1d(
55
+ *reinterpret_cast<adf::input_buffer_conf<bfloat16, adf::bpc_sync_0d>*>(args[0]),
56
+ *reinterpret_cast<uint32 const(*)[16]>(args[3]),
57
+ *reinterpret_cast<adf::input_buffer_conf<bfloat16, adf::bpc_async_0d>*>(args[1]),
58
+ *reinterpret_cast<adf::output_buffer_conf<bfloat16, adf::bpc_async_0d>*>(args[2]));
59
+ }
60
+
61
+ void _b919_wrapper(void* args[])
62
+ {
63
+ superkernel_conv2d_dwc(
64
+ *reinterpret_cast<adf::input_buffer_conf<bfloat16, adf::bpc_sync_0d>*>(args[0]),
65
+ *reinterpret_cast<adf::input_buffer_conf<bfloat16, adf::bpc_sync_0d>*>(args[1]),
66
+ *reinterpret_cast<uint32 const(*)[16]>(args[3]),
67
+ *reinterpret_cast<adf::output_buffer_conf<bfloat16, adf::bpc_async_0d>*>(args[2]));
68
+ }
69
+
70
+ using UniformKernelFunc = void (*)(void **);
71
+
72
+ static UniformKernelFunc g_uniformKernelFuncs[6] = {
73
+ _b896_wrapper,
74
+ _b901_wrapper,
75
+ _b906_wrapper,
76
+ _b881_wrapper,
77
+ _b891_wrapper,
78
+ _b919_wrapper
79
+ };
80
+
81
+ __attribute__((always_inline)) void kernelWrapper(void* args[], uint32 kernelId, uint32 numSyncIn, uint32 numAsyncIn, uint32 numSyncOut)
82
+ {
83
+ uint32 idx = 0;
84
+ reinterpret_cast<adf::_io_buffer_light_weight_generic*>(args[idx])->acquire<adf::direction::in>(numSyncIn > 0);
85
+ idx += (numSyncIn > 0) ? 1 : 0;
86
+ reinterpret_cast<adf::_io_buffer_light_weight_generic*>(args[idx])->acquire<adf::direction::in>(numSyncIn > 1);
87
+ idx += (numSyncIn > 1) ? 1 : 0;
88
+ idx += numAsyncIn;
89
+
90
+ (*(g_uniformKernelFuncs[kernelId]))(args);
91
+
92
+ idx = 0;
93
+ reinterpret_cast<adf::_io_buffer_light_weight_generic*>(args[idx])->release<adf::direction::in>(numSyncIn > 0);
94
+ idx += (numSyncIn > 0) ? 1 : 0;
95
+ reinterpret_cast<adf::_io_buffer_light_weight_generic*>(args[idx])->release<adf::direction::in>(numSyncIn > 1);
96
+ idx += (numSyncIn > 1) ? 1 : 0;
97
+ idx += numAsyncIn;
98
+ }
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/3_3_reloadable4/Release/3_3_reloadable4.calltree ADDED
@@ -0,0 +1,54 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+
2
+ // File generated by bridge version V-2024.06#84922c0d9f#241219, Fri Mar 21 03:46:39 2025
3
+ // Copyright 2014-2024 Synopsys, Inc. All rights reserved.
4
+ // bridge -o../Release/0_0_reloadable2 ../Release/0_0_reloadable2.o -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/isg -g -I/usr/local/lib/python3.10/dist-packages/include -I/app/vaiml_1.3_examples/camo/./segmentation_1_4_0_fp32_combined/vaiml_par_0/0/backend -I/usr/local/lib/python3.10/site-packages/include/aie_api -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/common -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/include/common -I/usr/local/lib/python3.10/dist-packages/vitis_mllib -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/misc -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/src/ml_adf -I/app/vaiml_1.3_examples/camo/segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/. -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libcxx-lite/include -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libs/libcxx-9.0.0/include-lite -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime/include -D__AIENGINE__ -D__AIE_ARCH__=21 -DDEPLOYMENT_ELF=1 -D__LOCK_FENCE_MODE__=0 -D__IO_BUFFER_FORCE_LIGHT_WEIGHT__ -DAIE_API_EMULATE_BFLOAT16_MMUL_WITH_BFP16=1 -DAIE_OPTION_SCALAR_FLOAT_ON_VECTOR -D__tct_tgt__=241219 -c0_0_reloadable2.bcf -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/softfloat/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libcxx-lite/lib/Release_LLVM -lme -lc -lm -lc++lite -lsoftfloat -S -export-locals -iconfig extra_memories.bcf -yTM -m -fC -fS -fH +m -T +work ../Release/chesswork1731 -pme
5
+
6
+
7
+ // Release: ipp V-2024.06-TGT-241219
8
+
9
+ _Z13kernelWrapperPPvjjjj
10
+ _Z26superkernel_reduce_mean_c8RN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE
11
+ _ZN18reduce_skeleton_c8I8bfloat1619reduce_mean_c8_implIS0_E23reduce_mean_c8_params_tIS0_EE5setupER18reduce_c8_params_tIS4_EPKv
12
+ _Z6pad_3dIL11pad_3d_mode0E8bfloat16Li1EEvPT0_S3_R15pad_3d_params_t
13
+ _ZN18reduce_skeleton_c8I8bfloat1619reduce_mean_c8_implIS0_E23reduce_mean_c8_params_tIS0_EE3runEPS0_S6_R18reduce_c8_params_tIS4_E
14
+ _ZN12me_primitive10udiv_dstepEjjRjS0_
15
+ _ZN12me_primitive10udiv_dstepEjjRjS0_ (*)
16
+ int32_to_float32
17
+ _ZL28normalizeRoundAndPackFloat32iij
18
+ _ZL19roundAndPackFloat32iij
19
+ float32_add
20
+ _ZL14addFloat32Sigsjji
21
+ _ZL19propagateFloat32NaNjj
22
+ _ZL19roundAndPackFloat32iij (*)
23
+ _ZL14subFloat32Sigsjji
24
+ _ZL19propagateFloat32NaNjj (*)
25
+ _ZL28normalizeRoundAndPackFloat32iij (*)
26
+
27
+
28
+ Call tree stack and functions sizes:
29
+
30
+ stack stack stack call func func function name
31
+ desc level level desc
32
+ ----- ----- ----- ----- ----- ----- --------------------------------------------------------------
33
+ 64 448 0 0 220 10058 _Z13kernelWrapperPPvjjjj
34
+ 128 384 1 1 2676 9838 _Z26superkernel_reduce_mean_c8RN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE
35
+ 64 64 2 2 1588 1588 _ZN18reduce_skeleton_c8I8bfloat1619reduce_mean_c8_implIS0_E23reduce_mean_c8_params_tIS0_EE5setupER18reduce_c8_params_tIS4_EPKv
36
+ 0 0 2 2 670 670 _Z6pad_3dIL11pad_3d_mode0E8bfloat16Li1EEvPT0_S3_R15pad_3d_params_t
37
+ 256 256 2 2 2680 2822 _ZN18reduce_skeleton_c8I8bfloat1619reduce_mean_c8_implIS0_E23reduce_mean_c8_params_tIS0_EE3runEPS0_S6_R18reduce_c8_params_tIS4_E
38
+ 0 0 3 3 142 142 _ZN12me_primitive10udiv_dstepEjjRjS0_
39
+ 0 0 2 2 142 142 _ZN12me_primitive10udiv_dstepEjjRjS0_
40
+ 0 0 2 2 114 530 int32_to_float32
41
+ 0 0 2 3 24 416 _ZL28normalizeRoundAndPackFloat32iij <tail call>
42
+ 0 0 2 4 392 392 _ZL19roundAndPackFloat32iij <tail call>
43
+ 0 0 2 2 64 1968 float32_add
44
+ 0 0 3 3 624 1128 _ZL14addFloat32Sigsjji
45
+ 0 0 4 4 112 112 _ZL19propagateFloat32NaNjj
46
+ 0 0 3 4 392 392 _ZL19roundAndPackFloat32iij <tail call>
47
+ 0 0 2 3 752 1280 _ZL14subFloat32Sigsjji <tail call>
48
+ 0 0 3 4 112 112 _ZL19propagateFloat32NaNjj
49
+ 0 0 2 4 24 416 _ZL28normalizeRoundAndPackFloat32iij <tail call> (*)
50
+
51
+
52
+ Maximum call level : 4
53
+ Maximum stack level: 4
54
+ Maximum stack size : 448
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/3_3_reloadable4/Release/3_3_reloadable4.cmic2 ADDED
The diff for this file is too large to render. See raw diff