iswaalex committed on
Commit
728a4e7
·
verified ·
1 Parent(s): b39425e

Add files using upload-large-folder tool

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0/Release/0_0.srv +0 -0
  2. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0/Release/0_0.txt +405 -0
  3. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0/lcp/0_0_110.bin +3 -0
  4. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0/lcp/0_0_111.bin +3 -0
  5. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0/lcp/0_0_112.bin +3 -0
  6. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0/lcp/0_0_114.bin +3 -0
  7. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0/lcp/0_0_115.bin +3 -0
  8. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0/lcp/0_0_116.bin +3 -0
  9. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0/lcp/0_0_117.bin +3 -0
  10. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0/scripts/0_0.bcf +20 -0
  11. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0/scripts/0_0.prx +13 -0
  12. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0/src/0_0.cc +90 -0
  13. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0/timestamped_log/0_0.log +59 -0
  14. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0_reloadable0/0_0_reloadable0.log +0 -0
  15. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0_reloadable0/Release/0_0_reloadable0.# +2 -0
  16. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0_reloadable0/Release/0_0_reloadable0.## +2 -0
  17. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0_reloadable0/Release/0_0_reloadable0.calltree +98 -0
  18. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0_reloadable0/Release/0_0_reloadable0.cmic2 +0 -0
  19. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0_reloadable0/Release/0_0_reloadable0.cmico +1 -0
  20. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0_reloadable0/Release/0_0_reloadable0.lst +0 -0
  21. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0_reloadable0/Release/0_0_reloadable0.map +295 -0
  22. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0_reloadable0/Release/0_0_reloadable0.o.lst +0 -0
  23. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0_reloadable0/Release/0_0_reloadable0.sdr +129 -0
  24. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0_reloadable0/Release/0_0_reloadable0.srv +0 -0
  25. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0_reloadable0/Release/0_0_reloadable0.txt +0 -0
  26. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0_reloadable0/scripts/0_0_reloadable0.bcf +16 -0
  27. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0_reloadable0/scripts/0_0_reloadable0.prx +13 -0
  28. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0_reloadable0/src/0_0_reloadable0.cc +112 -0
  29. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0_reloadable0/timestamped_log/0_0_reloadable0.log +0 -0
  30. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0_reloadable0/xlopt.log +434 -0
  31. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0_reloadable1/0_0_reloadable1.log +0 -0
  32. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0_reloadable1/Release/0_0_reloadable1.# +2 -0
  33. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0_reloadable1/Release/0_0_reloadable1.## +2 -0
  34. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0_reloadable1/Release/0_0_reloadable1.calltree +64 -0
  35. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0_reloadable1/Release/0_0_reloadable1.cmic2 +0 -0
  36. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0_reloadable1/Release/0_0_reloadable1.cmico +1 -0
  37. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0_reloadable1/Release/0_0_reloadable1.lst +0 -0
  38. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0_reloadable1/Release/0_0_reloadable1.map +217 -0
  39. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0_reloadable1/Release/0_0_reloadable1.o.lst +0 -0
  40. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0_reloadable1/Release/0_0_reloadable1.sdr +107 -0
  41. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0_reloadable1/Release/0_0_reloadable1.srv +0 -0
  42. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0_reloadable1/Release/0_0_reloadable1.txt +0 -0
  43. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0_reloadable1/scripts/0_0_reloadable1.bcf +16 -0
  44. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0_reloadable1/scripts/0_0_reloadable1.prx +13 -0
  45. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0_reloadable1/src/0_0_reloadable1.cc +69 -0
  46. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0_reloadable1/timestamped_log/0_0_reloadable1.log +0 -0
  47. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0_reloadable1/xlopt.log +402 -0
  48. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0_reloadable10/Release/0_0_reloadable10.calltree +54 -0
  49. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0_reloadable10/Release/0_0_reloadable10.cmic2 +0 -0
  50. segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0_reloadable10/Release/0_0_reloadable10.cmico +1 -0
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0/Release/0_0.srv ADDED
The diff for this file is too large to render. See raw diff
 
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0/Release/0_0.txt ADDED
@@ -0,0 +1,405 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ Contents of the .debug_line section:
2
+
3
+ CU: 0_0/src/0_0.cc:
4
+ File name Line number Starting address View Stmt
5
+
6
+ /usr/local/lib/python3.10/dist-packages/include/adf/aie/tile_control.h:
7
+ tile_control.h 288 0x540 x
8
+ tile_control.h 292 0x540 1
9
+ tile_control.h 292 0x540 2
10
+ tile_control.h 278 0x550
11
+ tile_control.h 292 0x550 1 x
12
+ tile_control.h 292 0x556
13
+ tile_control.h 292 0x55c
14
+ tile_control.h 278 0x562
15
+ tile_control.h 278 0x562 1
16
+ tile_control.h 292 0x570
17
+ tile_control.h 292 0x574
18
+ tile_control.h 278 0x5b0 x
19
+ tile_control.h 278 0x5c0
20
+ tile_control.h 278 0x5c0 1
21
+ tile_control.h 278 0x5d0
22
+ tile_control.h 278 0x5d0 1
23
+ tile_control.h 293 0x5e0 x
24
+
25
+ 0_0/src/0_0.cc:
26
+ 0_0.cc 12 0xe0
27
+ 0_0.cc 12 0xe0 1 x
28
+
29
+ /usr/local/lib/python3.10/dist-packages/include/adf/aie/tile_control.h:
30
+ tile_control.h 147 0xea
31
+ tile_control.h 147 0xea 1
32
+
33
+ 0_0/src/0_0.cc:
34
+ 0_0.cc 49 0xea 2
35
+ 0_0.cc 50 0xea 3
36
+ 0_0.cc 59 0xea 4
37
+ 0_0.cc 59 0xea 5
38
+ 0_0.cc 63 0xea 6
39
+ 0_0.cc 64 0xea 7
40
+ 0_0.cc 67 0xea 8
41
+
42
+ /usr/local/lib/python3.10/dist-packages/include/adf/aie/tile_control.h:
43
+ tile_control.h 278 0xf4
44
+ tile_control.h 278 0xf4 1
45
+ tile_control.h 278 0xf4 2
46
+
47
+ /usr/local/lib/python3.10/dist-packages/include/adf/io_buffer/io_buffer_compiler.h:
48
+ io_buffer_compiler.h 566 0xf4 3
49
+ io_buffer_compiler.h 567 0xf4 4
50
+ io_buffer_compiler.h 564 0x102
51
+ io_buffer_compiler.h 565 0x102 1
52
+ io_buffer_compiler.h 572 0x102 2
53
+
54
+ 0_0/src/0_0.cc:
55
+ 0_0.cc 19 0x102 3
56
+
57
+ /usr/local/lib/python3.10/dist-packages/include/adf/aie/tile_control.h:
58
+ tile_control.h 278 0x110 x
59
+ tile_control.h 278 0x114
60
+
61
+ 0_0/src/0_0.cc:
62
+ 0_0.cc 19 0x11e x
63
+
64
+ /usr/local/lib/python3.10/dist-packages/include/adf/io_buffer/io_buffer_compiler.h:
65
+ io_buffer_compiler.h 566 0x122
66
+
67
+ 0_0/src/0_0.cc:
68
+ 0_0.cc 29 0x122 1
69
+
70
+ /usr/local/lib/python3.10/dist-packages/include/adf/io_buffer/io_buffer_compiler.h:
71
+ io_buffer_compiler.h 564 0x134 x
72
+ io_buffer_compiler.h 565 0x138 x
73
+ io_buffer_compiler.h 565 0x13c
74
+ io_buffer_compiler.h 567 0x140 x
75
+ io_buffer_compiler.h 567 0x144
76
+ io_buffer_compiler.h 566 0x148 x
77
+ io_buffer_compiler.h 564 0x14c x
78
+ io_buffer_compiler.h 565 0x150 x
79
+ io_buffer_compiler.h 565 0x154
80
+ io_buffer_compiler.h 567 0x158 x
81
+ io_buffer_compiler.h 567 0x15c
82
+ io_buffer_compiler.h 566 0x160 x
83
+ io_buffer_compiler.h 564 0x164 x
84
+ io_buffer_compiler.h 565 0x168 x
85
+ io_buffer_compiler.h 565 0x16c
86
+ io_buffer_compiler.h 567 0x170 x
87
+ io_buffer_compiler.h 567 0x174
88
+ io_buffer_compiler.h 566 0x178 x
89
+ io_buffer_compiler.h 564 0x17c x
90
+ io_buffer_compiler.h 565 0x180 x
91
+ io_buffer_compiler.h 565 0x184
92
+ io_buffer_compiler.h 567 0x188 x
93
+ io_buffer_compiler.h 567 0x18c
94
+ io_buffer_compiler.h 566 0x190 x
95
+
96
+ 0_0/src/0_0.cc:
97
+ 0_0.cc 29 0x1a0 x
98
+ 0_0.cc 37 0x1a0 1 x
99
+ 0_0.cc 30 0x1aa x
100
+ 0_0.cc 37 0x1aa 1
101
+ 0_0.cc 31 0x1b4 x
102
+ 0_0.cc 32 0x1b8 x
103
+ 0_0.cc 33 0x1bc x
104
+
105
+ /usr/local/lib/python3.10/dist-packages/include/adf/io_buffer/io_buffer_compiler.h:
106
+ io_buffer_compiler.h 572 0x1c0
107
+
108
+ 0_0/src/0_0.cc:
109
+ 0_0.cc 40 0x1c0 1
110
+ 0_0.cc 40 0x1c0 2
111
+
112
+ /usr/local/lib/python3.10/dist-packages/include/adf/io_buffer/io_buffer_compiler.h:
113
+ io_buffer_compiler.h 572 0x1c8
114
+ io_buffer_compiler.h 575 0x1c8 1
115
+
116
+ 0_0/src/0_0.cc:
117
+ 0_0.cc 58 0x1c8 2
118
+
119
+ /usr/local/lib/python3.10/dist-packages/include/adf/io_buffer/io_buffer_compiler.h:
120
+ io_buffer_compiler.h 575 0x1ce
121
+
122
+ 0_0/src/0_0.cc:
123
+ 0_0.cc 41 0x1d6
124
+ 0_0.cc 37 0x1e0 x
125
+ 0_0.cc 42 0x1e0 1
126
+ 0_0.cc 43 0x1e0 2
127
+
128
+ /usr/local/lib/python3.10/dist-packages/include/adf/io_buffer/io_buffer_compiler.h:
129
+ io_buffer_compiler.h 572 0x1f0 x
130
+
131
+ 0_0/src/0_0.cc:
132
+ 0_0.cc 40 0x1f0 1 x
133
+ 0_0.cc 40 0x1f0 2 x
134
+ 0_0.cc 42 0x1f0 3 x
135
+ 0_0.cc 40 0x1fa
136
+ 0_0.cc 43 0x1fa 1 x
137
+ 0_0.cc 40 0x200 x
138
+ 0_0.cc 40 0x200 1 x
139
+ 0_0.cc 40 0x204
140
+
141
+ /usr/local/lib/python3.10/dist-packages/include/adf/io_buffer/io_buffer_compiler.h:
142
+ io_buffer_compiler.h 573 0x20e x
143
+ io_buffer_compiler.h 573 0x214
144
+ io_buffer_compiler.h 575 0x218 x
145
+ io_buffer_compiler.h 574 0x220 x
146
+ io_buffer_compiler.h 574 0x230
147
+
148
+ 0_0/src/0_0.cc:
149
+ 0_0.cc 41 0x240
150
+ 0_0.cc 41 0x250 x
151
+ 0_0.cc 70 0x260
152
+ 0_0.cc 50 0x26a
153
+ 0_0.cc 49 0x270
154
+ 0_0.cc 49 0x270 1 x
155
+ 0_0.cc 50 0x270 2
156
+ 0_0.cc 49 0x27a
157
+ 0_0.cc 50 0x27a 1 x
158
+ 0_0.cc 49 0x280 x
159
+ 0_0.cc 50 0x280 1
160
+ 0_0.cc 50 0x286 x
161
+ 0_0.cc 52 0x298 x
162
+ 0_0.cc 58 0x2a0 x
163
+ 0_0.cc 59 0x2a4 x
164
+ 0_0.cc 59 0x2a8
165
+ 0_0.cc 59 0x2a8 1
166
+ 0_0.cc 60 0x2a8 2
167
+ 0_0.cc 63 0x2a8 3
168
+ 0_0.cc 64 0x2a8 4
169
+ 0_0.cc 65 0x2a8 5
170
+ 0_0.cc 67 0x2a8 6
171
+ 0_0.cc 59 0x2b0
172
+ 0_0.cc 59 0x2b4
173
+ 0_0.cc 59 0x2ba
174
+ 0_0.cc 59 0x2c0
175
+ 0_0.cc 59 0x2c4
176
+ 0_0.cc 60 0x2d0
177
+ 0_0.cc 60 0x2d0 1
178
+
179
+ /usr/local/lib/python3.10/dist-packages/include/adf/aie/tile_control.h:
180
+ tile_control.h 147 0x2d6
181
+
182
+ 0_0/src/0_0.cc:
183
+ 0_0.cc 60 0x2d6 1 x
184
+
185
+ /usr/local/lib/python3.10/dist-packages/include/adf/aie/tile_control.h:
186
+ tile_control.h 147 0x2e0
187
+ tile_control.h 147 0x2e6
188
+ tile_control.h 260 0x2e6 1
189
+ tile_control.h 440 0x2ec
190
+
191
+ 0_0/src/0_0.cc:
192
+ 0_0.cc 60 0x2f8
193
+ 0_0.cc 61 0x2fc x
194
+ 0_0.cc 63 0x300 x
195
+ 0_0.cc 63 0x304
196
+ 0_0.cc 63 0x308
197
+
198
+ /usr/local/lib/python3.10/dist-packages/include/adf/aie/tile_control.h:
199
+ tile_control.h 147 0x318 x
200
+ tile_control.h 147 0x31c
201
+ tile_control.h 147 0x320
202
+ tile_control.h 147 0x324
203
+ tile_control.h 147 0x328
204
+ tile_control.h 260 0x328 1
205
+ tile_control.h 147 0x330
206
+ tile_control.h 260 0x330 1 x
207
+ tile_control.h 440 0x340 x
208
+ tile_control.h 440 0x344
209
+ tile_control.h 440 0x344 1
210
+
211
+ 0_0/src/0_0.cc:
212
+ 0_0.cc 63 0x354
213
+ 0_0.cc 64 0x358 x
214
+ 0_0.cc 64 0x35c
215
+ 0_0.cc 64 0x360
216
+ 0_0.cc 64 0x364
217
+ 0_0.cc 40 0x36e
218
+ 0_0.cc 64 0x372
219
+ 0_0.cc 65 0x380
220
+ 0_0.cc 65 0x380 1
221
+ 0_0.cc 65 0x380 2
222
+ 0_0.cc 70 0x380 3
223
+ 0_0.cc 40 0x38a
224
+ 0_0.cc 65 0x38a 1 x
225
+ 0_0.cc 65 0x39e
226
+ 0_0.cc 65 0x3a2
227
+ 0_0.cc 66 0x3a6 x
228
+ 0_0.cc 67 0x3aa
229
+ 0_0.cc 67 0x3aa 1 x
230
+ 0_0.cc 67 0x3b4
231
+ 0_0.cc 67 0x3b4 1
232
+ 0_0.cc 67 0x3be
233
+ 0_0.cc 67 0x3be 1
234
+ 0_0.cc 70 0x3e0 x
235
+ 0_0.cc 70 0x3e4
236
+ 0_0.cc 67 0x3f2
237
+ 0_0.cc 67 0x3f2 1
238
+ 0_0.cc 72 0x3f2 2
239
+ 0_0.cc 72 0x3f2 3
240
+ 0_0.cc 70 0x3fa
241
+ 0_0.cc 70 0x40a
242
+ 0_0.cc 70 0x41a
243
+ 0_0.cc 70 0x41a 1
244
+ 0_0.cc 71 0x436 x
245
+ 0_0.cc 67 0x450 x
246
+ 0_0.cc 72 0x450 1
247
+ 0_0.cc 72 0x450 2 x
248
+ 0_0.cc 72 0x456
249
+ 0_0.cc 72 0x460
250
+ 0_0.cc 72 0x464
251
+ 0_0.cc 72 0x468
252
+ 0_0.cc 67 0x470
253
+ 0_0.cc 67 0x47c
254
+
255
+ /usr/local/lib/python3.10/dist-packages/include/adf/aie/tile_control.h:
256
+ tile_control.h 147 0x480
257
+ tile_control.h 147 0x480 1
258
+
259
+ 0_0/src/0_0.cc:
260
+ 0_0.cc 49 0x480 2
261
+ 0_0.cc 50 0x480 3
262
+ 0_0.cc 55 0x480 4
263
+ 0_0.cc 55 0x480 5
264
+ 0_0.cc 59 0x480 6
265
+ 0_0.cc 59 0x480 7
266
+ 0_0.cc 63 0x480 8
267
+ 0_0.cc 64 0x480 9
268
+ 0_0.cc 67 0x480 10
269
+ 0_0.cc 78 0x480 11
270
+ 0_0.cc 55 0x48a
271
+ 0_0.cc 74 0x494 x
272
+ 0_0.cc 75 0x498
273
+ 0_0.cc 75 0x49c
274
+ 0_0.cc 55 0x4a4 x
275
+ 0_0.cc 74 0x4ac
276
+ 0_0.cc 75 0x4b2 x
277
+ 0_0.cc 75 0x4b6
278
+ 0_0.cc 78 0x4ba
279
+ 0_0.cc 78 0x4ba 1 x
280
+ 0_0.cc 79 0x4ba 2
281
+ 0_0.cc 79 0x4ba 3
282
+ 0_0.cc 80 0x4ba 4
283
+ 0_0.cc 80 0x4ba 5
284
+ 0_0.cc 78 0x4c6
285
+ 0_0.cc 79 0x4c6 1
286
+ 0_0.cc 80 0x4c6 2
287
+ 0_0.cc 78 0x4d0
288
+ 0_0.cc 79 0x4d0 1
289
+ 0_0.cc 81 0x4d0 2
290
+
291
+ /usr/local/lib/python3.10/dist-packages/include/adf/io_buffer/io_buffer_compiler.h:
292
+ io_buffer_compiler.h 564 0x4da
293
+ io_buffer_compiler.h 565 0x4da 1
294
+ io_buffer_compiler.h 572 0x4da 2
295
+
296
+ 0_0/src/0_0.cc:
297
+ 0_0.cc 79 0x4da 3 x
298
+ 0_0.cc 79 0x4e0
299
+ 0_0.cc 81 0x4e4
300
+ 0_0.cc 78 0x4f0 x
301
+ 0_0.cc 79 0x4f4 x
302
+ 0_0.cc 80 0x4f8 x
303
+ 0_0.cc 80 0x500
304
+ 0_0.cc 81 0x50a x
305
+ 0_0.cc 29 0x50e
306
+
307
+ /usr/local/lib/python3.10/dist-packages/include/adf/aie/tile_control.h:
308
+ tile_control.h 278 0x518
309
+ tile_control.h 278 0x518 1
310
+ tile_control.h 278 0x518 2
311
+
312
+ /usr/local/lib/python3.10/dist-packages/include/adf/io_buffer/io_buffer_compiler.h:
313
+ io_buffer_compiler.h 566 0x518 3
314
+ io_buffer_compiler.h 567 0x518 4
315
+
316
+ 0_0/src/0_0.cc:
317
+ 0_0.cc 19 0x518 5
318
+
319
+ /usr/local/lib/python3.10/dist-packages/include/adf/io_buffer/io_buffer_compiler.h:
320
+ io_buffer_compiler.h 564 0x530
321
+ io_buffer_compiler.h - 0x531
322
+
323
+
324
+ CU: No directory table
325
+ CU: Empty file name table
326
+ <unknown> - 0x1
327
+
328
+
329
+ CU: ./me_basic.c:
330
+ File name Line number Starting address View Stmt
331
+
332
+ ./me_basic.c:[++]
333
+ me_basic.c 73 0x5f0 x
334
+ me_basic.c 73 0x5f0 1
335
+ me_basic.c 75 0x5f6
336
+ me_basic.c 76 0x5f6 1
337
+ me_basic.c 75 0x600
338
+ me_basic.c 75 0x600 1
339
+ me_basic.c 75 0x60a x
340
+ me_basic.c 76 0x60a 1
341
+ me_basic.c 75 0x610
342
+ me_basic.c 76 0x630 x
343
+ me_basic.c 76 0x640
344
+ me_basic.c 75 0x644
345
+ me_basic.c 75 0x650 x
346
+ me_basic.c 75 0x654
347
+ me_basic.c 77 0x670
348
+ me_basic.c 77 0x686 x
349
+ me_basic.c 77 0x68a
350
+ me_basic.c 91 0 x
351
+ me_basic.c 87 0 1 x
352
+ me_basic.c 69 0x6
353
+ me_basic.c 69 0x6 1
354
+ me_basic.c 69 0xc
355
+ me_basic.c 69 0x12 x
356
+ me_basic.c 69 0x16
357
+ me_basic.c 98 0x26
358
+ me_basic.c 98 0x26 1
359
+ me_basic.c 69 0x30
360
+ me_basic.c 70 0x30 1
361
+ me_basic.c 69 0x40
362
+ me_basic.c 70 0x40 1 x
363
+ me_basic.c 70 0x52
364
+ me_basic.c 69 0x60 x
365
+ me_basic.c 69 0x64
366
+ me_basic.c 98 0x74
367
+ me_basic.c 98 0x74 1
368
+ me_basic.c 98 0x80 x
369
+
370
+ runtime/include/stdlib.h:
371
+ stdlib.h 77 0x90 x
372
+ stdlib.h 77 0x96
373
+ stdlib.h 61 0xbc x
374
+ stdlib.h 62 0xcc x
375
+ stdlib.h 64 0xd0 x
376
+ stdlib.h - 0xd1
377
+
378
+
379
+ CU: src/atexit.c:
380
+ File name Line number Starting address View Stmt
381
+
382
+ src/atexit.c:
383
+ atexit.c 47 0x6a0 x
384
+ atexit.c 47 0x6a0 1
385
+ atexit.c 55 0x6a0 2
386
+ atexit.c 53 0x6aa
387
+ atexit.c 52 0x6cc
388
+ atexit.c 53 0x6cc 1
389
+ atexit.c 52 0x6d6 x
390
+ atexit.c 53 0x6ec x
391
+ atexit.c 54 0x704 x
392
+ atexit.c 55 0x70a x
393
+ atexit.c 56 0x728
394
+ atexit.c 56 0x72e x
395
+ atexit.c 60 0x732
396
+ atexit.c 63 0x740 x
397
+ atexit.c 63 0x744
398
+ atexit.c 63 0x752
399
+ atexit.c 60 0x770 x
400
+ atexit.c 66 0x780
401
+ atexit.c 66 0x7c2 x
402
+ atexit.c 66 0x7c8
403
+ atexit.c - 0x7c9
404
+
405
+
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0/lcp/0_0_110.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:801429b6a86c59d0a139acc086a4c0b19dea4fcf010750b8af911795779b3ef7
3
+ size 296
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0/lcp/0_0_111.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1545a2de7f8e377ec48bc84db8572b4a4733a86ba5f59ba34b08237b130101c4
3
+ size 296
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0/lcp/0_0_112.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8eb16cc09bc51217dbd78f0fa4ff8c297513bb3ab6176fd7c20784771e643ea4
3
+ size 296
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0/lcp/0_0_114.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:92cc167047680f0cdc082b8dd4e48e6b44c0246ebe906740d3ffef91d5997a91
3
+ size 384
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0/lcp/0_0_115.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:801429b6a86c59d0a139acc086a4c0b19dea4fcf010750b8af911795779b3ef7
3
+ size 296
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0/lcp/0_0_116.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1545a2de7f8e377ec48bc84db8572b4a4733a86ba5f59ba34b08237b130101c4
3
+ size 296
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0/lcp/0_0_117.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8eb16cc09bc51217dbd78f0fa4ff8c297513bb3ab6176fd7c20784771e643ea4
3
+ size 296
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0/scripts/0_0.bcf ADDED
@@ -0,0 +1,20 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ _reserved DMb 0x0 0x40000
2
+
3
+ _reserved PM 0x930 0x36d0 //reserved for reloadable elfs
4
+
5
+ _entry_point _main_init
6
+ _symbol _main _after _main_init
7
+ _symbol _main_init 0x0
8
+ _symbol _Z13kernelWrapperPPvjjjj 0x930
9
+ _extern _Z13kernelWrapperPPvjjjj
10
+
11
+ _symbol lcpPing 0x7b280
12
+ _symbol lcpPong 0x7b680
13
+ _reserved DMb 0x7ba80 0x40 //reserved for sync buffer
14
+ _stack DM_stack 0x7bac0 0x940 //stack for core
15
+ //space for synopsys compiler at 0x7c400 0x40//heap
16
+ _reserved DMb 0x7c440 0x880 //reserved for reloadable elf heap
17
+ _reserved DMb 0x40000 0x3b280
18
+
19
+ _reserved DMb 0x7ccc0 0x3340
20
+ _reserved DMb 0x80000 0x80000 // And everything else the core can't see
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0/scripts/0_0.prx ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ <project name="Project" processor="me">
2
+ <file type="lbc" name="0_0.ll" path="../../ir"/>
3
+ <issinit/>
4
+ <option id="cpp.define" value="__AIENGINE__ __AIE_ARCH__=21" inherit = "1"/>
5
+ <option id="llvm.xargs" value="-fno-jump-tables -fno-discard-value-names" inherit = "1"/>
6
+ <option id="llvm.lang" value="Follow file extension"/>
7
+ <option id="bridge.cfg" value="0_0.bcf"/>
8
+ <option id="cpp.include" value="&lt;XILINX_VITIS_AIETOOLS&gt;/include /app/vaiml_1.3_examples/camo/./segmentation_1_4_0_fp32_combined/vaiml_par_0/0/backend /usr/local/lib/python3.10/site-packages/include/aie_api /usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/common /usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/include/common /usr/local/lib/python3.10/dist-packages/vitis_mllib /usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/misc /usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/src/ml_adf /app/vaiml_1.3_examples/camo/segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/&lt;AIE_SRC_DIR&gt; " inherit="1"/>
9
+ <option id="project.dir" value="&lt;CONFIG&gt;/0_0"/>
10
+ <option id="project.name" value="0_0"/>
11
+ <option id="project.type" value="exe"/>
12
+ <option id="simrun.issca" value="&lt;XILINX_VITIS_AIETOOLS&gt;/bin/unwrapped/lnx64.o/aie2p/ca_udm_dbg" inherit="0"/>
13
+ </project>
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0/src/0_0.cc ADDED
@@ -0,0 +1,90 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ // Automatically generated processor driver using AIEngine tool-chain
2
+
3
+ #include <stdio.h>
4
+ #include <memory>
5
+ #include <adf.h>
6
+
7
+ extern void kernelWrapper(void* args[], uint32 kernelId, uint32 numSyncIn, uint32 numAsyncIn, uint32 numSyncOut);
8
+ uint32 lcpPing[256];
9
+ uint32 lcpPong[256];
10
+
11
+ int main(void)
12
+ {
13
+
14
+ while (true)
15
+ {
16
+ //initialize locks for layer control parameters
17
+ adf::initialize_lock(14, 0);
18
+ adf::initialize_lock(15, 0);
19
+ acquire_equal(62, 1);
20
+ uint32* lcp = lcpPing;
21
+ uint32 idx = 0;
22
+ constexpr int const maxKernelPorts = 5;
23
+ adf::_io_buffer_light_weight_generic ioBufPorts[4] = {};
24
+
25
+ while (true)
26
+ {
27
+ void* args[1 + maxKernelPorts];
28
+ uint32 numArgs = 0;
29
+ uint32 loop_cnt0 = lcp[idx++];
30
+ uint32 numSyncInPorts = lcp[idx++];
31
+ uint32 numAsyncInPorts = lcp[idx++];
32
+ uint32 numSyncOutPorts = lcp[idx++];
33
+ uint32 numAsyncOutPorts = lcp[idx++];
34
+ uint32 numIoBufPorts = numSyncInPorts + numAsyncInPorts + numSyncOutPorts + numAsyncOutPorts;
35
+ uint32 numRtpPorts = lcp[idx++];
36
+
37
+ for (int i = 0; i < numIoBufPorts; ++i)
38
+ chess_loop_range(2,4)
39
+ {
40
+ new(&ioBufPorts[numArgs]) adf::_io_buffer_light_weight_generic{(void*)lcp[idx+0], lcp[idx+1], (void*)lcp[idx+2], lcp[idx+3]};
41
+ args[numArgs] = &ioBufPorts[numArgs];
42
+ numArgs += 1;
43
+ idx += 4;
44
+ }
45
+
46
+ for (int i = 0; i < numRtpPorts; i++)
47
+ chess_loop_range(1,1)
48
+ {
49
+ uint32 numRtpValues = lcp[idx];
50
+ args[numArgs] = &lcp[idx+1];
51
+ numArgs++;
52
+ idx += (numRtpValues+1);
53
+ }
54
+
55
+ for(int lc0 = 0, lcp_size0 = 0; lc0 < loop_cnt0; lc0++)
56
+ chess_loop_range(1,)
57
+ {
58
+ idx -= lcp_size0;
59
+ adf::block_write((adf::reg_val*)(&lcp[idx+1]), lcp[idx]);
60
+ uint32 numBlockWrite1 = lcp[idx] * 2 + 1;
61
+ idx += numBlockWrite1;
62
+ // Wait previous layer mm2s channel done
63
+ adf::wait_dma_channel_done(lcp[idx++]);
64
+ adf::block_write((adf::reg_val*)(&lcp[idx+1]), lcp[idx]);
65
+ uint32 numBlockWrite2 = lcp[idx] * 2 + 1;
66
+ idx += numBlockWrite2;
67
+ for (int lc1 = 0, loop_cnt1 = lcp[idx]; lc1 < loop_cnt1; lc1++)
68
+ chess_loop_range(1,)
69
+ {
70
+ if(lc0 == 0 && lc1 == 0 && lcp[idx+1])
71
+ done();
72
+ kernelWrapper(args, lcp[idx+2], numSyncInPorts, numAsyncInPorts, numSyncOutPorts);
73
+ }
74
+ idx += 3;
75
+ lcp_size0 = numBlockWrite1 + numBlockWrite2 + 4;
76
+ }
77
+
78
+ bool isLastLayer = lcp[idx];
79
+ release((lcp == lcpPing ? 62 : 63), -1);
80
+ acquire_equal((lcp == lcpPing ? 63 : 62), 1, !isLastLayer);
81
+ lcp = (lcp == lcpPing ? lcpPong : lcpPing);
82
+ idx = 0;
83
+
84
+ if (isLastLayer)
85
+ break;
86
+ }
87
+ }
88
+
89
+ return 0;
90
+ }
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0/timestamped_log/0_0.log ADDED
@@ -0,0 +1,59 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ERROR: ld.so: object '/lib64/libudev.so.1' from LD_PRELOAD cannot be preloaded (cannot open shared object file): ignored.
2
+ Configuration: Release_LLVM
3
+ Compiling "0_0.ll"
4
+ chess-clang --chess-proc-dir=/usr/local/lib/python3.10/dist-packages/data/aie2p/lib -S -O2 -std=c++2a -fno-builtin-memcpy -mllvm -instcombine-code-sinking=false -mllvm -disable-lsr -mllvm -replexitval=never -mllvm -enable-load-pre=false -mllvm -chess-disable-add-to-or -mllvm -chess-combine-gep-indices=none -mllvm -chess-disable-fold-phi-of-loads -mllvm -chess-aainfo2chains-algo=4 -mllvm -chess-aggressive-aainfo=false -mllvm -chess-enable-indvarsimplify=0 -mllvm -chess-disable-cse-across-loopboundary -mllvm -chess-tbaa-detect-common-underlying-object=true -mllvm -chess-protect-llvm-global-reg-access=true -fno-jump-tables -fno-discard-value-names -g ../../ir/0_0.ll -o../Release/chesswork848/0_0.sfg --chess-proc-name=me
5
+ ERROR: ld.so: object '/lib64/libudev.so.1' from LD_PRELOAD cannot be preloaded (cannot open shared object file): ignored.
6
+ noodle -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/isg -I/usr/local/lib/python3.10/dist-packages/include -I/app/vaiml_1.3_examples/camo/./segmentation_1_4_0_fp32_combined/vaiml_par_0/0/backend -I/usr/local/lib/python3.10/site-packages/include/aie_api -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/common -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/include/common -I/usr/local/lib/python3.10/dist-packages/vitis_mllib -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/misc -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/src/ml_adf -I/app/vaiml_1.3_examples/camo/segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/. -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libcxx-lite/include -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libs/libcxx-9.0.0/include-lite -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime/include -D__AIENGINE__ -D__AIE_ARCH__=21 -DDEPLOYMENT_ELF=1 -D__LOCK_FENCE_MODE__=0 -D__IO_BUFFER_FORCE_LIGHT_WEIGHT__ -DAIE_API_EMULATE_BFLOAT16_MMUL_WITH_BFP16=1 -DAIE_OPTION_SCALAR_FLOAT_ON_VECTOR -D__tct_tgt__=241219 -iaie_core.h +Sinl +Olbb=200 +Opmsa +NOpld +Olzyinl +w../Release/chesswork848 ../Release/chesswork848/0_0.sfg +Q1=+Sinl,+Olbb=200,+Opmsa,+NOpld,+Olzyinl +Q2=+Sinl,+Olbb=200,+Opmsa,+NOpld,+Olzyinl +Q3=+Sinl,+Olbb=1000,+Opmsa,+NOpld,+Olzyinl +Qfast=+Sinl,+Olbb=1000,+Opmsa,+NOpld,+Olzyinl,+Opfp +Qs=+Sinl,+Olbb=200,+Opmsa,+NOpld,+Olzyinl +Qz=+Sinl,+Olbb=200,+Opmsa,+NOpld,+Olzyinl me
7
+ ERROR: ld.so: object '/lib64/libudev.so.1' from LD_PRELOAD cannot be preloaded (cannot open shared object file): ignored.
8
+ ERROR: ld.so: object '/lib64/libudev.so.1' from LD_PRELOAD cannot be preloaded (cannot open shared object file): ignored.
9
+ ERROR: ld.so: object '/lib64/libudev.so.1' from LD_PRELOAD cannot be preloaded (cannot open shared object file): ignored.
10
+ chess-backend 0_0-F_ZN3adf11block_writeEPKNS_7reg_valEj_ me /usr/local/lib/python3.10/dist-packages/data/aie2p/lib +H/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/elongation --print-subtools --cosel -m +ef +s -M3 --amnesia -p10 -q2 -ecrSCDEn -ecrMCDEn -ecrVaddSign -ecrUnpackSign -ecrPackSign -ecrUPSSign -ecrUPSMode -ecrSRSSign -ecrSRSMode -ecrF2IMask -ecrUnpackSize -ecrPackSize -ecrSat -ecrRnd +Oefc +Opbr +Odhls +Oprefer-local-reg-moves -Onocb --mist1 -k64 --showcolor -b -Obbl --mist2 -D__AIENGINE__ -D__AIE_ARCH__=21 -DDEPLOYMENT_ELF=1 -D__LOCK_FENCE_MODE__=0 -D__IO_BUFFER_FORCE_LIGHT_WEIGHT__ -DAIE_API_EMULATE_BFLOAT16_MMUL_WITH_BFP16=1 -DAIE_OPTION_SCALAR_FLOAT_ON_VECTOR -D__tct_tgt__=241219 +Omod -k64 +Omsbr=100 +Opnll +A +pnopALU +pnopLDA +pnopLDB +pnopSTS +pnopVEC +Ofexm +Omsanafs +Onzmem +Onombt +Ochex +Omsmfi +Omslactc=lckLdaRsrc_E1,lckLdbRsrc_E1:2 +Odra +Oslr=crSRSSign +Oslr=crUPSMode +Oslr=crSRSMode +Oslr=crRnd +Oslr=crSat +Onop-syntax=NOPA +Onop-syntax=NOPB +Onop-syntax=NOPM +Onop-syntax=NOPV +Onop-syntax=NOPS +Onop-syntax=NOPX +Onop-syntax=NOPXM --tale -g -D__AIENGINE__ -D__AIE_ARCH__=21 -DDEPLOYMENT_ELF=1 -D__LOCK_FENCE_MODE__=0 -D__IO_BUFFER_FORCE_LIGHT_WEIGHT__ -DAIE_API_EMULATE_BFLOAT16_MMUL_WITH_BFP16=1 -DAIE_OPTION_SCALAR_FLOAT_ON_VECTOR -D__tct_tgt__=241219 -V0_0 -L
11
+ chess-backend 0_0-main_ me /usr/local/lib/python3.10/dist-packages/data/aie2p/lib +H/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/elongation -x --print-subtools --cosel -m +ef +s -M3 --amnesia -p10 -q2 -ecrSCDEn -ecrMCDEn -ecrVaddSign -ecrUnpackSign -ecrPackSign -ecrUPSSign -ecrUPSMode -ecrSRSSign -ecrSRSMode -ecrF2IMask -ecrUnpackSize -ecrPackSize -ecrSat -ecrRnd +Oefc +Opbr +Odhls +Oprefer-local-reg-moves -Onocb --mist1 -k64 --showcolor -b -Obbl --mist2 -D__AIENGINE__ -D__AIE_ARCH__=21 -DDEPLOYMENT_ELF=1 -D__LOCK_FENCE_MODE__=0 -D__IO_BUFFER_FORCE_LIGHT_WEIGHT__ -DAIE_API_EMULATE_BFLOAT16_MMUL_WITH_BFP16=1 -DAIE_OPTION_SCALAR_FLOAT_ON_VECTOR -D__tct_tgt__=241219 +Omod -k64 +Omsbr=100 +Opnll +A +pnopALU +pnopLDA +pnopLDB +pnopSTS +pnopVEC +Ofexm +Omsanafs +Onzmem +Onombt +Ochex +Omsmfi +Omslactc=lckLdaRsrc_E1,lckLdbRsrc_E1:2 +Odra +Oslr=crSRSSign +Oslr=crUPSMode +Oslr=crSRSMode +Oslr=crRnd +Oslr=crSat +Onop-syntax=NOPA +Onop-syntax=NOPB +Onop-syntax=NOPM +Onop-syntax=NOPV +Onop-syntax=NOPS +Onop-syntax=NOPX +Onop-syntax=NOPXM --tale -g -D__AIENGINE__ -D__AIE_ARCH__=21 -DDEPLOYMENT_ELF=1 -D__LOCK_FENCE_MODE__=0 -D__IO_BUFFER_FORCE_LIGHT_WEIGHT__ -DAIE_API_EMULATE_BFLOAT16_MMUL_WITH_BFP16=1 -DAIE_OPTION_SCALAR_FLOAT_ON_VECTOR -D__tct_tgt__=241219 -V0_0 -L
12
+ chess-backend --gvt me /usr/local/lib/python3.10/dist-packages/data/aie2p/lib +H/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/elongation --tale -g -D__AIENGINE__ -D__AIE_ARCH__=21 -DDEPLOYMENT_ELF=1 -D__LOCK_FENCE_MODE__=0 -D__IO_BUFFER_FORCE_LIGHT_WEIGHT__ -DAIE_API_EMULATE_BFLOAT16_MMUL_WITH_BFP16=1 -DAIE_OPTION_SCALAR_FLOAT_ON_VECTOR -D__tct_tgt__=241219 -V0_0 -L
13
+ ERROR: ld.so: object '/lib64/libudev.so.1' from LD_PRELOAD cannot be preloaded (cannot open shared object file): ignored.
14
+ ERROR: ld.so: object '/lib64/libudev.so.1' from LD_PRELOAD cannot be preloaded (cannot open shared object file): ignored.
15
+ ERROR: ld.so: object '/lib64/libudev.so.1' from LD_PRELOAD cannot be preloaded (cannot open shared object file): ignored.
16
+ --cosel -m +ef +s -M3 --common 0_0-F_ZN3adf11block_writeEPKNS_7reg_valEj_ me /usr/local/lib/python3.10/dist-packages/data/aie2p/lib +H/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/elongation
17
+ --cosel -m +ef +s -M3 --common 0_0-main_ me /usr/local/lib/python3.10/dist-packages/data/aie2p/lib +H/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/elongation -x
18
+ ERROR: ld.so: object '/lib64/libudev.so.1' from LD_PRELOAD cannot be preloaded (cannot open shared object file): ignored.
19
+ ERROR: ld.so: object '/lib64/libudev.so.1' from LD_PRELOAD cannot be preloaded (cannot open shared object file): ignored.
20
+ --amnesia -p10 -q2 -ecrSCDEn -ecrMCDEn -ecrVaddSign -ecrUnpackSign -ecrPackSign -ecrUPSSign -ecrUPSMode -ecrSRSSign -ecrSRSMode -ecrF2IMask -ecrUnpackSize -ecrPackSize -ecrSat -ecrRnd +Oefc +Opbr +Odhls +Oprefer-local-reg-moves -Onocb --common 0_0-F_ZN3adf11block_writeEPKNS_7reg_valEj_ me /usr/local/lib/python3.10/dist-packages/data/aie2p/lib +H/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/elongation
21
+ --mist1 -k64 --common 0_0-F_ZN3adf11block_writeEPKNS_7reg_valEj_ me /usr/local/lib/python3.10/dist-packages/data/aie2p/lib +H/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/elongation
22
+ --amnesia -p10 -q2 -ecrSCDEn -ecrMCDEn -ecrVaddSign -ecrUnpackSign -ecrPackSign -ecrUPSSign -ecrUPSMode -ecrSRSSign -ecrSRSMode -ecrF2IMask -ecrUnpackSize -ecrPackSize -ecrSat -ecrRnd +Oefc +Opbr +Odhls +Oprefer-local-reg-moves -Onocb --common 0_0-main_ me /usr/local/lib/python3.10/dist-packages/data/aie2p/lib +H/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/elongation -x
23
+ --showcolor -b -Obbl --common 0_0-F_ZN3adf11block_writeEPKNS_7reg_valEj_ me /usr/local/lib/python3.10/dist-packages/data/aie2p/lib +H/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/elongation
24
+ --mist2 -D__AIENGINE__ -D__AIE_ARCH__=21 -DDEPLOYMENT_ELF=1 -D__LOCK_FENCE_MODE__=0 -D__IO_BUFFER_FORCE_LIGHT_WEIGHT__ -DAIE_API_EMULATE_BFLOAT16_MMUL_WITH_BFP16=1 -DAIE_OPTION_SCALAR_FLOAT_ON_VECTOR -D__tct_tgt__=241219 +Omod -k64 +Omsbr=100 +Opnll +A +pnopALU +pnopLDA +pnopLDB +pnopSTS +pnopVEC +Ofexm +Omsanafs +Onzmem +Onombt +Ochex +Omsmfi +Omslactc=lckLdaRsrc_E1,lckLdbRsrc_E1:2 +Odra +Oslr=crSRSSign +Oslr=crUPSMode +Oslr=crSRSMode +Oslr=crRnd +Oslr=crSat +Onop-syntax=NOPA +Onop-syntax=NOPB +Onop-syntax=NOPM +Onop-syntax=NOPV +Onop-syntax=NOPS +Onop-syntax=NOPX +Onop-syntax=NOPXM --common 0_0-F_ZN3adf11block_writeEPKNS_7reg_valEj_ me /usr/local/lib/python3.10/dist-packages/data/aie2p/lib +H/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/elongation
25
+ ERROR: ld.so: object '/lib64/libudev.so.1' from LD_PRELOAD cannot be preloaded (cannot open shared object file): ignored.
26
+ ERROR: ld.so: object '/lib64/libudev.so.1' from LD_PRELOAD cannot be preloaded (cannot open shared object file): ignored.
27
+ Warning in "/usr/local/lib/python3.10/dist-packages/include/adf/aie/tile_control.h", line 292, column 8: in "/usr/local/lib/python3.10/dist-packages/include/adf/aie/tile_control.h", line 292: (loop #8)
28
+ loop software pipelining (to 2 cycles) is feasible for a minimum loop count of 5,
29
+ but requires the creation of a post-amble, for which the loop was not prepared
30
+ ... consider annotating the loop with `chess_prepare_for_pipelining', as well as
31
+ increasing the current `chess_loop_range(1,)` annotation to `chess_loop_range(5,)', or remove it.
32
+
33
+ --tale -g -D__AIENGINE__ -D__AIE_ARCH__=21 -DDEPLOYMENT_ELF=1 -D__LOCK_FENCE_MODE__=0 -D__IO_BUFFER_FORCE_LIGHT_WEIGHT__ -DAIE_API_EMULATE_BFLOAT16_MMUL_WITH_BFP16=1 -DAIE_OPTION_SCALAR_FLOAT_ON_VECTOR -D__tct_tgt__=241219 -V0_0 -L --common 0_0-F_ZN3adf11block_writeEPKNS_7reg_valEj_ me /usr/local/lib/python3.10/dist-packages/data/aie2p/lib +H/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/elongation
34
+ --mist1 -k64 --common 0_0-main_ me /usr/local/lib/python3.10/dist-packages/data/aie2p/lib +H/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/elongation -x
35
+ --showcolor -b -Obbl --common 0_0-main_ me /usr/local/lib/python3.10/dist-packages/data/aie2p/lib +H/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/elongation -x
36
+ --mist2 -D__AIENGINE__ -D__AIE_ARCH__=21 -DDEPLOYMENT_ELF=1 -D__LOCK_FENCE_MODE__=0 -D__IO_BUFFER_FORCE_LIGHT_WEIGHT__ -DAIE_API_EMULATE_BFLOAT16_MMUL_WITH_BFP16=1 -DAIE_OPTION_SCALAR_FLOAT_ON_VECTOR -D__tct_tgt__=241219 +Omod -k64 +Omsbr=100 +Opnll +A +pnopALU +pnopLDA +pnopLDB +pnopSTS +pnopVEC +Ofexm +Omsanafs +Onzmem +Onombt +Ochex +Omsmfi +Omslactc=lckLdaRsrc_E1,lckLdbRsrc_E1:2 +Odra +Oslr=crSRSSign +Oslr=crUPSMode +Oslr=crSRSMode +Oslr=crRnd +Oslr=crSat +Onop-syntax=NOPA +Onop-syntax=NOPB +Onop-syntax=NOPM +Onop-syntax=NOPV +Onop-syntax=NOPS +Onop-syntax=NOPX +Onop-syntax=NOPXM --common 0_0-main_ me /usr/local/lib/python3.10/dist-packages/data/aie2p/lib +H/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/elongation -x
37
+ ERROR: ld.so: object '/lib64/libudev.so.1' from LD_PRELOAD cannot be preloaded (cannot open shared object file): ignored.
38
+ ERROR: ld.so: object '/lib64/libudev.so.1' from LD_PRELOAD cannot be preloaded (cannot open shared object file): ignored.
39
+ Warning in "0_0/src/0_0.cc", line 37, column 12: in "0_0/src/0_0.cc", line 37: (loop #13)
40
+ loop software pipelining (to 8 cycles) is feasible but requires the creation of a post-amble,
41
+ for which the loop was not prepared
42
+ ... consider annotating the loop with `chess_prepare_for_pipelining'
43
+
44
+ Warning: in "0_0/src/0_0.cc", line 12: (loop #3)
45
+ Non leaf loop was prepared for pipelining. But the pipelined solutions have not been selected.
46
+ Consider removing the chess_prepare_for_pipelining directive as it may improve results
47
+ --tale -g -D__AIENGINE__ -D__AIE_ARCH__=21 -DDEPLOYMENT_ELF=1 -D__LOCK_FENCE_MODE__=0 -D__IO_BUFFER_FORCE_LIGHT_WEIGHT__ -DAIE_API_EMULATE_BFLOAT16_MMUL_WITH_BFP16=1 -DAIE_OPTION_SCALAR_FLOAT_ON_VECTOR -D__tct_tgt__=241219 -V0_0 -L --common 0_0-main_ me /usr/local/lib/python3.10/dist-packages/data/aie2p/lib +H/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/elongation -x
48
+ bridge -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/isg -i -g -I/usr/local/lib/python3.10/dist-packages/include -I/app/vaiml_1.3_examples/camo/./segmentation_1_4_0_fp32_combined/vaiml_par_0/0/backend -I/usr/local/lib/python3.10/site-packages/include/aie_api -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/common -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/include/common -I/usr/local/lib/python3.10/dist-packages/vitis_mllib -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/misc -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/src/ml_adf -I/app/vaiml_1.3_examples/camo/segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/. -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libcxx-lite/include -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libs/libcxx-9.0.0/include-lite -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime/include -D__AIENGINE__ -D__AIE_ARCH__=21 -DDEPLOYMENT_ELF=1 -D__LOCK_FENCE_MODE__=0 -D__IO_BUFFER_FORCE_LIGHT_WEIGHT__ -DAIE_API_EMULATE_BFLOAT16_MMUL_WITH_BFP16=1 -DAIE_OPTION_SCALAR_FLOAT_ON_VECTOR -D__tct_tgt__=241219 0_0.objlist -o../0_0.o -pme
49
+ ERROR: ld.so: object '/lib64/libudev.so.1' from LD_PRELOAD cannot be preloaded (cannot open shared object file): ignored.
50
+ darts -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib -d -h -I/usr/local/lib/python3.10/dist-packages/include -I/app/vaiml_1.3_examples/camo/./segmentation_1_4_0_fp32_combined/vaiml_par_0/0/backend -I/usr/local/lib/python3.10/site-packages/include/aie_api -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/common -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/include/common -I/usr/local/lib/python3.10/dist-packages/vitis_mllib -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/misc -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/src/ml_adf -I/app/vaiml_1.3_examples/camo/segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/. -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libcxx-lite/include -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libs/libcxx-9.0.0/include-lite -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime/include -D__AIENGINE__ -D__AIE_ARCH__=21 -DDEPLOYMENT_ELF=1 -D__LOCK_FENCE_MODE__=0 -D__IO_BUFFER_FORCE_LIGHT_WEIGHT__ -DAIE_API_EMULATE_BFLOAT16_MMUL_WITH_BFP16=1 -DAIE_OPTION_SCALAR_FLOAT_ON_VECTOR -D__tct_tgt__=241219 -L +Ihex +nanno ../Release/0_0.o me
51
+ ERROR: ld.so: object '/lib64/libudev.so.1' from LD_PRELOAD cannot be preloaded (cannot open shared object file): ignored.
52
+ Linking "../Release/0_0"
53
+ bridge -o../Release/0_0 ../Release/0_0.o -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/isg -g -I/usr/local/lib/python3.10/dist-packages/include -I/app/vaiml_1.3_examples/camo/./segmentation_1_4_0_fp32_combined/vaiml_par_0/0/backend -I/usr/local/lib/python3.10/site-packages/include/aie_api -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/common -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/include/common -I/usr/local/lib/python3.10/dist-packages/vitis_mllib -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/misc -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/src/ml_adf -I/app/vaiml_1.3_examples/camo/segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/. -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libcxx-lite/include -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libs/libcxx-9.0.0/include-lite -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime/include -D__AIENGINE__ -D__AIE_ARCH__=21 -DDEPLOYMENT_ELF=1 -D__LOCK_FENCE_MODE__=0 -D__IO_BUFFER_FORCE_LIGHT_WEIGHT__ -DAIE_API_EMULATE_BFLOAT16_MMUL_WITH_BFP16=1 -DAIE_OPTION_SCALAR_FLOAT_ON_VECTOR -D__tct_tgt__=241219 -c0_0.bcf -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/softfloat/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libcxx-lite/lib/Release_LLVM -lme -lc -lm -lc++lite -lsoftfloat -S -export-locals -iconfig extra_memories.bcf -yTM -m -fC -fS -fH +m -T +work ../Release/chesswork848 -pme
54
+ ERROR: ld.so: object '/lib64/libudev.so.1' from LD_PRELOAD cannot be preloaded (cannot open shared object file): ignored.
55
+ ERROR: ld.so: object '/lib64/libudev.so.1' from LD_PRELOAD cannot be preloaded (cannot open shared object file): ignored.
56
+ ERROR: ld.so: object '/lib64/libudev.so.1' from LD_PRELOAD cannot be preloaded (cannot open shared object file): ignored.
57
+ darts -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib -d -h -I/usr/local/lib/python3.10/dist-packages/include -I/app/vaiml_1.3_examples/camo/./segmentation_1_4_0_fp32_combined/vaiml_par_0/0/backend -I/usr/local/lib/python3.10/site-packages/include/aie_api -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/common -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/include/common -I/usr/local/lib/python3.10/dist-packages/vitis_mllib -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/misc -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/src/ml_adf -I/app/vaiml_1.3_examples/camo/segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/. -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libcxx-lite/include -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libs/libcxx-9.0.0/include-lite -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime/include -D__AIENGINE__ -D__AIE_ARCH__=21 -DDEPLOYMENT_ELF=1 -D__LOCK_FENCE_MODE__=0 -D__IO_BUFFER_FORCE_LIGHT_WEIGHT__ -DAIE_API_EMULATE_BFLOAT16_MMUL_WITH_BFP16=1 -DAIE_OPTION_SCALAR_FLOAT_ON_VECTOR -D__tct_tgt__=241219 -L +Ihex +nanno +u ../Release/0_0 me
58
+ ERROR: ld.so: object '/lib64/libudev.so.1' from LD_PRELOAD cannot be preloaded (cannot open shared object file): ignored.
59
+ Compilation finished successfully (19 errors, 3 warnings)
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0_reloadable0/0_0_reloadable0.log ADDED
The diff for this file is too large to render. See raw diff
 
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0_reloadable0/Release/0_0_reloadable0.# ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ a801722880b2a598cbddce60c4dbea1c96a45e2c
2
+ 1a735f496f1284ab86135ede88939a8aeeb375a3
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0_reloadable0/Release/0_0_reloadable0.## ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ 8ae2e4a70956e0d4852fb5c77bf78c97f18d259c
2
+ 92e103875c6a39bc8cdbe4a21c02c5a94ba3cc96
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0_reloadable0/Release/0_0_reloadable0.calltree ADDED
@@ -0,0 +1,98 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+
2
+ // File generated by bridge version V-2024.06#84922c0d9f#241219, Fri Mar 21 03:44:05 2025
3
+ // Copyright 2014-2024 Synopsys, Inc. All rights reserved.
4
+ // bridge -o../Release/0_0_reloadable0 ../Release/0_0_reloadable0.o -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/isg -g -I/usr/local/lib/python3.10/dist-packages/include -I/app/vaiml_1.3_examples/camo/./segmentation_1_4_0_fp32_combined/vaiml_par_0/0/backend -I/usr/local/lib/python3.10/site-packages/include/aie_api -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/common -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/include/common -I/usr/local/lib/python3.10/dist-packages/vitis_mllib -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/misc -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/src/ml_adf -I/app/vaiml_1.3_examples/camo/segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/. -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libcxx-lite/include -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libs/libcxx-9.0.0/include-lite -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime/include -D__AIENGINE__ -D__AIE_ARCH__=21 -DDEPLOYMENT_ELF=1 -D__LOCK_FENCE_MODE__=0 -D__IO_BUFFER_FORCE_LIGHT_WEIGHT__ -DAIE_API_EMULATE_BFLOAT16_MMUL_WITH_BFP16=1 -DAIE_OPTION_SCALAR_FLOAT_ON_VECTOR -D__tct_tgt__=241219 -c0_0_reloadable0.bcf -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/softfloat/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libcxx-lite/lib/Release_LLVM -lme -lc -lm -lc++lite -lsoftfloat -S -export-locals -iconfig extra_memories.bcf -yTM -m -fC -fS -fH +m -T +work ../Release/chesswork1033 -pme
5
+
6
+
7
+ // Release: ipp V-2024.06-TGT-241219
8
+
9
+ _Z13kernelWrapperPPvjjjj
10
+ _Z13_b881_wrapperPPv (referenced text)
11
+ _Z40superkernel_mul1d_attribute_broadcastingRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE
12
+ _ZN25elementwise_binary_sharedI8bfloat1626mul_impl_broadcasting_attrIS0_E15shared_params_tIS0_EL5act_t0EE5setupER27elementwise_binary_params_tIS4_EPKv
13
+ _ZN25elementwise_binary_sharedI8bfloat1626mul_impl_broadcasting_attrIS0_E15shared_params_tIS0_EL5act_t0EE21shared_setup_backboneER27elementwise_binary_params_tIS4_EPKv
14
+ _ZN25elementwise_binary_sharedI8bfloat1626mul_impl_broadcasting_attrIS0_E15shared_params_tIS0_EL5act_t0EE3runEPS0_S7_R27elementwise_binary_params_tIS4_E
15
+ _ZL19shared_run_backboneI8bfloat16L5act_t0EEKvPT_S4_S4_R27elementwise_binary_params_tI15shared_params_tIS3_EE
16
+ _Z13_b719_wrapperPPv (referenced text)
17
+ _ZN12mllib_graphs23transpose4d_adf_wrapperI8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_EEvRNS2_9io_bufferIT_NS2_9direction2inET0_EERNSD_ISE_NSF_3outET1_EERA5_Kj
18
+ _Z29setup_transposeshuffle_paramsI8bfloat16EvR23transposeshuffle_paramsRA5_Kj
19
+ _Z16transposeshuffleI8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_aS0_EEvPS1_S2_R23transposeshuffle_params
20
+ _Z13_b886_wrapperPPv (referenced text)
21
+ _Z17superkernel_add1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERNS0_IS1_NS2_3outESK_EE
22
+ _ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE5setupER27elementwise_binary_params_tIS5_EPKv
23
+ _ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE21shared_setup_backboneER27elementwise_binary_params_tIS5_EPKv
24
+ _ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE3runEPS0_S7_S7_R27elementwise_binary_params_tIS5_E
25
+ _ZL19shared_run_backboneI8bfloat16L5act_t0EEKvPT_S4_S4_R27elementwise_binary_params_tI15shared_params_tIS3_EE (*)
26
+ _Z13_b891_wrapperPPv (referenced text)
27
+ _Z17superkernel_mul1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERNS0_IS1_NS2_3outESK_EE
28
+ _ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS4_EPKv
29
+ _ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS4_E
30
+ _ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE3runEPS0_S6_S6_R27elementwise_binary_params_tIS4_E
31
+ _Z13_b896_wrapperPPv (referenced text)
32
+ _Z14conv2d_maxpoolRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEESF_RA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE
33
+ _Z24setup_conv2d_bf16_paramsILb1ELb0EEvPKjR18conv2d_bf16_paramshh
34
+ _Z11conv2d_bf16ILh1EL5act_t0E8bfloat16S1_S1_N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_NS3_IS5_NS6_5asyncES9_SB_EELb0ELb0ELb1ELb0EEvRNS2_9io_bufferIT1_NS2_9direction2inET4_EERNSF_IT2_SI_T5_EERNSF_IT3_NSH_3outET6_EER18conv2d_bf16_params
35
+ _Z21convert_bf16_to_bfp16I8bfloat16Lb0EEvPT_PS0_RK13BfToBfpParams
36
+ _Z13_b901_wrapperPPv (referenced text)
37
+ _Z40superkernel_add1d_attribute_broadcastingRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE
38
+ _ZN31elementwise_binary_broadcastingI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_EE5setupER27elementwise_binary_params_tIS5_EPKv
39
+ _ZN18elementwise_binaryIJ8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS5_EPKv
40
+ _ZN18elementwise_binaryIJ8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS5_E
41
+ _ZN31elementwise_binary_broadcastingI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_EE5setupER27elementwise_binary_params_tIS5_E
42
+ _ZN41elementwise_binary_attribute_broadcastingI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_EE3runEPS0_S7_R27elementwise_binary_params_tIS5_E
43
+ _ZN31elementwise_binary_broadcastingI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_EE3runEPS0_S7_S7_R27elementwise_binary_params_tIS5_E
44
+ _Z13_b906_wrapperPPv (referenced text)
45
+ _Z18superkernel_clip1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE
46
+ _ZN17elementwise_unaryI8bfloat1616elementwise_clipIS0_E20clip_internal_paramsIS0_EE5setupER26elementwise_unary_params_tIS4_EPKv
47
+ _ZN17elementwise_unaryI8bfloat1616elementwise_clipIS0_E20clip_internal_paramsIS0_EE3runEPS0_S6_R26elementwise_unary_params_tIS4_E
48
+
49
+
50
+ Call tree stack and functions sizes:
51
+
52
+ stack stack stack call func func function name
53
+ desc level level desc
54
+ ----- ----- ----- ----- ----- ----- --------------------------------------------------------------
55
+ 64 320 0 0 546 11410 _Z13kernelWrapperPPvjjjj
56
+ 0 256 1 1 32 1394 _Z13_b881_wrapperPPv
57
+ 64 256 1 2 488 1362 _Z40superkernel_mul1d_attribute_broadcastingRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE <tail call>
58
+ 64 64 2 3 74 190 _ZN25elementwise_binary_sharedI8bfloat1626mul_impl_broadcasting_attrIS0_E15shared_params_tIS0_EL5act_t0EE5setupER27elementwise_binary_params_tIS4_EPKv
59
+ 0 0 3 4 116 116 _ZN25elementwise_binary_sharedI8bfloat1626mul_impl_broadcasting_attrIS0_E15shared_params_tIS0_EL5act_t0EE21shared_setup_backboneER27elementwise_binary_params_tIS4_EPKv
60
+ 64 192 2 3 150 684 _ZN25elementwise_binary_sharedI8bfloat1626mul_impl_broadcasting_attrIS0_E15shared_params_tIS0_EL5act_t0EE3runEPS0_S7_R27elementwise_binary_params_tIS4_E
61
+ 128 128 3 4 534 534 _ZL19shared_run_backboneI8bfloat16L5act_t0EEKvPT_S4_S4_R27elementwise_binary_params_tI15shared_params_tIS3_EE
62
+ 0 64 1 1 32 682 _Z13_b719_wrapperPPv
63
+ 64 64 1 2 114 650 _ZN12mllib_graphs23transpose4d_adf_wrapperI8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_EEvRNS2_9io_bufferIT_NS2_9direction2inET0_EERNSD_ISE_NSF_3outET1_EERA5_Kj <tail call>
64
+ 0 0 2 3 74 74 _Z29setup_transposeshuffle_paramsI8bfloat16EvR23transposeshuffle_paramsRA5_Kj
65
+ 0 0 1 3 462 462 _Z16transposeshuffleI8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_aS0_EEvPS1_S2_R23transposeshuffle_params <tail call>
66
+ 0 192 1 1 36 1402 _Z13_b886_wrapperPPv
67
+ 64 192 1 2 602 1366 _Z17superkernel_add1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERNS0_IS1_NS2_3outESK_EE <tail call>
68
+ 64 64 2 3 98 214 _ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE5setupER27elementwise_binary_params_tIS5_EPKv
69
+ 0 0 3 4 116 116 _ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE21shared_setup_backboneER27elementwise_binary_params_tIS5_EPKv
70
+ 0 128 2 3 16 550 _ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE3runEPS0_S7_S7_R27elementwise_binary_params_tIS5_E
71
+ 128 128 2 4 534 534 _ZL19shared_run_backboneI8bfloat16L5act_t0EEKvPT_S4_S4_R27elementwise_binary_params_tI15shared_params_tIS3_EE <tail call>
72
+ 0 128 1 1 36 1092 _Z13_b891_wrapperPPv
73
+ 64 128 1 2 602 1056 _Z17superkernel_mul1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERNS0_IS1_NS2_3outESK_EE <tail call>
74
+ 64 64 2 3 138 162 _ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS4_EPKv
75
+ 0 0 3 4 24 24 _ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS4_E
76
+ 0 0 2 3 292 292 _ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE3runEPS0_S6_S6_R27elementwise_binary_params_tIS4_E
77
+ 0 192 1 1 36 4714 _Z13_b896_wrapperPPv
78
+ 64 192 1 2 568 4678 _Z14conv2d_maxpoolRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEESF_RA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE <tail call>
79
+ 64 64 2 3 1430 1430 _Z24setup_conv2d_bf16_paramsILb1ELb0EEvPKjR18conv2d_bf16_paramshh
80
+ 128 128 2 3 2410 2680 _Z11conv2d_bf16ILh1EL5act_t0E8bfloat16S1_S1_N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_NS3_IS5_NS6_5asyncES9_SB_EELb0ELb0ELb1ELb0EEvRNS2_9io_bufferIT1_NS2_9direction2inET4_EERNSF_IT2_SI_T5_EERNSF_IT3_NSH_3outET6_EER18conv2d_bf16_params
81
+ 0 0 3 4 270 270 _Z21convert_bf16_to_bfp16I8bfloat16Lb0EEvPT_PS0_RK13BfToBfpParams
82
+ 0 192 1 1 32 1252 _Z13_b901_wrapperPPv
83
+ 64 192 1 2 488 1220 _Z40superkernel_add1d_attribute_broadcastingRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE <tail call>
84
+ 64 128 2 3 62 304 _ZN31elementwise_binary_broadcastingI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_EE5setupER27elementwise_binary_params_tIS5_EPKv
85
+ 64 64 3 4 162 186 _ZN18elementwise_binaryIJ8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS5_EPKv
86
+ 0 0 4 5 24 24 _ZN18elementwise_binaryIJ8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS5_E
87
+ 0 0 2 4 56 56 _ZN31elementwise_binary_broadcastingI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_EE5setupER27elementwise_binary_params_tIS5_E <tail call>
88
+ 128 128 2 3 114 428 _ZN41elementwise_binary_attribute_broadcastingI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_EE3runEPS0_S7_R27elementwise_binary_params_tIS5_E
89
+ 0 0 3 4 314 314 _ZN31elementwise_binary_broadcastingI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_EE3runEPS0_S7_S7_R27elementwise_binary_params_tIS5_E
90
+ 0 64 1 1 32 862 _Z13_b906_wrapperPPv
91
+ 64 64 1 2 488 830 _Z18superkernel_clip1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE <tail call>
92
+ 0 0 2 3 100 100 _ZN17elementwise_unaryI8bfloat1616elementwise_clipIS0_E20clip_internal_paramsIS0_EE5setupER26elementwise_unary_params_tIS4_EPKv
93
+ 0 0 2 3 242 242 _ZN17elementwise_unaryI8bfloat1616elementwise_clipIS0_E20clip_internal_paramsIS0_EE3runEPS0_S6_R26elementwise_unary_params_tIS4_E
94
+
95
+
96
+ Maximum call level : 5
97
+ Maximum stack level: 4
98
+ Maximum stack size : 320
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0_reloadable0/Release/0_0_reloadable0.cmic2 ADDED
The diff for this file is too large to render. See raw diff
 
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0_reloadable0/Release/0_0_reloadable0.cmico ADDED
@@ -0,0 +1 @@
 
 
1
+ +Mdec
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0_reloadable0/Release/0_0_reloadable0.lst ADDED
The diff for this file is too large to render. See raw diff
 
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0_reloadable0/Release/0_0_reloadable0.map ADDED
@@ -0,0 +1,295 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+
2
+ // File generated by bridge version V-2024.06#84922c0d9f#241219, Fri Mar 21 03:44:06 2025
3
+ // Copyright 2014-2024 Synopsys, Inc. All rights reserved.
4
+ // bridge -o../Release/0_0_reloadable0 ../Release/0_0_reloadable0.o -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/isg -g -I/usr/local/lib/python3.10/dist-packages/include -I/app/vaiml_1.3_examples/camo/./segmentation_1_4_0_fp32_combined/vaiml_par_0/0/backend -I/usr/local/lib/python3.10/site-packages/include/aie_api -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/common -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/include/common -I/usr/local/lib/python3.10/dist-packages/vitis_mllib -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/misc -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/src/ml_adf -I/app/vaiml_1.3_examples/camo/segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/. -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libcxx-lite/include -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libs/libcxx-9.0.0/include-lite -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime/include -D__AIENGINE__ -D__AIE_ARCH__=21 -DDEPLOYMENT_ELF=1 -D__LOCK_FENCE_MODE__=0 -D__IO_BUFFER_FORCE_LIGHT_WEIGHT__ -DAIE_API_EMULATE_BFLOAT16_MMUL_WITH_BFP16=1 -DAIE_OPTION_SCALAR_FLOAT_ON_VECTOR -D__tct_tgt__=241219 -c0_0_reloadable0.bcf -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/softfloat/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libcxx-lite/lib/Release_LLVM -lme -lc -lm -lc++lite -lsoftfloat -S -export-locals -iconfig extra_memories.bcf -yTM -m -fC -fS -fH +m -T +work ../Release/chesswork1033 -pme
5
+
6
+ // Release: ipp V-2024.06-TGT-241219
7
+
8
+ Memory map for memory 'DM_stack':
9
+
10
+ Size = 1048576
11
+ Width = 8 bits
12
+ Offset = 0
13
+ Used = 2368
14
+
15
+ 0x0007bac0..0x0007c3ff ( 2368 items) : Stack
16
+
17
+ Memory map for memory 'DMb':
18
+
19
+ Size = 1048576
20
+ Width = 8 bits
21
+ Offset = 0
22
+ Used = 3265
23
+
24
+ 0x00000000..0x0007babf ( 506560 items) : Reserved
25
+ 0x0007bac0..0x0007c3ff ( 2368 items) : Stack
26
+ 0x0007c400..0x0007c43f ( 64 items) : Reserved
27
+ 0x0007c440..0x0007c443 ( 4 items) : ../Release/0_0_reloadable0.o::_ZL9curr_iter (Data, Local, .bss.DMb.4)
28
+ 0x0007c444..0x0007c447 ( 4 items) : ../Release/0_0_reloadable0.o::_ZL14num_depth_iter (Data, Local, .bss.DMb.4)
29
+ 0x0007c448..0x0007c44b ( 4 items) : ../Release/0_0_reloadable0.o::_ZL10depth_iter (Data, Local, .bss.DMb.4)
30
+ 0x0007c44c..0x0007c44f ( 4 items) : ../Release/0_0_reloadable0.o::_ZL11total_iters (Data, Local, .bss.DMb.4)
31
+ 0x0007c450..0x0007c453 ( 4 items) : ../Release/0_0_reloadable0.o::_ZL8core_row (Data, Local, .bss.DMb.4)
32
+ 0x0007c454..0x0007c457 ( 4 items) : ../Release/0_0_reloadable0.o::_ZL11ifm1_offset (Data, Local, .bss.DMb.4)
33
+ 0x0007c458..0x0007c45b ( 4 items) : ../Release/0_0_reloadable0.o::_ZL11ifm2_offset (Data, Local, .bss.DMb.4)
34
+ 0x0007c45c..0x0007c45f ( 4 items) : ../Release/0_0_reloadable0.o::_ZL8num_iter (Data, Local, .data.DMb.4)
35
+ 0x0007c460..0x0007c463 ( 4 items) : me_defs.o(/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/Release/libme.a)::_ZN12me_primitive11control_satE (Data, Global, .bss.DMb.4)
36
+ 0x0007c464..0x0007c464 ( 1 items) : me_defs.o(/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/Release/libme.a)::_ZN12me_primitive11control_rndE (Data, Global, .bss.DMb.1)
37
+ 0x0007c480..0x0007c49b ( 28 items) : ../Release/0_0_reloadable0.o::_ZL20g_uniformKernelFuncs (Data, Local, .rodata.DMb.64)
38
+
39
+ Called functions : _Z13_b881_wrapperPPv
40
+ _Z13_b719_wrapperPPv
41
+ _Z13_b886_wrapperPPv
42
+ _Z13_b891_wrapperPPv
43
+ _Z13_b896_wrapperPPv
44
+ _Z13_b901_wrapperPPv
45
+ _Z13_b906_wrapperPPv
46
+
47
+ 0x0007c4c0..0x0007c4ff ( 64 items) : ../Release/0_0_reloadable0.o::_ZZN12mllib_graphs23transpose4d_adf_wrapperI8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_EEvRNS2_9io_bufferIT_NS2_9direction2inET0_EERNSD_ISE_NSF_3outET1_EERA5_KjE6params (Data, Weak, .bss.DMb.64)
48
+ 0x0007c500..0x0007c53f ( 64 items) : ../Release/0_0_reloadable0.o::add1d_attribute_broadcasting_params (Data, Global, .bss.DMb.64)
49
+ 0x0007c540..0x0007c57f ( 64 items) : ../Release/0_0_reloadable0.o::mul1d_attribute_broadcasting_params (Data, Global, .bss.DMb.64)
50
+ 0x0007c580..0x0007c5bf ( 64 items) : ../Release/0_0_reloadable0.o::add1d_params (Data, Global, .bss.DMb.64)
51
+ 0x0007c5c0..0x0007c5ff ( 64 items) : ../Release/0_0_reloadable0.o::mul1d_params (Data, Global, .bss.DMb.64)
52
+ 0x0007c600..0x0007c63f ( 64 items) : ../Release/0_0_reloadable0.o::clip1d_params (Data, Global, .bss.DMb.64)
53
+ 0x0007c640..0x0007c7ff ( 448 items) : ../Release/0_0_reloadable0.o::conv2d_params (Data, Global, .bss.DMb.64)
54
+ 0x0007ccc0..0x000fffff ( 537408 items) : Reserved
55
+
56
+ Memory map for memory 'PM':
57
+
58
+ Size = 1048576
59
+ Width = 8 bits
60
+ Offset = 0
61
+ Used = 11410
62
+
63
+ 0x00000000..0x0000092f ( 2352 items) : Reserved
64
+ 0x00000930..0x00000b51 ( 546 items) : ../Release/0_0_reloadable0.o::_Z13kernelWrapperPPvjjjj (Function, Global, .text) (stack frame size = 64)
65
+
66
+ Referenced symbols: _ZL20g_uniformKernelFuncs
67
+
68
+ 0x00000b60..0x000010f5 ( 1430 items) : ../Release/0_0_reloadable0.o::_Z24setup_conv2d_bf16_paramsILb1ELb0EEvPKjR18conv2d_bf16_paramshh (Function, Weak, .text) (stack frame size = 64)
69
+ 0x00001100..0x0000120d ( 270 items) : ../Release/0_0_reloadable0.o::_Z21convert_bf16_to_bfp16I8bfloat16Lb0EEvPT_PS0_RK13BfToBfpParams (Function, Weak, .text) (stack frame size = 0)
70
+
71
+ Referenced symbols: _ZN12me_primitive11control_rndE
72
+
73
+ 0x00001210..0x00001b79 ( 2410 items) : ../Release/0_0_reloadable0.o::_Z11conv2d_bf16ILh1EL5act_t0E8bfloat16S1_S1_N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_NS3_IS5_NS6_5asyncES9_SB_EELb0ELb0ELb1ELb0EEvRNS2_9io_bufferIT1_NS2_9direction2inET4_EERNSF_IT2_SI_T5_EERNSF_IT3_NSH_3outET6_EER18conv2d_bf16_params (Function, Weak, .text) (stack frame size = 128)
74
+
75
+ Called functions : _Z21convert_bf16_to_bfp16I8bfloat16Lb0EEvPT_PS0_RK13BfToBfpParams
76
+
77
+ Referenced symbols: _ZN12me_primitive11control_rndE
78
+
79
+ 0x00001b80..0x00001db7 ( 568 items) : ../Release/0_0_reloadable0.o::_Z14conv2d_maxpoolRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEESF_RA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE (Function, Global, .text) (stack frame size = 64)
80
+
81
+ Called functions : _Z24setup_conv2d_bf16_paramsILb1ELb0EEvPKjR18conv2d_bf16_paramshh
82
+ _Z11conv2d_bf16ILh1EL5act_t0E8bfloat16S1_S1_N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_NS3_IS5_NS6_5asyncES9_SB_EELb0ELb0ELb1ELb0EEvRNS2_9io_bufferIT1_NS2_9direction2inET4_EERNSF_IT2_SI_T5_EERNSF_IT3_NSH_3outET6_EER18conv2d_bf16_params
83
+
84
+ Referenced symbols: _ZL9curr_iter
85
+ conv2d_params
86
+ _ZN12me_primitive11control_rndE
87
+ _ZN12me_primitive11control_satE
88
+ _ZL14num_depth_iter
89
+ _ZL8num_iter
90
+ _ZL10depth_iter
91
+ _ZL11total_iters
92
+
93
+ 0x00001dc0..0x00001dd7 ( 24 items) : ../Release/0_0_reloadable0.o::_ZN18elementwise_binaryIJ8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS5_E (Function, Weak, .text) (stack frame size = 0)
94
+ 0x00001de0..0x00001e81 ( 162 items) : ../Release/0_0_reloadable0.o::_ZN18elementwise_binaryIJ8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS5_EPKv (Function, Weak, .text) (stack frame size = 64)
95
+
96
+ Called functions : _ZN18elementwise_binaryIJ8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS5_E
97
+
98
+ 0x00001e90..0x00001ec7 ( 56 items) : ../Release/0_0_reloadable0.o::_ZN31elementwise_binary_broadcastingI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_EE5setupER27elementwise_binary_params_tIS5_E (Function, Weak, .text) (stack frame size = 0)
99
+ 0x00001ed0..0x00001f0d ( 62 items) : ../Release/0_0_reloadable0.o::_ZN31elementwise_binary_broadcastingI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_EE5setupER27elementwise_binary_params_tIS5_EPKv (Function, Weak, .text) (stack frame size = 64)
100
+
101
+ Called functions : _ZN18elementwise_binaryIJ8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS5_EPKv
102
+ _ZN31elementwise_binary_broadcastingI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_EE5setupER27elementwise_binary_params_tIS5_E
103
+
104
+ 0x00001f10..0x00002049 ( 314 items) : ../Release/0_0_reloadable0.o::_ZN31elementwise_binary_broadcastingI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_EE3runEPS0_S7_S7_R27elementwise_binary_params_tIS5_E (Function, Weak, .text) (stack frame size = 0)
105
+
106
+ Referenced symbols: _ZN12me_primitive11control_rndE
107
+
108
+ 0x00002050..0x000020c1 ( 114 items) : ../Release/0_0_reloadable0.o::_ZN41elementwise_binary_attribute_broadcastingI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_EE3runEPS0_S7_R27elementwise_binary_params_tIS5_E (Function, Weak, .text) (stack frame size = 128)
109
+
110
+ Called functions : _ZN31elementwise_binary_broadcastingI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_EE3runEPS0_S7_S7_R27elementwise_binary_params_tIS5_E
111
+
112
+ 0x000020d0..0x000022b7 ( 488 items) : ../Release/0_0_reloadable0.o::_Z40superkernel_add1d_attribute_broadcastingRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE (Function, Global, .text) (stack frame size = 64)
113
+
114
+ Called functions : _ZN31elementwise_binary_broadcastingI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_EE5setupER27elementwise_binary_params_tIS5_EPKv
115
+ _ZN41elementwise_binary_attribute_broadcastingI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_EE3runEPS0_S7_R27elementwise_binary_params_tIS5_E
116
+
117
+ Referenced symbols: _ZL9curr_iter
118
+ _ZL8core_row
119
+ add1d_attribute_broadcasting_params
120
+ _ZN12me_primitive11control_rndE
121
+ _ZN12me_primitive11control_satE
122
+ _ZL11ifm1_offset
123
+ _ZL8num_iter
124
+
125
+ 0x000022c0..0x00002323 ( 100 items) : ../Release/0_0_reloadable0.o::_ZN17elementwise_unaryI8bfloat1616elementwise_clipIS0_E20clip_internal_paramsIS0_EE5setupER26elementwise_unary_params_tIS4_EPKv (Function, Weak, .text) (stack frame size = 0)
126
+ 0x00002330..0x00002421 ( 242 items) : ../Release/0_0_reloadable0.o::_ZN17elementwise_unaryI8bfloat1616elementwise_clipIS0_E20clip_internal_paramsIS0_EE3runEPS0_S6_R26elementwise_unary_params_tIS4_E (Function, Weak, .text) (stack frame size = 0)
127
+ 0x00002430..0x00002617 ( 488 items) : ../Release/0_0_reloadable0.o::_Z18superkernel_clip1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE (Function, Global, .text) (stack frame size = 64)
128
+
129
+ Called functions : _ZN17elementwise_unaryI8bfloat1616elementwise_clipIS0_E20clip_internal_paramsIS0_EE5setupER26elementwise_unary_params_tIS4_EPKv
130
+ _ZN17elementwise_unaryI8bfloat1616elementwise_clipIS0_E20clip_internal_paramsIS0_EE3runEPS0_S6_R26elementwise_unary_params_tIS4_E
131
+
132
+ Referenced symbols: _ZL9curr_iter
133
+ _ZL8core_row
134
+ clip1d_params
135
+ _ZN12me_primitive11control_rndE
136
+ _ZN12me_primitive11control_satE
137
+ _ZL11ifm1_offset
138
+ _ZL8num_iter
139
+
140
+ 0x00002620..0x00002693 ( 116 items) : ../Release/0_0_reloadable0.o::_ZN25elementwise_binary_sharedI8bfloat1626mul_impl_broadcasting_attrIS0_E15shared_params_tIS0_EL5act_t0EE21shared_setup_backboneER27elementwise_binary_params_tIS4_EPKv (Function, Weak, .text) (stack frame size = 0)
141
+ 0x000026a0..0x000026e9 ( 74 items) : ../Release/0_0_reloadable0.o::_ZN25elementwise_binary_sharedI8bfloat1626mul_impl_broadcasting_attrIS0_E15shared_params_tIS0_EL5act_t0EE5setupER27elementwise_binary_params_tIS4_EPKv (Function, Weak, .text) (stack frame size = 64)
142
+
143
+ Called functions : _ZN25elementwise_binary_sharedI8bfloat1626mul_impl_broadcasting_attrIS0_E15shared_params_tIS0_EL5act_t0EE21shared_setup_backboneER27elementwise_binary_params_tIS4_EPKv
144
+
145
+ 0x000026f0..0x00002905 ( 534 items) : ../Release/0_0_reloadable0.o::_ZL19shared_run_backboneI8bfloat16L5act_t0EEKvPT_S4_S4_R27elementwise_binary_params_tI15shared_params_tIS3_EE (Function, Local, .text) (stack frame size = 128)
146
+
147
+ Referenced symbols: _ZN12me_primitive11control_rndE
148
+
149
+ 0x00002910..0x000029a5 ( 150 items) : ../Release/0_0_reloadable0.o::_ZN25elementwise_binary_sharedI8bfloat1626mul_impl_broadcasting_attrIS0_E15shared_params_tIS0_EL5act_t0EE3runEPS0_S7_R27elementwise_binary_params_tIS4_E (Function, Weak, .text) (stack frame size = 64)
150
+
151
+ Called functions : _ZL19shared_run_backboneI8bfloat16L5act_t0EEKvPT_S4_S4_R27elementwise_binary_params_tI15shared_params_tIS3_EE
152
+
153
+ 0x000029b0..0x00002b97 ( 488 items) : ../Release/0_0_reloadable0.o::_Z40superkernel_mul1d_attribute_broadcastingRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE (Function, Global, .text) (stack frame size = 64)
154
+
155
+ Called functions : _ZN25elementwise_binary_sharedI8bfloat1626mul_impl_broadcasting_attrIS0_E15shared_params_tIS0_EL5act_t0EE5setupER27elementwise_binary_params_tIS4_EPKv
156
+ _ZN25elementwise_binary_sharedI8bfloat1626mul_impl_broadcasting_attrIS0_E15shared_params_tIS0_EL5act_t0EE3runEPS0_S7_R27elementwise_binary_params_tIS4_E
157
+
158
+ Referenced symbols: _ZL9curr_iter
159
+ _ZL8core_row
160
+ mul1d_attribute_broadcasting_params
161
+ _ZN12me_primitive11control_rndE
162
+ _ZN12me_primitive11control_satE
163
+ _ZL11ifm1_offset
164
+ _ZL8num_iter
165
+
166
+ 0x00002ba0..0x00002c13 ( 116 items) : ../Release/0_0_reloadable0.o::_ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE21shared_setup_backboneER27elementwise_binary_params_tIS5_EPKv (Function, Weak, .text) (stack frame size = 0)
167
+ 0x00002c20..0x00002c81 ( 98 items) : ../Release/0_0_reloadable0.o::_ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE5setupER27elementwise_binary_params_tIS5_EPKv (Function, Weak, .text) (stack frame size = 64)
168
+
169
+ Called functions : _ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE21shared_setup_backboneER27elementwise_binary_params_tIS5_EPKv
170
+
171
+ 0x00002c90..0x00002c9f ( 16 items) : ../Release/0_0_reloadable0.o::_ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE3runEPS0_S7_S7_R27elementwise_binary_params_tIS5_E (Function, Weak, .text) (stack frame size = 0)
172
+
173
+ Called functions : _ZL19shared_run_backboneI8bfloat16L5act_t0EEKvPT_S4_S4_R27elementwise_binary_params_tI15shared_params_tIS3_EE
174
+
175
+ 0x00002ca0..0x00002ef9 ( 602 items) : ../Release/0_0_reloadable0.o::_Z17superkernel_add1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERNS0_IS1_NS2_3outESK_EE (Function, Global, .text) (stack frame size = 64)
176
+
177
+ Called functions : _ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE5setupER27elementwise_binary_params_tIS5_EPKv
178
+ _ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE3runEPS0_S7_S7_R27elementwise_binary_params_tIS5_E
179
+
180
+ Referenced symbols: _ZL9curr_iter
181
+ _ZL8core_row
182
+ add1d_params
183
+ _ZN12me_primitive11control_rndE
184
+ _ZN12me_primitive11control_satE
185
+ _ZL11ifm1_offset
186
+ _ZL11ifm2_offset
187
+ _ZL8num_iter
188
+
189
+ 0x00002f00..0x00002f17 ( 24 items) : ../Release/0_0_reloadable0.o::_ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS4_E (Function, Weak, .text) (stack frame size = 0)
190
+ 0x00002f20..0x00002fa9 ( 138 items) : ../Release/0_0_reloadable0.o::_ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS4_EPKv (Function, Weak, .text) (stack frame size = 64)
191
+
192
+ Called functions : _ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS4_E
193
+
194
+ 0x00002fb0..0x000030d3 ( 292 items) : ../Release/0_0_reloadable0.o::_ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE3runEPS0_S6_S6_R27elementwise_binary_params_tIS4_E (Function, Weak, .text) (stack frame size = 0)
195
+
196
+ Referenced symbols: _ZN12me_primitive11control_rndE
197
+
198
+ 0x000030e0..0x00003339 ( 602 items) : ../Release/0_0_reloadable0.o::_Z17superkernel_mul1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERNS0_IS1_NS2_3outESK_EE (Function, Global, .text) (stack frame size = 64)
199
+
200
+ Called functions : _ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS4_EPKv
201
+ _ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE3runEPS0_S6_S6_R27elementwise_binary_params_tIS4_E
202
+
203
+ Referenced symbols: _ZL9curr_iter
204
+ _ZL8core_row
205
+ mul1d_params
206
+ _ZN12me_primitive11control_rndE
207
+ _ZN12me_primitive11control_satE
208
+ _ZL11ifm1_offset
209
+ _ZL11ifm2_offset
210
+ _ZL8num_iter
211
+
212
+ 0x00003340..0x0000335f ( 32 items) : ../Release/0_0_reloadable0.o::_Z13_b881_wrapperPPv (Function, Global, .text) (stack frame size = 0)
213
+
214
+ Called functions : _Z40superkernel_mul1d_attribute_broadcastingRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE
215
+
216
+ 0x00003360..0x000033a9 ( 74 items) : ../Release/0_0_reloadable0.o::_Z29setup_transposeshuffle_paramsI8bfloat16EvR23transposeshuffle_paramsRA5_Kj (Function, Weak, .text) (stack frame size = 0)
217
+ 0x000033b0..0x0000357d ( 462 items) : ../Release/0_0_reloadable0.o::_Z16transposeshuffleI8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_aS0_EEvPS1_S2_R23transposeshuffle_params (Function, Weak, .text) (stack frame size = 0)
218
+ 0x00003580..0x000035f1 ( 114 items) : ../Release/0_0_reloadable0.o::_ZN12mllib_graphs23transpose4d_adf_wrapperI8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_EEvRNS2_9io_bufferIT_NS2_9direction2inET0_EERNSD_ISE_NSF_3outET1_EERA5_Kj (Function, Weak, .text) (stack frame size = 64)
219
+
220
+ Called functions : _Z29setup_transposeshuffle_paramsI8bfloat16EvR23transposeshuffle_paramsRA5_Kj
221
+ _Z16transposeshuffleI8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_aS0_EEvPS1_S2_R23transposeshuffle_params
222
+
223
+ Referenced symbols: _ZZN12mllib_graphs23transpose4d_adf_wrapperI8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_EEvRNS2_9io_bufferIT_NS2_9direction2inET0_EERNSD_ISE_NSF_3outET1_EERA5_KjE6params
224
+
225
+ 0x00003600..0x0000361f ( 32 items) : ../Release/0_0_reloadable0.o::_Z13_b719_wrapperPPv (Function, Global, .text) (stack frame size = 0)
226
+
227
+ Called functions : _ZN12mllib_graphs23transpose4d_adf_wrapperI8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_EEvRNS2_9io_bufferIT_NS2_9direction2inET0_EERNSD_ISE_NSF_3outET1_EERA5_Kj
228
+
229
+ 0x00003620..0x00003643 ( 36 items) : ../Release/0_0_reloadable0.o::_Z13_b886_wrapperPPv (Function, Global, .text) (stack frame size = 0)
230
+
231
+ Called functions : _Z17superkernel_add1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERNS0_IS1_NS2_3outESK_EE
232
+
233
+ 0x00003650..0x00003673 ( 36 items) : ../Release/0_0_reloadable0.o::_Z13_b891_wrapperPPv (Function, Global, .text) (stack frame size = 0)
234
+
235
+ Called functions : _Z17superkernel_mul1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERNS0_IS1_NS2_3outESK_EE
236
+
237
+ 0x00003680..0x000036a3 ( 36 items) : ../Release/0_0_reloadable0.o::_Z13_b896_wrapperPPv (Function, Global, .text) (stack frame size = 0)
238
+
239
+ Called functions : _Z14conv2d_maxpoolRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEESF_RA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE
240
+
241
+ 0x000036b0..0x000036cf ( 32 items) : ../Release/0_0_reloadable0.o::_Z13_b901_wrapperPPv (Function, Global, .text) (stack frame size = 0)
242
+
243
+ Called functions : _Z40superkernel_add1d_attribute_broadcastingRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE
244
+
245
+ 0x000036d0..0x000036ef ( 32 items) : ../Release/0_0_reloadable0.o::_Z13_b906_wrapperPPv (Function, Global, .text) (stack frame size = 0)
246
+
247
+ Called functions : _Z18superkernel_clip1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE
248
+
249
+
250
+ External symbols:
251
+
252
+ __dso_handle = 0x0
253
+ _ctors_end = 0x0
254
+ _ctors_start = 0x0
255
+ _dtors_end = 0x0
256
+ _dtors_start = 0x0
257
+ _pc_end = 0x36f0
258
+ _pc_start = 0x930
259
+ _sp_end_DM_stack = 0x7c400
260
+ _sp_start_DM_stack = 0x7bac0
261
+
262
+ Section summary for memory 'DM_stack':
263
+
264
+ .stack File
265
+ ---------- ----------
266
+ 2368
267
+ ---------- ----------
268
+ 2368 Total
269
+
270
+ Section summary for memory 'DMb':
271
+
272
+ .bss .data .rodata File
273
+ ---------- ---------- ---------- ----------
274
+ 860 4 28 ../Release/0_0_reloadable0.o
275
+ 5 0 0 me_defs.o(/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/Release/libme.a)
276
+ ---------- ---------- ---------- ----------
277
+ 865 4 28 Total
278
+
279
+ Section summary for memory 'PM':
280
+
281
+ .text File
282
+ ---------- ----------
283
+ 11410 ../Release/0_0_reloadable0.o
284
+ ---------- ----------
285
+ 11410 Total
286
+
287
+ File summary:
288
+
289
+ ../Release/0_0_reloadable0.o
290
+ DMb 892
291
+ PM 11410
292
+
293
+ me_defs.o(/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/Release/libme.a)
294
+ DMb 5
295
+
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0_reloadable0/Release/0_0_reloadable0.o.lst ADDED
The diff for this file is too large to render. See raw diff
 
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0_reloadable0/Release/0_0_reloadable0.sdr ADDED
@@ -0,0 +1,129 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+
2
+ // File generated by bridge version V-2024.06#84922c0d9f#241219, Fri Mar 21 03:44:06 2025
3
+ // Copyright 2014-2024 Synopsys, Inc. All rights reserved.
4
+ // bridge -o../Release/0_0_reloadable0 ../Release/0_0_reloadable0.o -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/isg -g -I/usr/local/lib/python3.10/dist-packages/include -I/app/vaiml_1.3_examples/camo/./segmentation_1_4_0_fp32_combined/vaiml_par_0/0/backend -I/usr/local/lib/python3.10/site-packages/include/aie_api -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/common -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/include/common -I/usr/local/lib/python3.10/dist-packages/vitis_mllib -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/misc -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/src/ml_adf -I/app/vaiml_1.3_examples/camo/segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/. -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libcxx-lite/include -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libs/libcxx-9.0.0/include-lite -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime/include -D__AIENGINE__ -D__AIE_ARCH__=21 -DDEPLOYMENT_ELF=1 -D__LOCK_FENCE_MODE__=0 -D__IO_BUFFER_FORCE_LIGHT_WEIGHT__ -DAIE_API_EMULATE_BFLOAT16_MMUL_WITH_BFP16=1 -DAIE_OPTION_SCALAR_FLOAT_ON_VECTOR -D__tct_tgt__=241219 -c0_0_reloadable0.bcf -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/softfloat/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libcxx-lite/lib/Release_LLVM -lme -lc -lm -lc++lite -lsoftfloat -S -export-locals -iconfig extra_memories.bcf -yTM -m -fC -fS -fH +m -T +work ../Release/chesswork1033 -pme
5
+
6
+ // Release: ipp V-2024.06-TGT-241219
7
+
8
+ // Symbols in memory 'DM_bankA':
9
+ // Symbols in memory 'DM_bankAB':
10
+ // Symbols in memory 'DM_bankAC':
11
+ // Symbols in memory 'DM_bankAD':
12
+ // Symbols in memory 'DM_bankB':
13
+ // Symbols in memory 'DM_bankBC':
14
+ // Symbols in memory 'DM_bankBD':
15
+ // Symbols in memory 'DM_bankC':
16
+ // Symbols in memory 'DM_bankCD':
17
+ // Symbols in memory 'DM_bankD':
18
+ // Symbols in memory 'DM_stack':
19
+ // Symbols in memory 'DM_test':
20
+ // Symbols in memory 'DMb':
21
+ _symbol _ZN12me_primitive11control_satE 0x0007c460
22
+ _symbol _ZN12me_primitive11control_rndE 0x0007c464
23
+ _symbol _ZZN12mllib_graphs23transpose4d_adf_wrapperI8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_EEvRNS2_9io_bufferIT_NS2_9direction2inET0_EERNSD_ISE_NSF_3outET1_EERA5_KjE6params 0x0007c4c0
24
+ _symbol add1d_attribute_broadcasting_params 0x0007c500
25
+ _symbol mul1d_attribute_broadcasting_params 0x0007c540
26
+ _symbol add1d_params 0x0007c580
27
+ _symbol mul1d_params 0x0007c5c0
28
+ _symbol clip1d_params 0x0007c600
29
+ _symbol conv2d_params 0x0007c640
30
+ // Symbols in memory 'DMh':
31
+ // Symbols in memory 'DMh_bankA':
32
+ // Symbols in memory 'DMh_bankAB':
33
+ // Symbols in memory 'DMh_bankAC':
34
+ // Symbols in memory 'DMh_bankAD':
35
+ // Symbols in memory 'DMh_bankB':
36
+ // Symbols in memory 'DMh_bankBC':
37
+ // Symbols in memory 'DMh_bankBD':
38
+ // Symbols in memory 'DMh_bankC':
39
+ // Symbols in memory 'DMh_bankCD':
40
+ // Symbols in memory 'DMh_bankD':
41
+ // Symbols in memory 'DMh_stack':
42
+ // Symbols in memory 'DMs':
43
+ // Symbols in memory 'DMs_bankA':
44
+ // Symbols in memory 'DMs_bankAB':
45
+ // Symbols in memory 'DMs_bankAC':
46
+ // Symbols in memory 'DMs_bankAD':
47
+ // Symbols in memory 'DMs_bankB':
48
+ // Symbols in memory 'DMs_bankBC':
49
+ // Symbols in memory 'DMs_bankBD':
50
+ // Symbols in memory 'DMs_bankC':
51
+ // Symbols in memory 'DMs_bankCD':
52
+ // Symbols in memory 'DMs_bankD':
53
+ // Symbols in memory 'DMs_stack':
54
+ // Symbols in memory 'DMv':
55
+ // Symbols in memory 'DMv_bankA':
56
+ // Symbols in memory 'DMv_bankAB':
57
+ // Symbols in memory 'DMv_bankAC':
58
+ // Symbols in memory 'DMv_bankAD':
59
+ // Symbols in memory 'DMv_bankB':
60
+ // Symbols in memory 'DMv_bankBC':
61
+ // Symbols in memory 'DMv_bankBD':
62
+ // Symbols in memory 'DMv_bankC':
63
+ // Symbols in memory 'DMv_bankCD':
64
+ // Symbols in memory 'DMv_bankD':
65
+ // Symbols in memory 'DMv_stack':
66
+ // Symbols in memory 'DMw':
67
+ // Symbols in memory 'DMw_bankA':
68
+ // Symbols in memory 'DMw_bankAB':
69
+ // Symbols in memory 'DMw_bankAC':
70
+ // Symbols in memory 'DMw_bankAD':
71
+ // Symbols in memory 'DMw_bankB':
72
+ // Symbols in memory 'DMw_bankBC':
73
+ // Symbols in memory 'DMw_bankBD':
74
+ // Symbols in memory 'DMw_bankC':
75
+ // Symbols in memory 'DMw_bankCD':
76
+ // Symbols in memory 'DMw_bankD':
77
+ // Symbols in memory 'DMw_stack':
78
+ // Symbols in memory 'DMx':
79
+ // Symbols in memory 'DMx_bankA':
80
+ // Symbols in memory 'DMx_bankAB':
81
+ // Symbols in memory 'DMx_bankAC':
82
+ // Symbols in memory 'DMx_bankAD':
83
+ // Symbols in memory 'DMx_bankB':
84
+ // Symbols in memory 'DMx_bankBC':
85
+ // Symbols in memory 'DMx_bankBD':
86
+ // Symbols in memory 'DMx_bankC':
87
+ // Symbols in memory 'DMx_bankCD':
88
+ // Symbols in memory 'DMx_bankD':
89
+ // Symbols in memory 'DMx_stack':
90
+ // Symbols in memory 'PM':
91
+ _symbol _Z13kernelWrapperPPvjjjj 0x00000930
92
+ _symbol _Z24setup_conv2d_bf16_paramsILb1ELb0EEvPKjR18conv2d_bf16_paramshh 0x00000b60
93
+ _symbol _Z21convert_bf16_to_bfp16I8bfloat16Lb0EEvPT_PS0_RK13BfToBfpParams 0x00001100
94
+ _symbol _Z11conv2d_bf16ILh1EL5act_t0E8bfloat16S1_S1_N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_NS3_IS5_NS6_5asyncES9_SB_EELb0ELb0ELb1ELb0EEvRNS2_9io_bufferIT1_NS2_9direction2inET4_EERNSF_IT2_SI_T5_EERNSF_IT3_NSH_3outET6_EER18conv2d_bf16_params 0x00001210
95
+ _symbol _Z14conv2d_maxpoolRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEESF_RA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE 0x00001b80
96
+ _symbol _ZN18elementwise_binaryIJ8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS5_E 0x00001dc0
97
+ _symbol _ZN18elementwise_binaryIJ8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS5_EPKv 0x00001de0
98
+ _symbol _ZN31elementwise_binary_broadcastingI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_EE5setupER27elementwise_binary_params_tIS5_E 0x00001e90
99
+ _symbol _ZN31elementwise_binary_broadcastingI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_EE5setupER27elementwise_binary_params_tIS5_EPKv 0x00001ed0
100
+ _symbol _ZN31elementwise_binary_broadcastingI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_EE3runEPS0_S7_S7_R27elementwise_binary_params_tIS5_E 0x00001f10
101
+ _symbol _ZN41elementwise_binary_attribute_broadcastingI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_EE3runEPS0_S7_R27elementwise_binary_params_tIS5_E 0x00002050
102
+ _symbol _Z40superkernel_add1d_attribute_broadcastingRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE 0x000020d0
103
+ _symbol _ZN17elementwise_unaryI8bfloat1616elementwise_clipIS0_E20clip_internal_paramsIS0_EE5setupER26elementwise_unary_params_tIS4_EPKv 0x000022c0
104
+ _symbol _ZN17elementwise_unaryI8bfloat1616elementwise_clipIS0_E20clip_internal_paramsIS0_EE3runEPS0_S6_R26elementwise_unary_params_tIS4_E 0x00002330
105
+ _symbol _Z18superkernel_clip1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE 0x00002430
106
+ _symbol _ZN25elementwise_binary_sharedI8bfloat1626mul_impl_broadcasting_attrIS0_E15shared_params_tIS0_EL5act_t0EE21shared_setup_backboneER27elementwise_binary_params_tIS4_EPKv 0x00002620
107
+ _symbol _ZN25elementwise_binary_sharedI8bfloat1626mul_impl_broadcasting_attrIS0_E15shared_params_tIS0_EL5act_t0EE5setupER27elementwise_binary_params_tIS4_EPKv 0x000026a0
108
+ _symbol _ZN25elementwise_binary_sharedI8bfloat1626mul_impl_broadcasting_attrIS0_E15shared_params_tIS0_EL5act_t0EE3runEPS0_S7_R27elementwise_binary_params_tIS4_E 0x00002910
109
+ _symbol _Z40superkernel_mul1d_attribute_broadcastingRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE 0x000029b0
110
+ _symbol _ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE21shared_setup_backboneER27elementwise_binary_params_tIS5_EPKv 0x00002ba0
111
+ _symbol _ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE5setupER27elementwise_binary_params_tIS5_EPKv 0x00002c20
112
+ _symbol _ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE3runEPS0_S7_S7_R27elementwise_binary_params_tIS5_E 0x00002c90
113
+ _symbol _Z17superkernel_add1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERNS0_IS1_NS2_3outESK_EE 0x00002ca0
114
+ _symbol _ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS4_E 0x00002f00
115
+ _symbol _ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS4_EPKv 0x00002f20
116
+ _symbol _ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE3runEPS0_S6_S6_R27elementwise_binary_params_tIS4_E 0x00002fb0
117
+ _symbol _Z17superkernel_mul1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERNS0_IS1_NS2_3outESK_EE 0x000030e0
118
+ _symbol _Z13_b881_wrapperPPv 0x00003340
119
+ _symbol _Z29setup_transposeshuffle_paramsI8bfloat16EvR23transposeshuffle_paramsRA5_Kj 0x00003360
120
+ _symbol _Z16transposeshuffleI8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_aS0_EEvPS1_S2_R23transposeshuffle_params 0x000033b0
121
+ _symbol _ZN12mllib_graphs23transpose4d_adf_wrapperI8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_EEvRNS2_9io_bufferIT_NS2_9direction2inET0_EERNSD_ISE_NSF_3outET1_EERA5_Kj 0x00003580
122
+ _symbol _Z13_b719_wrapperPPv 0x00003600
123
+ _symbol _Z13_b886_wrapperPPv 0x00003620
124
+ _symbol _Z13_b891_wrapperPPv 0x00003650
125
+ _symbol _Z13_b896_wrapperPPv 0x00003680
126
+ _symbol _Z13_b901_wrapperPPv 0x000036b0
127
+ _symbol _Z13_b906_wrapperPPv 0x000036d0
128
+ // Symbols in memory 'PMw':
129
+ // Symbols in memory 'TM4':
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0_reloadable0/Release/0_0_reloadable0.srv ADDED
The diff for this file is too large to render. See raw diff
 
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0_reloadable0/Release/0_0_reloadable0.txt ADDED
The diff for this file is too large to render. See raw diff
 
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0_reloadable0/scripts/0_0_reloadable0.bcf ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ _reserved DMb 0x0 0x40000
2
+
3
+ _reserved PM 0x0 0x930 //reserved for main elf
4
+
5
+ _entry_point _Z13kernelWrapperPPvjjjj
6
+ _symbol _Z13kernelWrapperPPvjjjj 0x930
7
+
8
+ _reserved DMb 0x7b280 0x800 //reserved for lcp ping-pong buffers
9
+ _reserved DMb 0x7ba80 0x40 //reserved for sync buffer
10
+ _stack DM_stack 0x7bac0 0x940 //stack for core
11
+ _reserved DMb 0x7c400 0x40 //reserved for main elf heap
12
+ //space for synopsys compiler at 0x7c440 0x880//heap
13
+ _reserved DMb 0x40000 0x3b280
14
+
15
+ _reserved DMb 0x7ccc0 0x3340
16
+ _reserved DMb 0x80000 0x80000 // And everything else the core can't see
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0_reloadable0/scripts/0_0_reloadable0.prx ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ <project name="Project" processor="me">
2
+ <file type="lbc" name="0_0_reloadable0.ll" path="../../ir"/>
3
+ <issinit/>
4
+ <option id="cpp.define" value="__AIENGINE__ __AIE_ARCH__=21" inherit = "1"/>
5
+ <option id="llvm.xargs" value="-fno-jump-tables -fno-discard-value-names" inherit = "1"/>
6
+ <option id="llvm.lang" value="Follow file extension"/>
7
+ <option id="bridge.cfg" value="0_0_reloadable0.bcf"/>
8
+ <option id="cpp.include" value="&lt;XILINX_VITIS_AIETOOLS&gt;/include /app/vaiml_1.3_examples/camo/./segmentation_1_4_0_fp32_combined/vaiml_par_0/0/backend /usr/local/lib/python3.10/site-packages/include/aie_api /usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/common /usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/include/common /usr/local/lib/python3.10/dist-packages/vitis_mllib /usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/misc /usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/src/ml_adf /app/vaiml_1.3_examples/camo/segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/&lt;AIE_SRC_DIR&gt; " inherit="1"/>
9
+ <option id="project.dir" value="&lt;CONFIG&gt;/0_0_reloadable0"/>
10
+ <option id="project.name" value="0_0_reloadable0"/>
11
+ <option id="project.type" value="exe"/>
12
+ <option id="simrun.issca" value="&lt;XILINX_VITIS_AIETOOLS&gt;/bin/unwrapped/lnx64.o/aie2p/ca_udm_dbg" inherit="0"/>
13
+ </project>
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0_reloadable0/src/0_0_reloadable0.cc ADDED
@@ -0,0 +1,112 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ // Automatically generated processor driver using AIEngine tool-chain
2
+
3
+ #include <stdio.h>
4
+ #include <memory>
5
+ #include <adf.h>
6
+
7
+
8
+ // Declare Kernel functions and initializers
9
+ void superkernel_mul1d_attribute_broadcasting(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict,const unsigned int (&)[16],adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict);
10
+ #include "transpose4d_adf_wrapper.cpp"
11
+ void superkernel_add1d(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict,const unsigned int (&)[16],adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict,adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict);
12
+ void superkernel_mul1d(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict,const unsigned int (&)[16],adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict,adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict);
13
+ void conv2d_maxpool(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict,adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict,const unsigned int (&)[16],adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict);
14
+ void superkernel_add1d_attribute_broadcasting(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict,const unsigned int (&)[16],adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict);
15
+ void superkernel_clip1d(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict,const unsigned int (&)[16],adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict);
16
+
17
+ // Declare Kernel objects and external arrays
18
+
19
+
20
+ void _b881_wrapper(void* args[])
21
+ {
22
+ superkernel_mul1d_attribute_broadcasting(
23
+ *reinterpret_cast<adf::input_buffer_conf<bfloat16, adf::bpc_sync_0d>*>(args[0]),
24
+ *reinterpret_cast<uint32 const(*)[16]>(args[2]),
25
+ *reinterpret_cast<adf::output_buffer_conf<bfloat16, adf::bpc_async_0d>*>(args[1]));
26
+ }
27
+
28
+ void _b719_wrapper(void* args[])
29
+ {
30
+ mllib_graphs::transpose4d_adf_wrapper<bfloat16, adf::io_buffer_config<adf::extents<>>, adf::io_buffer_config<adf::extents<>>>(
31
+ *reinterpret_cast<adf::input_buffer_conf<bfloat16, adf::bpc_sync_0d>*>(args[0]),
32
+ *reinterpret_cast<adf::output_buffer_conf<bfloat16, adf::bpc_sync_0d>*>(args[1]),
33
+ *reinterpret_cast<uint32 const(*)[5]>(args[2]));
34
+ }
35
+
36
+ void _b886_wrapper(void* args[])
37
+ {
38
+ superkernel_add1d(
39
+ *reinterpret_cast<adf::input_buffer_conf<bfloat16, adf::bpc_sync_0d>*>(args[0]),
40
+ *reinterpret_cast<uint32 const(*)[16]>(args[3]),
41
+ *reinterpret_cast<adf::input_buffer_conf<bfloat16, adf::bpc_async_0d>*>(args[1]),
42
+ *reinterpret_cast<adf::output_buffer_conf<bfloat16, adf::bpc_async_0d>*>(args[2]));
43
+ }
44
+
45
+ void _b891_wrapper(void* args[])
46
+ {
47
+ superkernel_mul1d(
48
+ *reinterpret_cast<adf::input_buffer_conf<bfloat16, adf::bpc_sync_0d>*>(args[0]),
49
+ *reinterpret_cast<uint32 const(*)[16]>(args[3]),
50
+ *reinterpret_cast<adf::input_buffer_conf<bfloat16, adf::bpc_async_0d>*>(args[1]),
51
+ *reinterpret_cast<adf::output_buffer_conf<bfloat16, adf::bpc_async_0d>*>(args[2]));
52
+ }
53
+
54
+ void _b896_wrapper(void* args[])
55
+ {
56
+ conv2d_maxpool(
57
+ *reinterpret_cast<adf::input_buffer_conf<bfloat16, adf::bpc_sync_0d>*>(args[0]),
58
+ *reinterpret_cast<adf::input_buffer_conf<bfloat16, adf::bpc_sync_0d>*>(args[1]),
59
+ *reinterpret_cast<uint32 const(*)[16]>(args[3]),
60
+ *reinterpret_cast<adf::output_buffer_conf<bfloat16, adf::bpc_async_0d>*>(args[2]));
61
+ }
62
+
63
+ void _b901_wrapper(void* args[])
64
+ {
65
+ superkernel_add1d_attribute_broadcasting(
66
+ *reinterpret_cast<adf::input_buffer_conf<bfloat16, adf::bpc_sync_0d>*>(args[0]),
67
+ *reinterpret_cast<uint32 const(*)[16]>(args[2]),
68
+ *reinterpret_cast<adf::output_buffer_conf<bfloat16, adf::bpc_async_0d>*>(args[1]));
69
+ }
70
+
71
+ void _b906_wrapper(void* args[])
72
+ {
73
+ superkernel_clip1d(
74
+ *reinterpret_cast<adf::input_buffer_conf<bfloat16, adf::bpc_sync_0d>*>(args[0]),
75
+ *reinterpret_cast<uint32 const(*)[16]>(args[2]),
76
+ *reinterpret_cast<adf::output_buffer_conf<bfloat16, adf::bpc_async_0d>*>(args[1]));
77
+ }
78
+
79
+ using UniformKernelFunc = void (*)(void **);
80
+
81
+ static UniformKernelFunc g_uniformKernelFuncs[7] = {
82
+ _b881_wrapper,
83
+ _b719_wrapper,
84
+ _b886_wrapper,
85
+ _b891_wrapper,
86
+ _b896_wrapper,
87
+ _b901_wrapper,
88
+ _b906_wrapper
89
+ };
90
+
91
+ __attribute__((always_inline)) void kernelWrapper(void* args[], uint32 kernelId, uint32 numSyncIn, uint32 numAsyncIn, uint32 numSyncOut)
92
+ {
93
+ uint32 idx = 0;
94
+ reinterpret_cast<adf::_io_buffer_light_weight_generic*>(args[idx])->acquire<adf::direction::in>(numSyncIn > 0);
95
+ idx += (numSyncIn > 0) ? 1 : 0;
96
+ reinterpret_cast<adf::_io_buffer_light_weight_generic*>(args[idx])->acquire<adf::direction::in>(numSyncIn > 1);
97
+ idx += (numSyncIn > 1) ? 1 : 0;
98
+ idx += numAsyncIn;
99
+ reinterpret_cast<adf::_io_buffer_light_weight_generic*>(args[idx])->acquire<adf::direction::out>(numSyncOut > 0);
100
+ idx += (numSyncOut > 0) ? 1 : 0;
101
+
102
+ (*(g_uniformKernelFuncs[kernelId]))(args);
103
+
104
+ idx = 0;
105
+ reinterpret_cast<adf::_io_buffer_light_weight_generic*>(args[idx])->release<adf::direction::in>(numSyncIn > 0);
106
+ idx += (numSyncIn > 0) ? 1 : 0;
107
+ reinterpret_cast<adf::_io_buffer_light_weight_generic*>(args[idx])->release<adf::direction::in>(numSyncIn > 1);
108
+ idx += (numSyncIn > 1) ? 1 : 0;
109
+ idx += numAsyncIn;
110
+ reinterpret_cast<adf::_io_buffer_light_weight_generic*>(args[idx])->release<adf::direction::out>(numSyncOut > 0);
111
+ idx += (numSyncOut > 0) ? 1 : 0;
112
+ }
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0_reloadable0/timestamped_log/0_0_reloadable0.log ADDED
The diff for this file is too large to render. See raw diff
 
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0_reloadable0/xlopt.log ADDED
@@ -0,0 +1,434 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ERROR: ld.so: object '/lib64/libudev.so.1' from LD_PRELOAD cannot be preloaded (cannot open shared object file): ignored.
2
+
3
+
4
+ --------------- FILTER ANALYSIS INFO LOG ---------------
5
+
6
+ Reading Header IR from ir/_header.ll
7
+
8
+ --------------------------------------------------------
9
+
10
+ Add module pass 363{anonymous}::GuidancePass
11
+ Add module pass 363{anonymous}::ChessOptionsPass
12
+ Add module pass 363{anonymous}::DisableInliningInMainPass
13
+ Add module pass 363cdno::xlopt::AIEMergeSubWordStoresOpt
14
+ Add module pass 363{anonymous}::XLModuleAdaptor<llvm::PromotePass>
15
+ Add module pass 363{anonymous}::IpConstPropPass
16
+ Add module pass 363{anonymous}::XLModuleAdaptor<llvm::SimplifyCFGPass>
17
+ Add module pass 363{anonymous}::XLModuleAdaptor<llvm::LoopSimplifyPass>
18
+ Add module pass 363{anonymous}::XLModuleAdaptor<llvm::FunctionToLoopPassAdaptor>
19
+ Add module pass 363{anonymous}::XLModuleAdaptor<{anonymous}::AIELoopInfoPass>
20
+ Add module pass 363cdno::xlopt::AIEAnnotatePragmaPass
21
+ Add module pass 363{anonymous}::XLModuleAdaptor<{anonymous}::AIELoopPeelPass>
22
+ Add module pass 363{anonymous}::AIEAliasAnalysisPass
23
+
24
+
25
+ --------------- MEMORY MANAGEMENT GUIDANCE LOG ---------------
26
+
27
+ ALIGNMENT_HINT: Alignment of global array g_uniformKernelFuncs is 4 bytes; automatically aligning it to 64 bytes.
28
+ SIZE_HINT: Global array sigmoid_lut<0u, 256u>::data_ab is 1024 bytes. Consider making it mapper-managed LUT or memory buffer.
29
+ SIZE_HINT: Global array sigmoid_lut<0u, 256u>::data_cd is 1024 bytes. Consider making it mapper-managed LUT or memory buffer.
30
+ SIZE_HINT: Global array gelu_lut_32<0u, 512u>::data_ab is 2048 bytes. Consider making it mapper-managed LUT or memory buffer.
31
+ SIZE_HINT: Global array gelu_lut_32<0u, 512u>::data_cd is 2048 bytes. Consider making it mapper-managed LUT or memory buffer.
32
+ SIZE_HINT: Global array tanh_lut<0u, 512u>::data_ab is 2048 bytes. Consider making it mapper-managed LUT or memory buffer.
33
+ SIZE_HINT: Global array tanh_lut<0u, 512u>::data_cd is 2048 bytes. Consider making it mapper-managed LUT or memory buffer.
34
+ SIZE_HINT: Global array log_f32_lut<256u>::fraction_table_ab_f32 is 1024 bytes. Consider making it mapper-managed LUT or memory buffer.
35
+ SIZE_HINT: Global array log_f32_lut<256u>::fraction_table_cd_f32 is 1024 bytes. Consider making it mapper-managed LUT or memory buffer.
36
+ SIZE_HINT: Global array exp2_lut<512u>::exp2_table_ab is 1024 bytes. Consider making it mapper-managed LUT or memory buffer.
37
+ SIZE_HINT: Global array exp2_lut<512u>::exp2_table_cd is 1024 bytes. Consider making it mapper-managed LUT or memory buffer.
38
+
39
+ --------------------------------------------------------------
40
+
41
+
42
+
43
+ --------------- MERGING SUBWORD STORES OPT LOG ---------------
44
+
45
+
46
+
47
+ --------------- LOOP STATISTICS : _ZN18conv2d_bf16_paramsC2Ev ---------------
48
+
49
+ Total loops = 1
50
+ Loops with prepare for pipelining pragma = 0
51
+ Loops with unroll pragma = 0
52
+ Loops with flatten pragma = 0
53
+ Loops with min range pragma = 0
54
+ Loops with max range pragma = 0
55
+ Loops with known trip count = 0
56
+
57
+ -----------------------------------------------------------------------------
58
+
59
+
60
+
61
+ --------------- LOOP STATISTICS : _Z24setup_conv2d_bf16_paramsILb1ELb0EEvPKjR18conv2d_bf16_paramshh ---------------
62
+
63
+ Total loops = 1
64
+ Loops with prepare for pipelining pragma = 0
65
+ Loops with unroll pragma = 0
66
+ Loops with flatten pragma = 0
67
+ Loops with min range pragma = 0
68
+ Loops with max range pragma = 0
69
+ Loops with known trip count = 1
70
+
71
+ -------------------------------------------------------------------------------------------------------------------
72
+
73
+
74
+
75
+ --------------- LOOP STATISTICS : _Z14conv2d_genericILh1EL5act_t0ELb0ELb1ELb0E8bfloat16EvPS1_S2_S2_S2_R18conv2d_bf16_params10out_mode_t ---------------
76
+
77
+ Total loops = 4
78
+ Loops with prepare for pipelining pragma = 4
79
+ Loops with unroll pragma = 0
80
+ Loops with flatten pragma = 0
81
+ Loops with min range pragma = 4
82
+ Loops with max range pragma = 0
83
+ Loops with known trip count = 0
84
+
85
+ -------------------------------------------------------------------------------------------------------------------------------------------------------
86
+
87
+
88
+
89
+ --------------- LOOP STATISTICS : _Z21convert_bf16_to_bfp16I8bfloat16Lb0EEvPT_PS0_RK13BfToBfpParams ---------------
90
+
91
+ Total loops = 1
92
+ Loops with prepare for pipelining pragma = 1
93
+ Loops with unroll pragma = 0
94
+ Loops with flatten pragma = 0
95
+ Loops with min range pragma = 1
96
+ Loops with max range pragma = 0
97
+ Loops with known trip count = 0
98
+
99
+ -------------------------------------------------------------------------------------------------------------------
100
+
101
+
102
+
103
+ --------------- LOOP STATISTICS : _ZN31elementwise_binary_broadcastingI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_EE3runEPS0_S7_S7_R27elementwise_binary_params_tIS5_E ---------------
104
+
105
+ Total loops = 1
106
+ Loops with prepare for pipelining pragma = 1
107
+ Loops with unroll pragma = 0
108
+ Loops with flatten pragma = 0
109
+ Loops with min range pragma = 1
110
+ Loops with max range pragma = 0
111
+ Loops with known trip count = 0
112
+
113
+ ------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------
114
+
115
+
116
+
117
+ --------------- LOOP STATISTICS : _ZNSt3__25arrayIN3aie6vectorI8bfloat16Lj32EEELj2EEC2Ev ---------------
118
+
119
+ Total loops = 1
120
+ Loops with prepare for pipelining pragma = 0
121
+ Loops with unroll pragma = 0
122
+ Loops with flatten pragma = 0
123
+ Loops with min range pragma = 0
124
+ Loops with max range pragma = 0
125
+ Loops with known trip count = 0
126
+
127
+ --------------------------------------------------------------------------------------------------------
128
+
129
+
130
+
131
+ --------------- LOOP STATISTICS : _ZN17elementwise_unaryI8bfloat1616elementwise_clipIS0_E20clip_internal_paramsIS0_EE3runEPS0_S6_R26elementwise_unary_params_tIS4_E ---------------
132
+
133
+ Total loops = 1
134
+ Loops with prepare for pipelining pragma = 1
135
+ Loops with unroll pragma = 0
136
+ Loops with flatten pragma = 0
137
+ Loops with min range pragma = 1
138
+ Loops with max range pragma = 0
139
+ Loops with known trip count = 0
140
+
141
+ -----------------------------------------------------------------------------------------------------------------------------------------------------------------------------------
142
+
143
+
144
+
145
+ --------------- LOOP STATISTICS : _ZL19shared_run_backboneI8bfloat16L5act_t0EEKvPT_S4_S4_R27elementwise_binary_params_tI15shared_params_tIS3_EE ---------------
146
+
147
+ Total loops = 1
148
+ Loops with prepare for pipelining pragma = 1
149
+ Loops with unroll pragma = 0
150
+ Loops with flatten pragma = 0
151
+ Loops with min range pragma = 1
152
+ Loops with max range pragma = 0
153
+ Loops with known trip count = 0
154
+
155
+ ---------------------------------------------------------------------------------------------------------------------------------------------------------------
156
+
157
+
158
+
159
+ --------------- LOOP STATISTICS : _ZN17elementwise_unaryI8bfloat1619elementwise_sigmoidIS0_E26sigmoid_templated_params_tIS0_EE3runEPS0_S6_R26elementwise_unary_params_tIS4_E ---------------
160
+
161
+ Total loops = 1
162
+ Loops with prepare for pipelining pragma = 1
163
+ Loops with unroll pragma = 0
164
+ Loops with flatten pragma = 0
165
+ Loops with min range pragma = 1
166
+ Loops with max range pragma = 0
167
+ Loops with known trip count = 0
168
+
169
+ --------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------
170
+
171
+
172
+
173
+ --------------- LOOP STATISTICS : _ZN17elementwise_unaryI8bfloat1616elementwise_tanhIS0_E23tanh_templated_params_tIS0_EE3runEPS0_S6_R26elementwise_unary_params_tIS4_E ---------------
174
+
175
+ Total loops = 1
176
+ Loops with prepare for pipelining pragma = 1
177
+ Loops with unroll pragma = 0
178
+ Loops with flatten pragma = 0
179
+ Loops with min range pragma = 1
180
+ Loops with max range pragma = 0
181
+ Loops with known trip count = 0
182
+
183
+ --------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------
184
+
185
+
186
+
187
+ --------------- LOOP STATISTICS : _ZN3aie4maskILj32EEC2Eb ---------------
188
+
189
+ Total loops = 2
190
+ Loops with prepare for pipelining pragma = 0
191
+ Loops with unroll pragma = 2
192
+ Loops with flatten pragma = 0
193
+ Loops with min range pragma = 0
194
+ Loops with max range pragma = 0
195
+ Loops with known trip count = 2
196
+
197
+ -------------------------------------------------------------------------
198
+
199
+
200
+
201
+ --------------- LOOP STATISTICS : _Z9avgpool2dILh1E8bfloat16Qsr5mllib5utilsE11is_one_of_vIT0_ahS0_EEvPS1_S2_R25avgpool2d_internal_paramsIS1_E ---------------
202
+
203
+ Total loops = 1
204
+ Loops with prepare for pipelining pragma = 1
205
+ Loops with unroll pragma = 0
206
+ Loops with flatten pragma = 0
207
+ Loops with min range pragma = 1
208
+ Loops with max range pragma = 0
209
+ Loops with known trip count = 0
210
+
211
+ -------------------------------------------------------------------------------------------------------------------------------------------------------------
212
+
213
+
214
+
215
+ --------------- LOOP STATISTICS : _ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE3runEPS0_S6_S6_R27elementwise_binary_params_tIS4_E ---------------
216
+
217
+ Total loops = 1
218
+ Loops with prepare for pipelining pragma = 1
219
+ Loops with unroll pragma = 0
220
+ Loops with flatten pragma = 0
221
+ Loops with min range pragma = 1
222
+ Loops with max range pragma = 0
223
+ Loops with known trip count = 0
224
+
225
+ ----------------------------------------------------------------------------------------------------------------------------------------------------------------------------
226
+
227
+
228
+
229
+ --------------- LOOP STATISTICS : _ZL27setup_conv2d_dw_params_bf16PKjR21conv2d_dw_bf16_paramsh ---------------
230
+
231
+ Total loops = 1
232
+ Loops with prepare for pipelining pragma = 0
233
+ Loops with unroll pragma = 0
234
+ Loops with flatten pragma = 0
235
+ Loops with min range pragma = 0
236
+ Loops with max range pragma = 0
237
+ Loops with known trip count = 1
238
+
239
+ --------------------------------------------------------------------------------------------------------------
240
+
241
+
242
+
243
+ --------------- LOOP STATISTICS : _Z9conv2d_dwILh1E8bfloat16S0_S0_N3adf16io_buffer_configINS1_7extentsIJEEENS1_7locking4syncENS1_10addressing6linearENS1_6marginILj0EEEEESB_NS2_IS4_NS5_5asyncES8_SA_EEQsr3stdE9is_same_vIT0_S0_EEvRNS1_9io_bufferISE_NS1_9direction2inET3_EERNSF_IT1_SH_T4_EERNSF_IT2_NSG_3outET5_EER21conv2d_dw_bf16_params ---------------
244
+
245
+ Total loops = 2
246
+ Loops with prepare for pipelining pragma = 2
247
+ Loops with unroll pragma = 0
248
+ Loops with flatten pragma = 0
249
+ Loops with min range pragma = 2
250
+ Loops with max range pragma = 0
251
+ Loops with known trip count = 0
252
+
253
+ -------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------
254
+
255
+
256
+
257
+ --------------- LOOP STATISTICS : _ZN18reduce_skeleton_c8I8bfloat1619reduce_mean_c8_implIS0_E23reduce_mean_c8_params_tIS0_EE3runEPS0_S6_R18reduce_c8_params_tIS4_E ---------------
258
+
259
+ Total loops = 2
260
+ Loops with prepare for pipelining pragma = 1
261
+ Loops with unroll pragma = 0
262
+ Loops with flatten pragma = 0
263
+ Loops with min range pragma = 1
264
+ Loops with max range pragma = 0
265
+ Loops with known trip count = 0
266
+
267
+ ----------------------------------------------------------------------------------------------------------------------------------------------------------------------------------
268
+
269
+
270
+
271
+ --------------- LOOP STATISTICS : _ZNSt3__25arrayIN3aie6vectorI8bfloat16Lj16EEELj4EEC2Ev ---------------
272
+
273
+ Total loops = 1
274
+ Loops with prepare for pipelining pragma = 0
275
+ Loops with unroll pragma = 0
276
+ Loops with flatten pragma = 0
277
+ Loops with min range pragma = 0
278
+ Loops with max range pragma = 0
279
+ Loops with known trip count = 0
280
+
281
+ --------------------------------------------------------------------------------------------------------
282
+
283
+
284
+
285
+ --------------- LOOP STATISTICS : _ZN19reduce_mean_c8_implI8bfloat16E16body_postprocessEPvR18reduce_c8_params_tI23reduce_mean_c8_params_tIS0_EE ---------------
286
+
287
+ Total loops = 2
288
+ Loops with prepare for pipelining pragma = 2
289
+ Loops with unroll pragma = 0
290
+ Loops with flatten pragma = 0
291
+ Loops with min range pragma = 2
292
+ Loops with max range pragma = 0
293
+ Loops with known trip count = 0
294
+
295
+ ---------------------------------------------------------------------------------------------------------------------------------------------------------------
296
+
297
+
298
+
299
+ --------------- LOOP STATISTICS : _ZN3aie4maskILj8EEC2Eb ---------------
300
+
301
+ Total loops = 2
302
+ Loops with prepare for pipelining pragma = 0
303
+ Loops with unroll pragma = 2
304
+ Loops with flatten pragma = 0
305
+ Loops with min range pragma = 0
306
+ Loops with max range pragma = 0
307
+ Loops with known trip count = 2
308
+
309
+ ------------------------------------------------------------------------
310
+
311
+
312
+
313
+ --------------- LOOP STATISTICS : _ZN3aie4maskILj16EEC2Eb ---------------
314
+
315
+ Total loops = 2
316
+ Loops with prepare for pipelining pragma = 0
317
+ Loops with unroll pragma = 2
318
+ Loops with flatten pragma = 0
319
+ Loops with min range pragma = 0
320
+ Loops with max range pragma = 0
321
+ Loops with known trip count = 2
322
+
323
+ -------------------------------------------------------------------------
324
+
325
+
326
+
327
+ --------------- LOOP STATISTICS : _ZNK3aie4maskILj8EEeqERKS1_ ---------------
328
+
329
+ Total loops = 1
330
+ Loops with prepare for pipelining pragma = 0
331
+ Loops with unroll pragma = 1
332
+ Loops with flatten pragma = 0
333
+ Loops with min range pragma = 0
334
+ Loops with max range pragma = 0
335
+ Loops with known trip count = 1
336
+
337
+ -----------------------------------------------------------------------------
338
+
339
+
340
+
341
+ --------------- LOOP STATISTICS : _ZNK3aie4maskILj16EEeqERKS1_ ---------------
342
+
343
+ Total loops = 1
344
+ Loops with prepare for pipelining pragma = 0
345
+ Loops with unroll pragma = 1
346
+ Loops with flatten pragma = 0
347
+ Loops with min range pragma = 0
348
+ Loops with max range pragma = 0
349
+ Loops with known trip count = 1
350
+
351
+ ------------------------------------------------------------------------------
352
+
353
+
354
+
355
+ --------------- LOOP STATISTICS : _Z26pad_3d_bfloat16_simplifiedP8bfloat16S0_R15pad_3d_params_t ---------------
356
+
357
+ Total loops = 3
358
+ Loops with prepare for pipelining pragma = 0
359
+ Loops with unroll pragma = 0
360
+ Loops with flatten pragma = 0
361
+ Loops with min range pragma = 0
362
+ Loops with max range pragma = 0
363
+ Loops with known trip count = 0
364
+
365
+ ---------------------------------------------------------------------------------------------------------------
366
+
367
+
368
+
369
+ --------------- LOOP STATISTICS : _Z29setup_transposeshuffle_paramsI8bfloat16EvR23transposeshuffle_paramsRA5_Kj ---------------
370
+
371
+ Total loops = 1
372
+ Loops with prepare for pipelining pragma = 0
373
+ Loops with unroll pragma = 0
374
+ Loops with flatten pragma = 0
375
+ Loops with min range pragma = 0
376
+ Loops with max range pragma = 0
377
+ Loops with known trip count = 1
378
+
379
+ -------------------------------------------------------------------------------------------------------------------------------
380
+
381
+
382
+
383
+ --------------- LOOP STATISTICS : _Z16transposeshuffleI8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_aS0_EEvPS1_S2_R23transposeshuffle_params ---------------
384
+
385
+ Total loops = 1
386
+ Loops with prepare for pipelining pragma = 0
387
+ Loops with unroll pragma = 0
388
+ Loops with flatten pragma = 0
389
+ Loops with min range pragma = 0
390
+ Loops with max range pragma = 0
391
+ Loops with known trip count = 0
392
+
393
+ --------------------------------------------------------------------------------------------------------------------------------------------------------
394
+
395
+
396
+
397
+ --------------- PRAGMA INSERTION LOG (unroll threshold = 3000, max unroll factor = 1) ---------------
398
+
399
+ Adding pragma to function _Z24setup_conv2d_bf16_paramsILb1ELb0EEvPKjR18conv2d_bf16_paramshh :
400
+ Pragma added to loop at line 437 in file /usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/common/../../include/conv/conv2d_bf16_params.h : chess_loop_range(8,8)
401
+ Adding pragma to function _ZNSt3__25arrayIN3aie6vectorI8bfloat16Lj32EEELj2EEC2Ev :
402
+ Pragma added to loop at line 135 in file /usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libs/libcxx-9.0.0/include-lite/../include/array : chess_prepare_for_pipelining
403
+ Adding pragma to function _ZN3aie4maskILj32EEC2Eb :
404
+ Pragma added to loop at line 122 in file /usr/local/lib/python3.10/dist-packages/include/aie_api/detail/aie2/../../mask.hpp : chess_loop_range(1,1)
405
+ Pragma added to loop at line 122 in file /usr/local/lib/python3.10/dist-packages/include/aie_api/detail/aie2/../../mask.hpp : chess_flatten_loop
406
+ Pragma added to loop at line 128 in file /usr/local/lib/python3.10/dist-packages/include/aie_api/detail/aie2/../../mask.hpp : chess_loop_range(1,1)
407
+ Pragma added to loop at line 128 in file /usr/local/lib/python3.10/dist-packages/include/aie_api/detail/aie2/../../mask.hpp : chess_flatten_loop
408
+ Adding pragma to function _ZL27setup_conv2d_dw_params_bf16PKjR21conv2d_dw_bf16_paramsh :
409
+ Pragma added to loop at line 214 in file /usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/common/../../include/conv/conv2d_dw_bf16_params.h : chess_loop_range(4,4)
410
+ Adding pragma to function _ZNSt3__25arrayIN3aie6vectorI8bfloat16Lj16EEELj4EEC2Ev :
411
+ Pragma added to loop at line 135 in file /usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libs/libcxx-9.0.0/include-lite/../include/array : chess_prepare_for_pipelining
412
+ Adding pragma to function _ZN3aie4maskILj8EEC2Eb :
413
+ Pragma added to loop at line 122 in file /usr/local/lib/python3.10/dist-packages/include/aie_api/detail/aie2/../../mask.hpp : chess_loop_range(1,1)
414
+ Pragma added to loop at line 122 in file /usr/local/lib/python3.10/dist-packages/include/aie_api/detail/aie2/../../mask.hpp : chess_flatten_loop
415
+ Pragma added to loop at line 128 in file /usr/local/lib/python3.10/dist-packages/include/aie_api/detail/aie2/../../mask.hpp : chess_loop_range(1,1)
416
+ Pragma added to loop at line 128 in file /usr/local/lib/python3.10/dist-packages/include/aie_api/detail/aie2/../../mask.hpp : chess_flatten_loop
417
+ Adding pragma to function _ZN3aie4maskILj16EEC2Eb :
418
+ Pragma added to loop at line 122 in file /usr/local/lib/python3.10/dist-packages/include/aie_api/detail/aie2/../../mask.hpp : chess_loop_range(1,1)
419
+ Pragma added to loop at line 122 in file /usr/local/lib/python3.10/dist-packages/include/aie_api/detail/aie2/../../mask.hpp : chess_flatten_loop
420
+ Pragma added to loop at line 128 in file /usr/local/lib/python3.10/dist-packages/include/aie_api/detail/aie2/../../mask.hpp : chess_loop_range(1,1)
421
+ Pragma added to loop at line 128 in file /usr/local/lib/python3.10/dist-packages/include/aie_api/detail/aie2/../../mask.hpp : chess_flatten_loop
422
+ Adding pragma to function _ZNK3aie4maskILj16EEeqERKS1_ :
423
+ Pragma added to loop at line 249 in file /usr/local/lib/python3.10/dist-packages/include/aie_api/detail/aie2/../../mask.hpp : chess_loop_range(1,1)
424
+ Pragma added to loop at line 249 in file /usr/local/lib/python3.10/dist-packages/include/aie_api/detail/aie2/../../mask.hpp : chess_flatten_loop
425
+ Adding pragma to function _ZNK3aie4maskILj8EEeqERKS1_ :
426
+ Pragma added to loop at line 249 in file /usr/local/lib/python3.10/dist-packages/include/aie_api/detail/aie2/../../mask.hpp : chess_loop_range(1,1)
427
+ Pragma added to loop at line 249 in file /usr/local/lib/python3.10/dist-packages/include/aie_api/detail/aie2/../../mask.hpp : chess_flatten_loop
428
+ Adding pragma to function _Z29setup_transposeshuffle_paramsI8bfloat16EvR23transposeshuffle_paramsRA5_Kj :
429
+ Pragma added to loop at line 101 in file /usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/misc/transposeshuffle_params.h : chess_loop_range(5,5)
430
+ Adding pragma to function _Z16transposeshuffleI8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_aS0_EEvPS1_S2_R23transposeshuffle_params :
431
+ Pragma added to loop at line 81 in file /usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/misc/transposeshuffle.h : chess_prepare_for_pipelining
432
+
433
+ -----------------------------------------------------------------------------------------------------
434
+
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0_reloadable1/0_0_reloadable1.log ADDED
The diff for this file is too large to render. See raw diff
 
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0_reloadable1/Release/0_0_reloadable1.# ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ 1af8aeb07082ccc8a3cbcd3ff871a10a837c51c4
2
+ 1a735f496f1284ab86135ede88939a8aeeb375a3
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0_reloadable1/Release/0_0_reloadable1.## ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ 0141eb3358383d634e67684112097cb573cff486
2
+ 92e103875c6a39bc8cdbe4a21c02c5a94ba3cc96
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0_reloadable1/Release/0_0_reloadable1.calltree ADDED
@@ -0,0 +1,64 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+
2
+ // File generated by bridge version V-2024.06#84922c0d9f#241219, Fri Mar 21 03:45:22 2025
3
+ // Copyright 2014-2024 Synopsys, Inc. All rights reserved.
4
+ // bridge -o../Release/0_0_reloadable1 ../Release/0_0_reloadable1.o -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/isg -g -I/usr/local/lib/python3.10/dist-packages/include -I/app/vaiml_1.3_examples/camo/./segmentation_1_4_0_fp32_combined/vaiml_par_0/0/backend -I/usr/local/lib/python3.10/site-packages/include/aie_api -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/common -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/include/common -I/usr/local/lib/python3.10/dist-packages/vitis_mllib -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/misc -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/src/ml_adf -I/app/vaiml_1.3_examples/camo/segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/. -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libcxx-lite/include -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libs/libcxx-9.0.0/include-lite -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime/include -D__AIENGINE__ -D__AIE_ARCH__=21 -DDEPLOYMENT_ELF=1 -D__LOCK_FENCE_MODE__=0 -D__IO_BUFFER_FORCE_LIGHT_WEIGHT__ -DAIE_API_EMULATE_BFLOAT16_MMUL_WITH_BFP16=1 -DAIE_OPTION_SCALAR_FLOAT_ON_VECTOR -D__tct_tgt__=241219 -c0_0_reloadable1.bcf -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/softfloat/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libcxx-lite/lib/Release_LLVM -lme -lc -lm -lc++lite -lsoftfloat -S -export-locals -iconfig extra_memories.bcf -yTM -m -fC -fS -fH +m -T +work ../Release/chesswork1394 -pme
5
+
6
+
7
+ // Release: ipp V-2024.06-TGT-241219
8
+
9
+ _Z13kernelWrapperPPvjjjj
10
+ _Z13_b919_wrapperPPv (referenced text)
11
+ _Z22superkernel_conv2d_dwcRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEESF_RA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE
12
+ _ZL27setup_conv2d_dw_params_bf16PKjR21conv2d_dw_bf16_paramsh
13
+ _ZN12me_primitive10udiv_dstepEjjRjS0_
14
+ _Z9conv2d_dwILh1E8bfloat16S0_S0_N3adf16io_buffer_configINS1_7extentsIJEEENS1_7locking4syncENS1_10addressing6linearENS1_6marginILj0EEEEESB_NS2_IS4_NS5_5asyncES8_SA_EEQsr3stdE9is_same_vIT0_S0_EEvRNS1_9io_bufferISE_NS1_9direction2inET3_EERNSF_IT1_SH_T4_EERNSF_IT2_NSG_3outET5_EER21conv2d_dw_bf16_params
15
+ _Z13_b924_wrapperPPv (referenced text)
16
+ _Z26superkernel_conv_eltbinaryRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEESF_RNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERA17_KjRNS0_IS1_NS2_3outESH_EE
17
+ _Z24setup_conv2d_bf16_paramsILb1ELb0EEvPKjR18conv2d_bf16_paramshh
18
+ _ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS4_EPKv
19
+ _ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS4_E
20
+ _ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE5setupER27elementwise_binary_params_tIS5_EPKv
21
+ _ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE21shared_setup_backboneER27elementwise_binary_params_tIS5_EPKv
22
+ _Z11conv2d_bf16ILh1EL5act_t0E8bfloat16S1_S1_N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_NS3_IS5_NS6_5asyncES9_SB_EELb0ELb0ELb1ELb0EEvRNS2_9io_bufferIT1_NS2_9direction2inET4_EERNSF_IT2_SI_T5_EERNSF_IT3_NSH_3outET6_EER18conv2d_bf16_params
23
+ _Z21convert_bf16_to_bfp16I8bfloat16Lb0EEvPT_PS0_RK13BfToBfpParams
24
+ _ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE3runEPS0_S6_S6_R27elementwise_binary_params_tIS4_E
25
+ _ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE3runEPS0_S7_S7_R27elementwise_binary_params_tIS5_E
26
+ _ZL19shared_run_backboneI8bfloat16L5act_t0EEKvPT_S4_S4_R27elementwise_binary_params_tI15shared_params_tIS3_EE
27
+ _Z13_b896_wrapperPPv (referenced text)
28
+ _Z14conv2d_maxpoolRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEESF_RA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE
29
+ _Z24setup_conv2d_bf16_paramsILb1ELb0EEvPKjR18conv2d_bf16_paramshh (*)
30
+ _Z11conv2d_bf16ILh1EL5act_t0E8bfloat16S1_S1_N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_NS3_IS5_NS6_5asyncES9_SB_EELb0ELb0ELb1ELb0EEvRNS2_9io_bufferIT1_NS2_9direction2inET4_EERNSF_IT2_SI_T5_EERNSF_IT3_NSH_3outET6_EER18conv2d_bf16_params (*)
31
+
32
+
33
+ Call tree stack and functions sizes:
34
+
35
+ stack stack stack call func func function name
36
+ desc level level desc
37
+ ----- ----- ----- ----- ----- ----- --------------------------------------------------------------
38
+ 64 256 0 0 390 9538 _Z13kernelWrapperPPvjjjj
39
+ 0 192 1 1 36 2050 _Z13_b919_wrapperPPv
40
+ 128 192 1 2 478 2014 _Z22superkernel_conv2d_dwcRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEESF_RA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE <tail call>
41
+ 64 64 2 3 672 814 _ZL27setup_conv2d_dw_params_bf16PKjR21conv2d_dw_bf16_paramsh
42
+ 0 0 3 4 142 142 _ZN12me_primitive10udiv_dstepEjjRjS0_
43
+ 0 0 2 3 722 722 _Z9conv2d_dwILh1E8bfloat16S0_S0_N3adf16io_buffer_configINS1_7extentsIJEEENS1_7locking4syncENS1_10addressing6linearENS1_6marginILj0EEEEESB_NS2_IS4_NS5_5asyncES8_SA_EEQsr3stdE9is_same_vIT0_S0_EEvRNS1_9io_bufferISE_NS1_9direction2inET3_EERNSF_IT1_SH_T4_EERNSF_IT2_NSG_3outET5_EER21conv2d_dw_bf16_params
44
+ 0 192 1 1 40 6494 _Z13_b924_wrapperPPv
45
+ 64 192 1 2 1126 6454 _Z26superkernel_conv_eltbinaryRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEESF_RNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERA17_KjRNS0_IS1_NS2_3outESH_EE <tail call>
46
+ 64 64 2 3 1430 1430 _Z24setup_conv2d_bf16_paramsILb1ELb0EEvPKjR18conv2d_bf16_paramshh
47
+ 64 64 2 3 138 162 _ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS4_EPKv
48
+ 0 0 3 4 24 24 _ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS4_E
49
+ 64 64 2 3 98 214 _ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE5setupER27elementwise_binary_params_tIS5_EPKv
50
+ 0 0 3 4 116 116 _ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE21shared_setup_backboneER27elementwise_binary_params_tIS5_EPKv
51
+ 128 128 2 3 2410 2680 _Z11conv2d_bf16ILh1EL5act_t0E8bfloat16S1_S1_N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_NS3_IS5_NS6_5asyncES9_SB_EELb0ELb0ELb1ELb0EEvRNS2_9io_bufferIT1_NS2_9direction2inET4_EERNSF_IT2_SI_T5_EERNSF_IT3_NSH_3outET6_EER18conv2d_bf16_params
52
+ 0 0 3 4 270 270 _Z21convert_bf16_to_bfp16I8bfloat16Lb0EEvPT_PS0_RK13BfToBfpParams
53
+ 0 0 2 3 292 292 _ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE3runEPS0_S6_S6_R27elementwise_binary_params_tIS4_E
54
+ 0 128 2 3 16 550 _ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE3runEPS0_S7_S7_R27elementwise_binary_params_tIS5_E
55
+ 128 128 2 4 534 534 _ZL19shared_run_backboneI8bfloat16L5act_t0EEKvPT_S4_S4_R27elementwise_binary_params_tI15shared_params_tIS3_EE <tail call>
56
+ 0 192 1 1 36 4714 _Z13_b896_wrapperPPv
57
+ 64 192 1 2 568 4678 _Z14conv2d_maxpoolRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEESF_RA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE <tail call>
58
+ 64 64 2 3 1430 1430 _Z24setup_conv2d_bf16_paramsILb1ELb0EEvPKjR18conv2d_bf16_paramshh
59
+ 128 128 2 3 2410 2680 _Z11conv2d_bf16ILh1EL5act_t0E8bfloat16S1_S1_N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_NS3_IS5_NS6_5asyncES9_SB_EELb0ELb0ELb1ELb0EEvRNS2_9io_bufferIT1_NS2_9direction2inET4_EERNSF_IT2_SI_T5_EERNSF_IT3_NSH_3outET6_EER18conv2d_bf16_params (*)
60
+
61
+
62
+ Maximum call level : 4
63
+ Maximum stack level: 3
64
+ Maximum stack size : 256
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0_reloadable1/Release/0_0_reloadable1.cmic2 ADDED
The diff for this file is too large to render. See raw diff
 
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0_reloadable1/Release/0_0_reloadable1.cmico ADDED
@@ -0,0 +1 @@
 
 
1
+ +Mdec
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0_reloadable1/Release/0_0_reloadable1.lst ADDED
The diff for this file is too large to render. See raw diff
 
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0_reloadable1/Release/0_0_reloadable1.map ADDED
@@ -0,0 +1,217 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+
2
+ // File generated by bridge version V-2024.06#84922c0d9f#241219, Fri Mar 21 03:45:23 2025
3
+ // Copyright 2014-2024 Synopsys, Inc. All rights reserved.
4
+ // bridge -o../Release/0_0_reloadable1 ../Release/0_0_reloadable1.o -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/isg -g -I/usr/local/lib/python3.10/dist-packages/include -I/app/vaiml_1.3_examples/camo/./segmentation_1_4_0_fp32_combined/vaiml_par_0/0/backend -I/usr/local/lib/python3.10/site-packages/include/aie_api -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/common -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/include/common -I/usr/local/lib/python3.10/dist-packages/vitis_mllib -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/misc -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/src/ml_adf -I/app/vaiml_1.3_examples/camo/segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/. -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libcxx-lite/include -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libs/libcxx-9.0.0/include-lite -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime/include -D__AIENGINE__ -D__AIE_ARCH__=21 -DDEPLOYMENT_ELF=1 -D__LOCK_FENCE_MODE__=0 -D__IO_BUFFER_FORCE_LIGHT_WEIGHT__ -DAIE_API_EMULATE_BFLOAT16_MMUL_WITH_BFP16=1 -DAIE_OPTION_SCALAR_FLOAT_ON_VECTOR -D__tct_tgt__=241219 -c0_0_reloadable1.bcf -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/softfloat/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libcxx-lite/lib/Release_LLVM -lme -lc -lm -lc++lite -lsoftfloat -S -export-locals -iconfig extra_memories.bcf -yTM -m -fC -fS -fH +m -T +work ../Release/chesswork1394 -pme
5
+
6
+ // Release: ipp V-2024.06-TGT-241219
7
+
8
+ Memory map for memory 'DM_stack':
9
+
10
+ Size = 1048576
11
+ Width = 8 bits
12
+ Offset = 0
13
+ Used = 2368
14
+
15
+ 0x0007bac0..0x0007c3ff ( 2368 items) : Stack
16
+
17
+ Memory map for memory 'DMb':
18
+
19
+ Size = 1048576
20
+ Width = 8 bits
21
+ Offset = 0
22
+ Used = 3249
23
+
24
+ 0x00000000..0x0007babf ( 506560 items) : Reserved
25
+ 0x0007bac0..0x0007c3ff ( 2368 items) : Stack
26
+ 0x0007c400..0x0007c43f ( 64 items) : Reserved
27
+ 0x0007c440..0x0007c443 ( 4 items) : ../Release/0_0_reloadable1.o::_ZL9curr_iter (Data, Local, .bss.DMb.4)
28
+ 0x0007c444..0x0007c447 ( 4 items) : ../Release/0_0_reloadable1.o::_ZL14num_depth_iter (Data, Local, .bss.DMb.4)
29
+ 0x0007c448..0x0007c44b ( 4 items) : ../Release/0_0_reloadable1.o::_ZL10depth_iter (Data, Local, .bss.DMb.4)
30
+ 0x0007c44c..0x0007c44f ( 4 items) : ../Release/0_0_reloadable1.o::_ZL11total_iters (Data, Local, .bss.DMb.4)
31
+ 0x0007c450..0x0007c453 ( 4 items) : ../Release/0_0_reloadable1.o::_ZL8core_row (Data, Local, .bss.DMb.4)
32
+ 0x0007c454..0x0007c457 ( 4 items) : ../Release/0_0_reloadable1.o::_ZL10ifmsv_size (Data, Local, .bss.DMb.4)
33
+ 0x0007c458..0x0007c45b ( 4 items) : ../Release/0_0_reloadable1.o::_ZL11ifm2_offset (Data, Local, .bss.DMb.4)
34
+ 0x0007c45c..0x0007c45f ( 4 items) : ../Release/0_0_reloadable1.o::_ZL8num_iter (Data, Local, .data.DMb.4)
35
+ 0x0007c460..0x0007c463 ( 4 items) : me_defs.o(/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/Release/libme.a)::_ZN12me_primitive11control_satE (Data, Global, .bss.DMb.4)
36
+ 0x0007c464..0x0007c464 ( 1 items) : me_defs.o(/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/Release/libme.a)::_ZN12me_primitive11control_rndE (Data, Global, .bss.DMb.1)
37
+ 0x0007c480..0x0007c48b ( 12 items) : ../Release/0_0_reloadable1.o::_ZL20g_uniformKernelFuncs (Data, Local, .rodata.DMb.64)
38
+
39
+ Called functions : _Z13_b919_wrapperPPv
40
+ _Z13_b924_wrapperPPv
41
+ _Z13_b896_wrapperPPv
42
+
43
+ 0x0007c4c0..0x0007c4ff ( 64 items) : ../Release/0_0_reloadable1.o::add1d_params (Data, Global, .bss.DMb.64)
44
+ 0x0007c500..0x0007c53f ( 64 items) : ../Release/0_0_reloadable1.o::mul1d_params (Data, Global, .bss.DMb.64)
45
+ 0x0007c540..0x0007c6ff ( 448 items) : ../Release/0_0_reloadable1.o::conv2d_params (Data, Global, .bss.DMb.64)
46
+ 0x0007c700..0x0007c7ff ( 256 items) : ../Release/0_0_reloadable1.o::conv2d_dw_params (Data, Global, .bss.DMb.64)
47
+ 0x0007ccc0..0x000fffff ( 537408 items) : Reserved
48
+
49
+ Memory map for memory 'PM':
50
+
51
+ Size = 1048576
52
+ Width = 8 bits
53
+ Offset = 0
54
+ Used = 9538
55
+
56
+ 0x00000000..0x0000092f ( 2352 items) : Reserved
57
+ 0x00000930..0x00000ab5 ( 390 items) : ../Release/0_0_reloadable1.o::_Z13kernelWrapperPPvjjjj (Function, Global, .text) (stack frame size = 64)
58
+
59
+ Referenced symbols: _ZL20g_uniformKernelFuncs
60
+
61
+ 0x00000ac0..0x00001055 ( 1430 items) : ../Release/0_0_reloadable1.o::_Z24setup_conv2d_bf16_paramsILb1ELb0EEvPKjR18conv2d_bf16_paramshh (Function, Weak, .text) (stack frame size = 64)
62
+ 0x00001060..0x0000116d ( 270 items) : ../Release/0_0_reloadable1.o::_Z21convert_bf16_to_bfp16I8bfloat16Lb0EEvPT_PS0_RK13BfToBfpParams (Function, Weak, .text) (stack frame size = 0)
63
+
64
+ Referenced symbols: _ZN12me_primitive11control_rndE
65
+
66
+ 0x00001170..0x00001ad9 ( 2410 items) : ../Release/0_0_reloadable1.o::_Z11conv2d_bf16ILh1EL5act_t0E8bfloat16S1_S1_N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_NS3_IS5_NS6_5asyncES9_SB_EELb0ELb0ELb1ELb0EEvRNS2_9io_bufferIT1_NS2_9direction2inET4_EERNSF_IT2_SI_T5_EERNSF_IT3_NSH_3outET6_EER18conv2d_bf16_params (Function, Weak, .text) (stack frame size = 128)
67
+
68
+ Called functions : _Z21convert_bf16_to_bfp16I8bfloat16Lb0EEvPT_PS0_RK13BfToBfpParams
69
+
70
+ Referenced symbols: _ZN12me_primitive11control_rndE
71
+
72
+ 0x00001ae0..0x00001d17 ( 568 items) : ../Release/0_0_reloadable1.o::_Z14conv2d_maxpoolRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEESF_RA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE (Function, Global, .text) (stack frame size = 64)
73
+
74
+ Called functions : _Z24setup_conv2d_bf16_paramsILb1ELb0EEvPKjR18conv2d_bf16_paramshh
75
+ _Z11conv2d_bf16ILh1EL5act_t0E8bfloat16S1_S1_N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_NS3_IS5_NS6_5asyncES9_SB_EELb0ELb0ELb1ELb0EEvRNS2_9io_bufferIT1_NS2_9direction2inET4_EERNSF_IT2_SI_T5_EERNSF_IT3_NSH_3outET6_EER18conv2d_bf16_params
76
+
77
+ Referenced symbols: _ZL9curr_iter
78
+ conv2d_params
79
+ _ZN12me_primitive11control_rndE
80
+ _ZN12me_primitive11control_satE
81
+ _ZL14num_depth_iter
82
+ _ZL8num_iter
83
+ _ZL10depth_iter
84
+ _ZL11total_iters
85
+
86
+ 0x00001d20..0x00001f35 ( 534 items) : ../Release/0_0_reloadable1.o::_ZL19shared_run_backboneI8bfloat16L5act_t0EEKvPT_S4_S4_R27elementwise_binary_params_tI15shared_params_tIS3_EE (Function, Local, .text) (stack frame size = 128)
87
+
88
+ Referenced symbols: _ZN12me_primitive11control_rndE
89
+
90
+ 0x00001f40..0x00001fb3 ( 116 items) : ../Release/0_0_reloadable1.o::_ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE21shared_setup_backboneER27elementwise_binary_params_tIS5_EPKv (Function, Weak, .text) (stack frame size = 0)
91
+ 0x00001fc0..0x00002021 ( 98 items) : ../Release/0_0_reloadable1.o::_ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE5setupER27elementwise_binary_params_tIS5_EPKv (Function, Weak, .text) (stack frame size = 64)
92
+
93
+ Called functions : _ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE21shared_setup_backboneER27elementwise_binary_params_tIS5_EPKv
94
+
95
+ 0x00002030..0x0000203f ( 16 items) : ../Release/0_0_reloadable1.o::_ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE3runEPS0_S7_S7_R27elementwise_binary_params_tIS5_E (Function, Weak, .text) (stack frame size = 0)
96
+
97
+ Called functions : _ZL19shared_run_backboneI8bfloat16L5act_t0EEKvPT_S4_S4_R27elementwise_binary_params_tI15shared_params_tIS3_EE
98
+
99
+ 0x00002040..0x00002057 ( 24 items) : ../Release/0_0_reloadable1.o::_ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS4_E (Function, Weak, .text) (stack frame size = 0)
100
+ 0x00002060..0x000020e9 ( 138 items) : ../Release/0_0_reloadable1.o::_ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS4_EPKv (Function, Weak, .text) (stack frame size = 64)
101
+
102
+ Called functions : _ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS4_E
103
+
104
+ 0x000020f0..0x00002213 ( 292 items) : ../Release/0_0_reloadable1.o::_ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE3runEPS0_S6_S6_R27elementwise_binary_params_tIS4_E (Function, Weak, .text) (stack frame size = 0)
105
+
106
+ Referenced symbols: _ZN12me_primitive11control_rndE
107
+
108
+ 0x00002220..0x000024bf ( 672 items) : ../Release/0_0_reloadable1.o::_ZL27setup_conv2d_dw_params_bf16PKjR21conv2d_dw_bf16_paramsh (Function, Local, .text) (stack frame size = 64)
109
+
110
+ Called functions : _ZN12me_primitive10udiv_dstepEjjRjS0_
111
+
112
+ Referenced symbols: conv2d_dw_params
113
+ _ZN12me_primitive11control_rndE
114
+
115
+ 0x000024c0..0x00002791 ( 722 items) : ../Release/0_0_reloadable1.o::_Z9conv2d_dwILh1E8bfloat16S0_S0_N3adf16io_buffer_configINS1_7extentsIJEEENS1_7locking4syncENS1_10addressing6linearENS1_6marginILj0EEEEESB_NS2_IS4_NS5_5asyncES8_SA_EEQsr3stdE9is_same_vIT0_S0_EEvRNS1_9io_bufferISE_NS1_9direction2inET3_EERNSF_IT1_SH_T4_EERNSF_IT2_NSG_3outET5_EER21conv2d_dw_bf16_params (Function, Weak, .text) (stack frame size = 0)
116
+
117
+ Referenced symbols: _ZN12me_primitive11control_rndE
118
+
119
+ 0x000027a0..0x0000297d ( 478 items) : ../Release/0_0_reloadable1.o::_Z22superkernel_conv2d_dwcRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEESF_RA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE (Function, Global, .text) (stack frame size = 128)
120
+
121
+ Called functions : _ZL27setup_conv2d_dw_params_bf16PKjR21conv2d_dw_bf16_paramsh
122
+ _Z9conv2d_dwILh1E8bfloat16S0_S0_N3adf16io_buffer_configINS1_7extentsIJEEENS1_7locking4syncENS1_10addressing6linearENS1_6marginILj0EEEEESB_NS2_IS4_NS5_5asyncES8_SA_EEQsr3stdE9is_same_vIT0_S0_EEvRNS1_9io_bufferISE_NS1_9direction2inET3_EERNSF_IT1_SH_T4_EERNSF_IT2_NSG_3outET5_EER21conv2d_dw_bf16_params
123
+
124
+ Referenced symbols: _ZL9curr_iter
125
+ _ZL8core_row
126
+ _ZN12me_primitive11control_rndE
127
+ _ZN12me_primitive11control_satE
128
+ _ZL8num_iter
129
+ _ZL10ifmsv_size
130
+ conv2d_dw_params
131
+
132
+ 0x00002980..0x00002de5 ( 1126 items) : ../Release/0_0_reloadable1.o::_Z26superkernel_conv_eltbinaryRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEESF_RNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERA17_KjRNS0_IS1_NS2_3outESH_EE (Function, Global, .text) (stack frame size = 64)
133
+
134
+ Called functions : _Z24setup_conv2d_bf16_paramsILb1ELb0EEvPKjR18conv2d_bf16_paramshh
135
+ _ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE5setupER27elementwise_binary_params_tIS5_EPKv
136
+ _ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS4_EPKv
137
+ _Z11conv2d_bf16ILh1EL5act_t0E8bfloat16S1_S1_N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_NS3_IS5_NS6_5asyncES9_SB_EELb0ELb0ELb1ELb0EEvRNS2_9io_bufferIT1_NS2_9direction2inET4_EERNSF_IT2_SI_T5_EERNSF_IT3_NSH_3outET6_EER18conv2d_bf16_params
138
+ _ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE3runEPS0_S7_S7_R27elementwise_binary_params_tIS5_E
139
+ _ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE3runEPS0_S6_S6_R27elementwise_binary_params_tIS4_E
140
+
141
+ Referenced symbols: _ZL9curr_iter
142
+ _ZL8core_row
143
+ _ZN12me_primitive11control_rndE
144
+ _ZN12me_primitive11control_satE
145
+ conv2d_params
146
+ add1d_params
147
+ mul1d_params
148
+ _ZL14num_depth_iter
149
+ _ZL11ifm2_offset
150
+ _ZL8num_iter
151
+ _ZL10depth_iter
152
+ _ZL11total_iters
153
+
154
+ 0x00002df0..0x00002e13 ( 36 items) : ../Release/0_0_reloadable1.o::_Z13_b919_wrapperPPv (Function, Global, .text) (stack frame size = 0)
155
+
156
+ Called functions : _Z22superkernel_conv2d_dwcRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEESF_RA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE
157
+
158
+ 0x00002e20..0x00002e47 ( 40 items) : ../Release/0_0_reloadable1.o::_Z13_b924_wrapperPPv (Function, Global, .text) (stack frame size = 0)
159
+
160
+ Called functions : _Z26superkernel_conv_eltbinaryRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEESF_RNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERA17_KjRNS0_IS1_NS2_3outESH_EE
161
+
162
+ 0x00002e50..0x00002e73 ( 36 items) : ../Release/0_0_reloadable1.o::_Z13_b896_wrapperPPv (Function, Global, .text) (stack frame size = 0)
163
+
164
+ Called functions : _Z14conv2d_maxpoolRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEESF_RA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE
165
+
166
+ 0x00002e80..0x00002f0d ( 142 items) : me_div.o(/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/Release/libme.a)::_ZN12me_primitive10udiv_dstepEjjRjS0_ (Function, Global, .text) (stack frame size = 0)
167
+
168
+ External symbols:
169
+
170
+ __dso_handle = 0x0
171
+ _ctors_end = 0x0
172
+ _ctors_start = 0x0
173
+ _dtors_end = 0x0
174
+ _dtors_start = 0x0
175
+ _pc_end = 0x2f0e
176
+ _pc_start = 0x930
177
+ _sp_end_DM_stack = 0x7c400
178
+ _sp_start_DM_stack = 0x7bac0
179
+
180
+ Section summary for memory 'DM_stack':
181
+
182
+ .stack File
183
+ ---------- ----------
184
+ 2368
185
+ ---------- ----------
186
+ 2368 Total
187
+
188
+ Section summary for memory 'DMb':
189
+
190
+ .bss .data .rodata File
191
+ ---------- ---------- ---------- ----------
192
+ 860 4 12 ../Release/0_0_reloadable1.o
193
+ 5 0 0 me_defs.o(/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/Release/libme.a)
194
+ ---------- ---------- ---------- ----------
195
+ 865 4 12 Total
196
+
197
+ Section summary for memory 'PM':
198
+
199
+ .text File
200
+ ---------- ----------
201
+ 9396 ../Release/0_0_reloadable1.o
202
+ 142 me_div.o(/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/Release/libme.a)
203
+ ---------- ----------
204
+ 9538 Total
205
+
206
+ File summary:
207
+
208
+ ../Release/0_0_reloadable1.o
209
+ DMb 876
210
+ PM 9396
211
+
212
+ me_defs.o(/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/Release/libme.a)
213
+ DMb 5
214
+
215
+ me_div.o(/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/Release/libme.a)
216
+ PM 142
217
+
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0_reloadable1/Release/0_0_reloadable1.o.lst ADDED
The diff for this file is too large to render. See raw diff
 
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0_reloadable1/Release/0_0_reloadable1.sdr ADDED
@@ -0,0 +1,107 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+
2
+ // File generated by bridge version V-2024.06#84922c0d9f#241219, Fri Mar 21 03:45:23 2025
3
+ // Copyright 2014-2024 Synopsys, Inc. All rights reserved.
4
+ // bridge -o../Release/0_0_reloadable1 ../Release/0_0_reloadable1.o -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/isg -g -I/usr/local/lib/python3.10/dist-packages/include -I/app/vaiml_1.3_examples/camo/./segmentation_1_4_0_fp32_combined/vaiml_par_0/0/backend -I/usr/local/lib/python3.10/site-packages/include/aie_api -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/common -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/include/common -I/usr/local/lib/python3.10/dist-packages/vitis_mllib -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/misc -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/src/ml_adf -I/app/vaiml_1.3_examples/camo/segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/. -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libcxx-lite/include -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libs/libcxx-9.0.0/include-lite -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime/include -D__AIENGINE__ -D__AIE_ARCH__=21 -DDEPLOYMENT_ELF=1 -D__LOCK_FENCE_MODE__=0 -D__IO_BUFFER_FORCE_LIGHT_WEIGHT__ -DAIE_API_EMULATE_BFLOAT16_MMUL_WITH_BFP16=1 -DAIE_OPTION_SCALAR_FLOAT_ON_VECTOR -D__tct_tgt__=241219 -c0_0_reloadable1.bcf -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/softfloat/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libcxx-lite/lib/Release_LLVM -lme -lc -lm -lc++lite -lsoftfloat -S -export-locals -iconfig extra_memories.bcf -yTM -m -fC -fS -fH +m -T +work ../Release/chesswork1394 -pme
5
+
6
+ // Release: ipp V-2024.06-TGT-241219
7
+
8
+ // Symbols in memory 'DM_bankA':
9
+ // Symbols in memory 'DM_bankAB':
10
+ // Symbols in memory 'DM_bankAC':
11
+ // Symbols in memory 'DM_bankAD':
12
+ // Symbols in memory 'DM_bankB':
13
+ // Symbols in memory 'DM_bankBC':
14
+ // Symbols in memory 'DM_bankBD':
15
+ // Symbols in memory 'DM_bankC':
16
+ // Symbols in memory 'DM_bankCD':
17
+ // Symbols in memory 'DM_bankD':
18
+ // Symbols in memory 'DM_stack':
19
+ // Symbols in memory 'DM_test':
20
+ // Symbols in memory 'DMb':
21
+ _symbol _ZN12me_primitive11control_satE 0x0007c460
22
+ _symbol _ZN12me_primitive11control_rndE 0x0007c464
23
+ _symbol add1d_params 0x0007c4c0
24
+ _symbol mul1d_params 0x0007c500
25
+ _symbol conv2d_params 0x0007c540
26
+ _symbol conv2d_dw_params 0x0007c700
27
+ // Symbols in memory 'DMh':
28
+ // Symbols in memory 'DMh_bankA':
29
+ // Symbols in memory 'DMh_bankAB':
30
+ // Symbols in memory 'DMh_bankAC':
31
+ // Symbols in memory 'DMh_bankAD':
32
+ // Symbols in memory 'DMh_bankB':
33
+ // Symbols in memory 'DMh_bankBC':
34
+ // Symbols in memory 'DMh_bankBD':
35
+ // Symbols in memory 'DMh_bankC':
36
+ // Symbols in memory 'DMh_bankCD':
37
+ // Symbols in memory 'DMh_bankD':
38
+ // Symbols in memory 'DMh_stack':
39
+ // Symbols in memory 'DMs':
40
+ // Symbols in memory 'DMs_bankA':
41
+ // Symbols in memory 'DMs_bankAB':
42
+ // Symbols in memory 'DMs_bankAC':
43
+ // Symbols in memory 'DMs_bankAD':
44
+ // Symbols in memory 'DMs_bankB':
45
+ // Symbols in memory 'DMs_bankBC':
46
+ // Symbols in memory 'DMs_bankBD':
47
+ // Symbols in memory 'DMs_bankC':
48
+ // Symbols in memory 'DMs_bankCD':
49
+ // Symbols in memory 'DMs_bankD':
50
+ // Symbols in memory 'DMs_stack':
51
+ // Symbols in memory 'DMv':
52
+ // Symbols in memory 'DMv_bankA':
53
+ // Symbols in memory 'DMv_bankAB':
54
+ // Symbols in memory 'DMv_bankAC':
55
+ // Symbols in memory 'DMv_bankAD':
56
+ // Symbols in memory 'DMv_bankB':
57
+ // Symbols in memory 'DMv_bankBC':
58
+ // Symbols in memory 'DMv_bankBD':
59
+ // Symbols in memory 'DMv_bankC':
60
+ // Symbols in memory 'DMv_bankCD':
61
+ // Symbols in memory 'DMv_bankD':
62
+ // Symbols in memory 'DMv_stack':
63
+ // Symbols in memory 'DMw':
64
+ // Symbols in memory 'DMw_bankA':
65
+ // Symbols in memory 'DMw_bankAB':
66
+ // Symbols in memory 'DMw_bankAC':
67
+ // Symbols in memory 'DMw_bankAD':
68
+ // Symbols in memory 'DMw_bankB':
69
+ // Symbols in memory 'DMw_bankBC':
70
+ // Symbols in memory 'DMw_bankBD':
71
+ // Symbols in memory 'DMw_bankC':
72
+ // Symbols in memory 'DMw_bankCD':
73
+ // Symbols in memory 'DMw_bankD':
74
+ // Symbols in memory 'DMw_stack':
75
+ // Symbols in memory 'DMx':
76
+ // Symbols in memory 'DMx_bankA':
77
+ // Symbols in memory 'DMx_bankAB':
78
+ // Symbols in memory 'DMx_bankAC':
79
+ // Symbols in memory 'DMx_bankAD':
80
+ // Symbols in memory 'DMx_bankB':
81
+ // Symbols in memory 'DMx_bankBC':
82
+ // Symbols in memory 'DMx_bankBD':
83
+ // Symbols in memory 'DMx_bankC':
84
+ // Symbols in memory 'DMx_bankCD':
85
+ // Symbols in memory 'DMx_bankD':
86
+ // Symbols in memory 'DMx_stack':
87
+ // Symbols in memory 'PM':
88
+ _symbol _Z13kernelWrapperPPvjjjj 0x00000930
89
+ _symbol _Z24setup_conv2d_bf16_paramsILb1ELb0EEvPKjR18conv2d_bf16_paramshh 0x00000ac0
90
+ _symbol _Z21convert_bf16_to_bfp16I8bfloat16Lb0EEvPT_PS0_RK13BfToBfpParams 0x00001060
91
+ _symbol _Z11conv2d_bf16ILh1EL5act_t0E8bfloat16S1_S1_N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_NS3_IS5_NS6_5asyncES9_SB_EELb0ELb0ELb1ELb0EEvRNS2_9io_bufferIT1_NS2_9direction2inET4_EERNSF_IT2_SI_T5_EERNSF_IT3_NSH_3outET6_EER18conv2d_bf16_params 0x00001170
92
+ _symbol _Z14conv2d_maxpoolRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEESF_RA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE 0x00001ae0
93
+ _symbol _ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE21shared_setup_backboneER27elementwise_binary_params_tIS5_EPKv 0x00001f40
94
+ _symbol _ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE5setupER27elementwise_binary_params_tIS5_EPKv 0x00001fc0
95
+ _symbol _ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE3runEPS0_S7_S7_R27elementwise_binary_params_tIS5_E 0x00002030
96
+ _symbol _ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS4_E 0x00002040
97
+ _symbol _ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS4_EPKv 0x00002060
98
+ _symbol _ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE3runEPS0_S6_S6_R27elementwise_binary_params_tIS4_E 0x000020f0
99
+ _symbol _Z9conv2d_dwILh1E8bfloat16S0_S0_N3adf16io_buffer_configINS1_7extentsIJEEENS1_7locking4syncENS1_10addressing6linearENS1_6marginILj0EEEEESB_NS2_IS4_NS5_5asyncES8_SA_EEQsr3stdE9is_same_vIT0_S0_EEvRNS1_9io_bufferISE_NS1_9direction2inET3_EERNSF_IT1_SH_T4_EERNSF_IT2_NSG_3outET5_EER21conv2d_dw_bf16_params 0x000024c0
100
+ _symbol _Z22superkernel_conv2d_dwcRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEESF_RA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE 0x000027a0
101
+ _symbol _Z26superkernel_conv_eltbinaryRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEESF_RNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERA17_KjRNS0_IS1_NS2_3outESH_EE 0x00002980
102
+ _symbol _Z13_b919_wrapperPPv 0x00002df0
103
+ _symbol _Z13_b924_wrapperPPv 0x00002e20
104
+ _symbol _Z13_b896_wrapperPPv 0x00002e50
105
+ _symbol _ZN12me_primitive10udiv_dstepEjjRjS0_ 0x00002e80
106
+ // Symbols in memory 'PMw':
107
+ // Symbols in memory 'TM4':
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0_reloadable1/Release/0_0_reloadable1.srv ADDED
The diff for this file is too large to render. See raw diff
 
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0_reloadable1/Release/0_0_reloadable1.txt ADDED
The diff for this file is too large to render. See raw diff
 
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0_reloadable1/scripts/0_0_reloadable1.bcf ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ _reserved DMb 0x0 0x40000
2
+
3
+ _reserved PM 0x0 0x930 //reserved for main elf
4
+
5
+ _entry_point _Z13kernelWrapperPPvjjjj
6
+ _symbol _Z13kernelWrapperPPvjjjj 0x930
7
+
8
+ _reserved DMb 0x7b280 0x800 //reserved for lcp ping-pong buffers
9
+ _reserved DMb 0x7ba80 0x40 //reserved for sync buffer
10
+ _stack DM_stack 0x7bac0 0x940 //stack for core
11
+ _reserved DMb 0x7c400 0x40 //reserved for main elf heap
12
+ //space for synopsys compiler at 0x7c440 0x880//heap
13
+ _reserved DMb 0x40000 0x3b280
14
+
15
+ _reserved DMb 0x7ccc0 0x3340
16
+ _reserved DMb 0x80000 0x80000 // And everything else the core can't see
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0_reloadable1/scripts/0_0_reloadable1.prx ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ <project name="Project" processor="me">
2
+ <file type="lbc" name="0_0_reloadable1.ll" path="../../ir"/>
3
+ <issinit/>
4
+ <option id="cpp.define" value="__AIENGINE__ __AIE_ARCH__=21" inherit = "1"/>
5
+ <option id="llvm.xargs" value="-fno-jump-tables -fno-discard-value-names" inherit = "1"/>
6
+ <option id="llvm.lang" value="Follow file extension"/>
7
+ <option id="bridge.cfg" value="0_0_reloadable1.bcf"/>
8
+ <option id="cpp.include" value="&lt;XILINX_VITIS_AIETOOLS&gt;/include /app/vaiml_1.3_examples/camo/./segmentation_1_4_0_fp32_combined/vaiml_par_0/0/backend /usr/local/lib/python3.10/site-packages/include/aie_api /usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/common /usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/include/common /usr/local/lib/python3.10/dist-packages/vitis_mllib /usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/misc /usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/src/ml_adf /app/vaiml_1.3_examples/camo/segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/&lt;AIE_SRC_DIR&gt; " inherit="1"/>
9
+ <option id="project.dir" value="&lt;CONFIG&gt;/0_0_reloadable1"/>
10
+ <option id="project.name" value="0_0_reloadable1"/>
11
+ <option id="project.type" value="exe"/>
12
+ <option id="simrun.issca" value="&lt;XILINX_VITIS_AIETOOLS&gt;/bin/unwrapped/lnx64.o/aie2p/ca_udm_dbg" inherit="0"/>
13
+ </project>
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0_reloadable1/src/0_0_reloadable1.cc ADDED
@@ -0,0 +1,69 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ // Automatically generated processor driver using AIEngine tool-chain
2
+
3
+ #include <stdio.h>
4
+ #include <memory>
5
+ #include <adf.h>
6
+
7
+
8
+ // Declare Kernel functions and initializers
9
+ void superkernel_conv2d_dwc(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict,adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict,const unsigned int (&)[16],adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict);
10
+ void superkernel_conv_eltbinary(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict,adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict,adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict,const unsigned int (&)[17],adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict);
11
+ void conv2d_maxpool(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict,adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict,const unsigned int (&)[16],adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict);
12
+
13
+ // Declare Kernel objects and external arrays
14
+
15
+
16
+ void _b919_wrapper(void* args[])
17
+ {
18
+ superkernel_conv2d_dwc(
19
+ *reinterpret_cast<adf::input_buffer_conf<bfloat16, adf::bpc_sync_0d>*>(args[0]),
20
+ *reinterpret_cast<adf::input_buffer_conf<bfloat16, adf::bpc_sync_0d>*>(args[1]),
21
+ *reinterpret_cast<uint32 const(*)[16]>(args[3]),
22
+ *reinterpret_cast<adf::output_buffer_conf<bfloat16, adf::bpc_async_0d>*>(args[2]));
23
+ }
24
+
25
+ void _b924_wrapper(void* args[])
26
+ {
27
+ superkernel_conv_eltbinary(
28
+ *reinterpret_cast<adf::input_buffer_conf<bfloat16, adf::bpc_sync_0d>*>(args[0]),
29
+ *reinterpret_cast<adf::input_buffer_conf<bfloat16, adf::bpc_sync_0d>*>(args[1]),
30
+ *reinterpret_cast<adf::input_buffer_conf<bfloat16, adf::bpc_async_0d>*>(args[2]),
31
+ *reinterpret_cast<uint32 const(*)[17]>(args[4]),
32
+ *reinterpret_cast<adf::output_buffer_conf<bfloat16, adf::bpc_async_0d>*>(args[3]));
33
+ }
34
+
35
+ void _b896_wrapper(void* args[])
36
+ {
37
+ conv2d_maxpool(
38
+ *reinterpret_cast<adf::input_buffer_conf<bfloat16, adf::bpc_sync_0d>*>(args[0]),
39
+ *reinterpret_cast<adf::input_buffer_conf<bfloat16, adf::bpc_sync_0d>*>(args[1]),
40
+ *reinterpret_cast<uint32 const(*)[16]>(args[3]),
41
+ *reinterpret_cast<adf::output_buffer_conf<bfloat16, adf::bpc_async_0d>*>(args[2]));
42
+ }
43
+
44
+ using UniformKernelFunc = void (*)(void **);
45
+
46
+ static UniformKernelFunc g_uniformKernelFuncs[3] = {
47
+ _b919_wrapper,
48
+ _b924_wrapper,
49
+ _b896_wrapper
50
+ };
51
+
52
+ __attribute__((always_inline)) void kernelWrapper(void* args[], uint32 kernelId, uint32 numSyncIn, uint32 numAsyncIn, uint32 numSyncOut)
53
+ {
54
+ uint32 idx = 0;
55
+ reinterpret_cast<adf::_io_buffer_light_weight_generic*>(args[idx])->acquire<adf::direction::in>(numSyncIn > 0);
56
+ idx += (numSyncIn > 0) ? 1 : 0;
57
+ reinterpret_cast<adf::_io_buffer_light_weight_generic*>(args[idx])->acquire<adf::direction::in>(numSyncIn > 1);
58
+ idx += (numSyncIn > 1) ? 1 : 0;
59
+ idx += numAsyncIn;
60
+
61
+ (*(g_uniformKernelFuncs[kernelId]))(args);
62
+
63
+ idx = 0;
64
+ reinterpret_cast<adf::_io_buffer_light_weight_generic*>(args[idx])->release<adf::direction::in>(numSyncIn > 0);
65
+ idx += (numSyncIn > 0) ? 1 : 0;
66
+ reinterpret_cast<adf::_io_buffer_light_weight_generic*>(args[idx])->release<adf::direction::in>(numSyncIn > 1);
67
+ idx += (numSyncIn > 1) ? 1 : 0;
68
+ idx += numAsyncIn;
69
+ }
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0_reloadable1/timestamped_log/0_0_reloadable1.log ADDED
The diff for this file is too large to render. See raw diff
 
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0_reloadable1/xlopt.log ADDED
@@ -0,0 +1,402 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ERROR: ld.so: object '/lib64/libudev.so.1' from LD_PRELOAD cannot be preloaded (cannot open shared object file): ignored.
2
+
3
+
4
+ --------------- FILTER ANALYSIS INFO LOG ---------------
5
+
6
+ Reading Header IR from ir/_header.ll
7
+
8
+ --------------------------------------------------------
9
+
10
+ Add module pass 363{anonymous}::GuidancePass
11
+ Add module pass 363{anonymous}::ChessOptionsPass
12
+ Add module pass 363{anonymous}::DisableInliningInMainPass
13
+ Add module pass 363cdno::xlopt::AIEMergeSubWordStoresOpt
14
+ Add module pass 363{anonymous}::XLModuleAdaptor<llvm::PromotePass>
15
+ Add module pass 363{anonymous}::IpConstPropPass
16
+ Add module pass 363{anonymous}::XLModuleAdaptor<llvm::SimplifyCFGPass>
17
+ Add module pass 363{anonymous}::XLModuleAdaptor<llvm::LoopSimplifyPass>
18
+ Add module pass 363{anonymous}::XLModuleAdaptor<llvm::FunctionToLoopPassAdaptor>
19
+ Add module pass 363{anonymous}::XLModuleAdaptor<{anonymous}::AIELoopInfoPass>
20
+ Add module pass 363cdno::xlopt::AIEAnnotatePragmaPass
21
+ Add module pass 363{anonymous}::XLModuleAdaptor<{anonymous}::AIELoopPeelPass>
22
+ Add module pass 363{anonymous}::AIEAliasAnalysisPass
23
+
24
+
25
+ --------------- MEMORY MANAGEMENT GUIDANCE LOG ---------------
26
+
27
+ ALIGNMENT_HINT: Alignment of global array g_uniformKernelFuncs is 4 bytes; automatically aligning it to 64 bytes.
28
+ SIZE_HINT: Global array sigmoid_lut<0u, 256u>::data_ab is 1024 bytes. Consider making it mapper-managed LUT or memory buffer.
29
+ SIZE_HINT: Global array sigmoid_lut<0u, 256u>::data_cd is 1024 bytes. Consider making it mapper-managed LUT or memory buffer.
30
+ SIZE_HINT: Global array gelu_lut_32<0u, 512u>::data_ab is 2048 bytes. Consider making it mapper-managed LUT or memory buffer.
31
+ SIZE_HINT: Global array gelu_lut_32<0u, 512u>::data_cd is 2048 bytes. Consider making it mapper-managed LUT or memory buffer.
32
+ SIZE_HINT: Global array tanh_lut<0u, 512u>::data_ab is 2048 bytes. Consider making it mapper-managed LUT or memory buffer.
33
+ SIZE_HINT: Global array tanh_lut<0u, 512u>::data_cd is 2048 bytes. Consider making it mapper-managed LUT or memory buffer.
34
+ SIZE_HINT: Global array log_f32_lut<256u>::fraction_table_ab_f32 is 1024 bytes. Consider making it mapper-managed LUT or memory buffer.
35
+ SIZE_HINT: Global array log_f32_lut<256u>::fraction_table_cd_f32 is 1024 bytes. Consider making it mapper-managed LUT or memory buffer.
36
+ SIZE_HINT: Global array exp2_lut<512u>::exp2_table_ab is 1024 bytes. Consider making it mapper-managed LUT or memory buffer.
37
+ SIZE_HINT: Global array exp2_lut<512u>::exp2_table_cd is 1024 bytes. Consider making it mapper-managed LUT or memory buffer.
38
+
39
+ --------------------------------------------------------------
40
+
41
+
42
+
43
+ --------------- MERGING SUBWORD STORES OPT LOG ---------------
44
+
45
+
46
+
47
+ --------------- LOOP STATISTICS : _ZN18conv2d_bf16_paramsC2Ev ---------------
48
+
49
+ Total loops = 1
50
+ Loops with prepare for pipelining pragma = 0
51
+ Loops with unroll pragma = 0
52
+ Loops with flatten pragma = 0
53
+ Loops with min range pragma = 0
54
+ Loops with max range pragma = 0
55
+ Loops with known trip count = 0
56
+
57
+ -----------------------------------------------------------------------------
58
+
59
+
60
+
61
+ --------------- LOOP STATISTICS : _Z24setup_conv2d_bf16_paramsILb1ELb0EEvPKjR18conv2d_bf16_paramshh ---------------
62
+
63
+ Total loops = 1
64
+ Loops with prepare for pipelining pragma = 0
65
+ Loops with unroll pragma = 0
66
+ Loops with flatten pragma = 0
67
+ Loops with min range pragma = 0
68
+ Loops with max range pragma = 0
69
+ Loops with known trip count = 1
70
+
71
+ -------------------------------------------------------------------------------------------------------------------
72
+
73
+
74
+
75
+ --------------- LOOP STATISTICS : _Z14conv2d_genericILh1EL5act_t0ELb0ELb1ELb0E8bfloat16EvPS1_S2_S2_S2_R18conv2d_bf16_params10out_mode_t ---------------
76
+
77
+ Total loops = 4
78
+ Loops with prepare for pipelining pragma = 4
79
+ Loops with unroll pragma = 0
80
+ Loops with flatten pragma = 0
81
+ Loops with min range pragma = 4
82
+ Loops with max range pragma = 0
83
+ Loops with known trip count = 0
84
+
85
+ -------------------------------------------------------------------------------------------------------------------------------------------------------
86
+
87
+
88
+
89
+ --------------- LOOP STATISTICS : _Z21convert_bf16_to_bfp16I8bfloat16Lb0EEvPT_PS0_RK13BfToBfpParams ---------------
90
+
91
+ Total loops = 1
92
+ Loops with prepare for pipelining pragma = 1
93
+ Loops with unroll pragma = 0
94
+ Loops with flatten pragma = 0
95
+ Loops with min range pragma = 1
96
+ Loops with max range pragma = 0
97
+ Loops with known trip count = 0
98
+
99
+ -------------------------------------------------------------------------------------------------------------------
100
+
101
+
102
+
103
+ --------------- LOOP STATISTICS : _ZN31elementwise_binary_broadcastingI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_EE3runEPS0_S7_S7_R27elementwise_binary_params_tIS5_E ---------------
104
+
105
+ Total loops = 1
106
+ Loops with prepare for pipelining pragma = 1
107
+ Loops with unroll pragma = 0
108
+ Loops with flatten pragma = 0
109
+ Loops with min range pragma = 1
110
+ Loops with max range pragma = 0
111
+ Loops with known trip count = 0
112
+
113
+ ------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------
114
+
115
+
116
+
117
+ --------------- LOOP STATISTICS : _ZNSt3__25arrayIN3aie6vectorI8bfloat16Lj32EEELj2EEC2Ev ---------------
118
+
119
+ Total loops = 1
120
+ Loops with prepare for pipelining pragma = 0
121
+ Loops with unroll pragma = 0
122
+ Loops with flatten pragma = 0
123
+ Loops with min range pragma = 0
124
+ Loops with max range pragma = 0
125
+ Loops with known trip count = 0
126
+
127
+ --------------------------------------------------------------------------------------------------------
128
+
129
+
130
+
131
+ --------------- LOOP STATISTICS : _ZN17elementwise_unaryI8bfloat1616elementwise_clipIS0_E20clip_internal_paramsIS0_EE3runEPS0_S6_R26elementwise_unary_params_tIS4_E ---------------
132
+
133
+ Total loops = 1
134
+ Loops with prepare for pipelining pragma = 1
135
+ Loops with unroll pragma = 0
136
+ Loops with flatten pragma = 0
137
+ Loops with min range pragma = 1
138
+ Loops with max range pragma = 0
139
+ Loops with known trip count = 0
140
+
141
+ -----------------------------------------------------------------------------------------------------------------------------------------------------------------------------------
142
+
143
+
144
+
145
+ --------------- LOOP STATISTICS : _ZL19shared_run_backboneI8bfloat16L5act_t0EEKvPT_S4_S4_R27elementwise_binary_params_tI15shared_params_tIS3_EE ---------------
146
+
147
+ Total loops = 1
148
+ Loops with prepare for pipelining pragma = 1
149
+ Loops with unroll pragma = 0
150
+ Loops with flatten pragma = 0
151
+ Loops with min range pragma = 1
152
+ Loops with max range pragma = 0
153
+ Loops with known trip count = 0
154
+
155
+ ---------------------------------------------------------------------------------------------------------------------------------------------------------------
156
+
157
+
158
+
159
+ --------------- LOOP STATISTICS : _ZN17elementwise_unaryI8bfloat1619elementwise_sigmoidIS0_E26sigmoid_templated_params_tIS0_EE3runEPS0_S6_R26elementwise_unary_params_tIS4_E ---------------
160
+
161
+ Total loops = 1
162
+ Loops with prepare for pipelining pragma = 1
163
+ Loops with unroll pragma = 0
164
+ Loops with flatten pragma = 0
165
+ Loops with min range pragma = 1
166
+ Loops with max range pragma = 0
167
+ Loops with known trip count = 0
168
+
169
+ --------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------
170
+
171
+
172
+
173
+ --------------- LOOP STATISTICS : _ZN17elementwise_unaryI8bfloat1616elementwise_tanhIS0_E23tanh_templated_params_tIS0_EE3runEPS0_S6_R26elementwise_unary_params_tIS4_E ---------------
174
+
175
+ Total loops = 1
176
+ Loops with prepare for pipelining pragma = 1
177
+ Loops with unroll pragma = 0
178
+ Loops with flatten pragma = 0
179
+ Loops with min range pragma = 1
180
+ Loops with max range pragma = 0
181
+ Loops with known trip count = 0
182
+
183
+ --------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------
184
+
185
+
186
+
187
+ --------------- LOOP STATISTICS : _ZN3aie4maskILj32EEC2Eb ---------------
188
+
189
+ Total loops = 2
190
+ Loops with prepare for pipelining pragma = 0
191
+ Loops with unroll pragma = 2
192
+ Loops with flatten pragma = 0
193
+ Loops with min range pragma = 0
194
+ Loops with max range pragma = 0
195
+ Loops with known trip count = 2
196
+
197
+ -------------------------------------------------------------------------
198
+
199
+
200
+
201
+ --------------- LOOP STATISTICS : _Z9avgpool2dILh1E8bfloat16Qsr5mllib5utilsE11is_one_of_vIT0_ahS0_EEvPS1_S2_R25avgpool2d_internal_paramsIS1_E ---------------
202
+
203
+ Total loops = 1
204
+ Loops with prepare for pipelining pragma = 1
205
+ Loops with unroll pragma = 0
206
+ Loops with flatten pragma = 0
207
+ Loops with min range pragma = 1
208
+ Loops with max range pragma = 0
209
+ Loops with known trip count = 0
210
+
211
+ -------------------------------------------------------------------------------------------------------------------------------------------------------------
212
+
213
+
214
+
215
+ --------------- LOOP STATISTICS : _ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE3runEPS0_S6_S6_R27elementwise_binary_params_tIS4_E ---------------
216
+
217
+ Total loops = 1
218
+ Loops with prepare for pipelining pragma = 1
219
+ Loops with unroll pragma = 0
220
+ Loops with flatten pragma = 0
221
+ Loops with min range pragma = 1
222
+ Loops with max range pragma = 0
223
+ Loops with known trip count = 0
224
+
225
+ ----------------------------------------------------------------------------------------------------------------------------------------------------------------------------
226
+
227
+
228
+
229
+ --------------- LOOP STATISTICS : _ZL27setup_conv2d_dw_params_bf16PKjR21conv2d_dw_bf16_paramsh ---------------
230
+
231
+ Total loops = 1
232
+ Loops with prepare for pipelining pragma = 0
233
+ Loops with unroll pragma = 0
234
+ Loops with flatten pragma = 0
235
+ Loops with min range pragma = 0
236
+ Loops with max range pragma = 0
237
+ Loops with known trip count = 1
238
+
239
+ --------------------------------------------------------------------------------------------------------------
240
+
241
+
242
+
243
+ --------------- LOOP STATISTICS : _Z9conv2d_dwILh1E8bfloat16S0_S0_N3adf16io_buffer_configINS1_7extentsIJEEENS1_7locking4syncENS1_10addressing6linearENS1_6marginILj0EEEEESB_NS2_IS4_NS5_5asyncES8_SA_EEQsr3stdE9is_same_vIT0_S0_EEvRNS1_9io_bufferISE_NS1_9direction2inET3_EERNSF_IT1_SH_T4_EERNSF_IT2_NSG_3outET5_EER21conv2d_dw_bf16_params ---------------
244
+
245
+ Total loops = 2
246
+ Loops with prepare for pipelining pragma = 2
247
+ Loops with unroll pragma = 0
248
+ Loops with flatten pragma = 0
249
+ Loops with min range pragma = 2
250
+ Loops with max range pragma = 0
251
+ Loops with known trip count = 0
252
+
253
+ -------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------
254
+
255
+
256
+
257
+ --------------- LOOP STATISTICS : _ZN18reduce_skeleton_c8I8bfloat1619reduce_mean_c8_implIS0_E23reduce_mean_c8_params_tIS0_EE3runEPS0_S6_R18reduce_c8_params_tIS4_E ---------------
258
+
259
+ Total loops = 2
260
+ Loops with prepare for pipelining pragma = 1
261
+ Loops with unroll pragma = 0
262
+ Loops with flatten pragma = 0
263
+ Loops with min range pragma = 1
264
+ Loops with max range pragma = 0
265
+ Loops with known trip count = 0
266
+
267
+ ----------------------------------------------------------------------------------------------------------------------------------------------------------------------------------
268
+
269
+
270
+
271
+ --------------- LOOP STATISTICS : _ZNSt3__25arrayIN3aie6vectorI8bfloat16Lj16EEELj4EEC2Ev ---------------
272
+
273
+ Total loops = 1
274
+ Loops with prepare for pipelining pragma = 0
275
+ Loops with unroll pragma = 0
276
+ Loops with flatten pragma = 0
277
+ Loops with min range pragma = 0
278
+ Loops with max range pragma = 0
279
+ Loops with known trip count = 0
280
+
281
+ --------------------------------------------------------------------------------------------------------
282
+
283
+
284
+
285
+ --------------- LOOP STATISTICS : _ZN19reduce_mean_c8_implI8bfloat16E16body_postprocessEPvR18reduce_c8_params_tI23reduce_mean_c8_params_tIS0_EE ---------------
286
+
287
+ Total loops = 2
288
+ Loops with prepare for pipelining pragma = 2
289
+ Loops with unroll pragma = 0
290
+ Loops with flatten pragma = 0
291
+ Loops with min range pragma = 2
292
+ Loops with max range pragma = 0
293
+ Loops with known trip count = 0
294
+
295
+ ---------------------------------------------------------------------------------------------------------------------------------------------------------------
296
+
297
+
298
+
299
+ --------------- LOOP STATISTICS : _ZN3aie4maskILj8EEC2Eb ---------------
300
+
301
+ Total loops = 2
302
+ Loops with prepare for pipelining pragma = 0
303
+ Loops with unroll pragma = 2
304
+ Loops with flatten pragma = 0
305
+ Loops with min range pragma = 0
306
+ Loops with max range pragma = 0
307
+ Loops with known trip count = 2
308
+
309
+ ------------------------------------------------------------------------
310
+
311
+
312
+
313
+ --------------- LOOP STATISTICS : _ZN3aie4maskILj16EEC2Eb ---------------
314
+
315
+ Total loops = 2
316
+ Loops with prepare for pipelining pragma = 0
317
+ Loops with unroll pragma = 2
318
+ Loops with flatten pragma = 0
319
+ Loops with min range pragma = 0
320
+ Loops with max range pragma = 0
321
+ Loops with known trip count = 2
322
+
323
+ -------------------------------------------------------------------------
324
+
325
+
326
+
327
+ --------------- LOOP STATISTICS : _ZNK3aie4maskILj8EEeqERKS1_ ---------------
328
+
329
+ Total loops = 1
330
+ Loops with prepare for pipelining pragma = 0
331
+ Loops with unroll pragma = 1
332
+ Loops with flatten pragma = 0
333
+ Loops with min range pragma = 0
334
+ Loops with max range pragma = 0
335
+ Loops with known trip count = 1
336
+
337
+ -----------------------------------------------------------------------------
338
+
339
+
340
+
341
+ --------------- LOOP STATISTICS : _ZNK3aie4maskILj16EEeqERKS1_ ---------------
342
+
343
+ Total loops = 1
344
+ Loops with prepare for pipelining pragma = 0
345
+ Loops with unroll pragma = 1
346
+ Loops with flatten pragma = 0
347
+ Loops with min range pragma = 0
348
+ Loops with max range pragma = 0
349
+ Loops with known trip count = 1
350
+
351
+ ------------------------------------------------------------------------------
352
+
353
+
354
+
355
+ --------------- LOOP STATISTICS : _Z26pad_3d_bfloat16_simplifiedP8bfloat16S0_R15pad_3d_params_t ---------------
356
+
357
+ Total loops = 3
358
+ Loops with prepare for pipelining pragma = 0
359
+ Loops with unroll pragma = 0
360
+ Loops with flatten pragma = 0
361
+ Loops with min range pragma = 0
362
+ Loops with max range pragma = 0
363
+ Loops with known trip count = 0
364
+
365
+ ---------------------------------------------------------------------------------------------------------------
366
+
367
+
368
+
369
+ --------------- PRAGMA INSERTION LOG (unroll threshold = 3000, max unroll factor = 1) ---------------
370
+
371
+ Adding pragma to function _Z24setup_conv2d_bf16_paramsILb1ELb0EEvPKjR18conv2d_bf16_paramshh :
372
+ Pragma added to loop at line 437 in file /usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/common/../../include/conv/conv2d_bf16_params.h : chess_loop_range(8,8)
373
+ Adding pragma to function _ZNSt3__25arrayIN3aie6vectorI8bfloat16Lj32EEELj2EEC2Ev :
374
+ Pragma added to loop at line 135 in file /usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libs/libcxx-9.0.0/include-lite/../include/array : chess_prepare_for_pipelining
375
+ Adding pragma to function _ZN3aie4maskILj32EEC2Eb :
376
+ Pragma added to loop at line 122 in file /usr/local/lib/python3.10/dist-packages/include/aie_api/detail/aie2/../../mask.hpp : chess_loop_range(1,1)
377
+ Pragma added to loop at line 122 in file /usr/local/lib/python3.10/dist-packages/include/aie_api/detail/aie2/../../mask.hpp : chess_flatten_loop
378
+ Pragma added to loop at line 128 in file /usr/local/lib/python3.10/dist-packages/include/aie_api/detail/aie2/../../mask.hpp : chess_loop_range(1,1)
379
+ Pragma added to loop at line 128 in file /usr/local/lib/python3.10/dist-packages/include/aie_api/detail/aie2/../../mask.hpp : chess_flatten_loop
380
+ Adding pragma to function _ZL27setup_conv2d_dw_params_bf16PKjR21conv2d_dw_bf16_paramsh :
381
+ Pragma added to loop at line 214 in file /usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/common/../../include/conv/conv2d_dw_bf16_params.h : chess_loop_range(4,4)
382
+ Adding pragma to function _ZNSt3__25arrayIN3aie6vectorI8bfloat16Lj16EEELj4EEC2Ev :
383
+ Pragma added to loop at line 135 in file /usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libs/libcxx-9.0.0/include-lite/../include/array : chess_prepare_for_pipelining
384
+ Adding pragma to function _ZN3aie4maskILj8EEC2Eb :
385
+ Pragma added to loop at line 122 in file /usr/local/lib/python3.10/dist-packages/include/aie_api/detail/aie2/../../mask.hpp : chess_loop_range(1,1)
386
+ Pragma added to loop at line 122 in file /usr/local/lib/python3.10/dist-packages/include/aie_api/detail/aie2/../../mask.hpp : chess_flatten_loop
387
+ Pragma added to loop at line 128 in file /usr/local/lib/python3.10/dist-packages/include/aie_api/detail/aie2/../../mask.hpp : chess_loop_range(1,1)
388
+ Pragma added to loop at line 128 in file /usr/local/lib/python3.10/dist-packages/include/aie_api/detail/aie2/../../mask.hpp : chess_flatten_loop
389
+ Adding pragma to function _ZN3aie4maskILj16EEC2Eb :
390
+ Pragma added to loop at line 122 in file /usr/local/lib/python3.10/dist-packages/include/aie_api/detail/aie2/../../mask.hpp : chess_loop_range(1,1)
391
+ Pragma added to loop at line 122 in file /usr/local/lib/python3.10/dist-packages/include/aie_api/detail/aie2/../../mask.hpp : chess_flatten_loop
392
+ Pragma added to loop at line 128 in file /usr/local/lib/python3.10/dist-packages/include/aie_api/detail/aie2/../../mask.hpp : chess_loop_range(1,1)
393
+ Pragma added to loop at line 128 in file /usr/local/lib/python3.10/dist-packages/include/aie_api/detail/aie2/../../mask.hpp : chess_flatten_loop
394
+ Adding pragma to function _ZNK3aie4maskILj16EEeqERKS1_ :
395
+ Pragma added to loop at line 249 in file /usr/local/lib/python3.10/dist-packages/include/aie_api/detail/aie2/../../mask.hpp : chess_loop_range(1,1)
396
+ Pragma added to loop at line 249 in file /usr/local/lib/python3.10/dist-packages/include/aie_api/detail/aie2/../../mask.hpp : chess_flatten_loop
397
+ Adding pragma to function _ZNK3aie4maskILj8EEeqERKS1_ :
398
+ Pragma added to loop at line 249 in file /usr/local/lib/python3.10/dist-packages/include/aie_api/detail/aie2/../../mask.hpp : chess_loop_range(1,1)
399
+ Pragma added to loop at line 249 in file /usr/local/lib/python3.10/dist-packages/include/aie_api/detail/aie2/../../mask.hpp : chess_flatten_loop
400
+
401
+ -----------------------------------------------------------------------------------------------------
402
+
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0_reloadable10/Release/0_0_reloadable10.calltree ADDED
@@ -0,0 +1,54 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+
2
+ // File generated by bridge version V-2024.06#84922c0d9f#241219, Fri Mar 21 03:46:39 2025
3
+ // Copyright 2014-2024 Synopsys, Inc. All rights reserved.
4
+ // bridge -o../Release/0_0_reloadable2 ../Release/0_0_reloadable2.o -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/isg -g -I/usr/local/lib/python3.10/dist-packages/include -I/app/vaiml_1.3_examples/camo/./segmentation_1_4_0_fp32_combined/vaiml_par_0/0/backend -I/usr/local/lib/python3.10/site-packages/include/aie_api -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/common -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/include/common -I/usr/local/lib/python3.10/dist-packages/vitis_mllib -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/misc -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/src/ml_adf -I/app/vaiml_1.3_examples/camo/segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/. -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libcxx-lite/include -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libs/libcxx-9.0.0/include-lite -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime/include -D__AIENGINE__ -D__AIE_ARCH__=21 -DDEPLOYMENT_ELF=1 -D__LOCK_FENCE_MODE__=0 -D__IO_BUFFER_FORCE_LIGHT_WEIGHT__ -DAIE_API_EMULATE_BFLOAT16_MMUL_WITH_BFP16=1 -DAIE_OPTION_SCALAR_FLOAT_ON_VECTOR -D__tct_tgt__=241219 -c0_0_reloadable2.bcf -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/softfloat/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libcxx-lite/lib/Release_LLVM -lme -lc -lm -lc++lite -lsoftfloat -S -export-locals -iconfig extra_memories.bcf -yTM -m -fC -fS -fH +m -T +work ../Release/chesswork1731 -pme
5
+
6
+
7
+ // Release: ipp V-2024.06-TGT-241219
8
+
9
+ _Z13kernelWrapperPPvjjjj
10
+ _Z26superkernel_reduce_mean_c8RN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE
11
+ _ZN18reduce_skeleton_c8I8bfloat1619reduce_mean_c8_implIS0_E23reduce_mean_c8_params_tIS0_EE5setupER18reduce_c8_params_tIS4_EPKv
12
+ _Z6pad_3dIL11pad_3d_mode0E8bfloat16Li1EEvPT0_S3_R15pad_3d_params_t
13
+ _ZN18reduce_skeleton_c8I8bfloat1619reduce_mean_c8_implIS0_E23reduce_mean_c8_params_tIS0_EE3runEPS0_S6_R18reduce_c8_params_tIS4_E
14
+ _ZN12me_primitive10udiv_dstepEjjRjS0_
15
+ _ZN12me_primitive10udiv_dstepEjjRjS0_ (*)
16
+ int32_to_float32
17
+ _ZL28normalizeRoundAndPackFloat32iij
18
+ _ZL19roundAndPackFloat32iij
19
+ float32_add
20
+ _ZL14addFloat32Sigsjji
21
+ _ZL19propagateFloat32NaNjj
22
+ _ZL19roundAndPackFloat32iij (*)
23
+ _ZL14subFloat32Sigsjji
24
+ _ZL19propagateFloat32NaNjj (*)
25
+ _ZL28normalizeRoundAndPackFloat32iij (*)
26
+
27
+
28
+ Call tree stack and functions sizes:
29
+
30
+ stack stack stack call func func function name
31
+ desc level level desc
32
+ ----- ----- ----- ----- ----- ----- --------------------------------------------------------------
33
+ 64 448 0 0 220 10058 _Z13kernelWrapperPPvjjjj
34
+ 128 384 1 1 2676 9838 _Z26superkernel_reduce_mean_c8RN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE
35
+ 64 64 2 2 1588 1588 _ZN18reduce_skeleton_c8I8bfloat1619reduce_mean_c8_implIS0_E23reduce_mean_c8_params_tIS0_EE5setupER18reduce_c8_params_tIS4_EPKv
36
+ 0 0 2 2 670 670 _Z6pad_3dIL11pad_3d_mode0E8bfloat16Li1EEvPT0_S3_R15pad_3d_params_t
37
+ 256 256 2 2 2680 2822 _ZN18reduce_skeleton_c8I8bfloat1619reduce_mean_c8_implIS0_E23reduce_mean_c8_params_tIS0_EE3runEPS0_S6_R18reduce_c8_params_tIS4_E
38
+ 0 0 3 3 142 142 _ZN12me_primitive10udiv_dstepEjjRjS0_
39
+ 0 0 2 2 142 142 _ZN12me_primitive10udiv_dstepEjjRjS0_
40
+ 0 0 2 2 114 530 int32_to_float32
41
+ 0 0 2 3 24 416 _ZL28normalizeRoundAndPackFloat32iij <tail call>
42
+ 0 0 2 4 392 392 _ZL19roundAndPackFloat32iij <tail call>
43
+ 0 0 2 2 64 1968 float32_add
44
+ 0 0 3 3 624 1128 _ZL14addFloat32Sigsjji
45
+ 0 0 4 4 112 112 _ZL19propagateFloat32NaNjj
46
+ 0 0 3 4 392 392 _ZL19roundAndPackFloat32iij <tail call>
47
+ 0 0 2 3 752 1280 _ZL14subFloat32Sigsjji <tail call>
48
+ 0 0 3 4 112 112 _ZL19propagateFloat32NaNjj
49
+ 0 0 2 4 24 416 _ZL28normalizeRoundAndPackFloat32iij <tail call> (*)
50
+
51
+
52
+ Maximum call level : 4
53
+ Maximum stack level: 4
54
+ Maximum stack size : 448
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0_reloadable10/Release/0_0_reloadable10.cmic2 ADDED
The diff for this file is too large to render. See raw diff
 
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0_reloadable10/Release/0_0_reloadable10.cmico ADDED
@@ -0,0 +1 @@
 
 
1
+ +Mdec