Add files using upload-large-folder tool
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0/lcp/0_0_30.bin +3 -0
- segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0/lcp/0_0_32.bin +3 -0
- segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0/lcp/0_0_33.bin +3 -0
- segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0/lcp/0_0_34.bin +3 -0
- segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0/lcp/0_0_35.bin +3 -0
- segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0/lcp/0_0_36.bin +3 -0
- segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0/lcp/0_0_39.bin +3 -0
- segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_2_reloadable21/Release/0_2_reloadable21.cmic2 +0 -0
- segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_2_reloadable21/Release/0_2_reloadable21.cmico +1 -0
- segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_2_reloadable21/Release/0_2_reloadable21.lst +0 -0
- segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_2_reloadable21/Release/0_2_reloadable21.map +270 -0
- segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_2_reloadable21/Release/0_2_reloadable21.sdr +120 -0
- segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_2_reloadable21/Release/0_2_reloadable21.srv +0 -0
- segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_2_reloadable21/Release/0_2_reloadable21.txt +0 -0
- segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_2_reloadable21/scripts/0_2_reloadable21.bcf +16 -0
- segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_2_reloadable21/scripts/0_2_reloadable21.prx +13 -0
- segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_2_reloadable21/src/0_2_reloadable21.cc +99 -0
- segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_2_reloadable22/Release/0_2_reloadable22.calltree +56 -0
- segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_2_reloadable22/Release/0_2_reloadable22.cmic2 +0 -0
- segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_2_reloadable22/Release/0_2_reloadable22.cmico +1 -0
- segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_2_reloadable22/Release/0_2_reloadable22.lst +0 -0
- segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_2_reloadable22/Release/0_2_reloadable22.map +202 -0
- segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_2_reloadable22/Release/0_2_reloadable22.sdr +105 -0
- segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_2_reloadable22/Release/0_2_reloadable22.srv +0 -0
- segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_2_reloadable22/Release/0_2_reloadable22.txt +0 -0
- segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_2_reloadable22/scripts/0_2_reloadable22.bcf +16 -0
- segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_2_reloadable22/scripts/0_2_reloadable22.prx +13 -0
- segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_2_reloadable22/src/0_2_reloadable22.cc +81 -0
- segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_2_reloadable23/Release/0_2_reloadable23.calltree +92 -0
- segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_2_reloadable23/Release/0_2_reloadable23.cmic2 +0 -0
- segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_2_reloadable23/Release/0_2_reloadable23.cmico +1 -0
- segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_2_reloadable23/Release/0_2_reloadable23.lst +0 -0
- segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_2_reloadable23/Release/0_2_reloadable23.map +296 -0
- segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_2_reloadable23/Release/0_2_reloadable23.sdr +125 -0
- segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_2_reloadable23/Release/0_2_reloadable23.srv +0 -0
- segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_2_reloadable23/Release/0_2_reloadable23.txt +0 -0
- segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_2_reloadable23/scripts/0_2_reloadable23.bcf +16 -0
- segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_2_reloadable23/scripts/0_2_reloadable23.prx +13 -0
- segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_2_reloadable23/src/0_2_reloadable23.cc +124 -0
- segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_2_reloadable24/Release/0_2_reloadable24.calltree +88 -0
- segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_2_reloadable24/Release/0_2_reloadable24.cmic2 +0 -0
- segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_2_reloadable24/Release/0_2_reloadable24.cmico +1 -0
- segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_2_reloadable24/Release/0_2_reloadable24.lst +0 -0
- segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_2_reloadable24/Release/0_2_reloadable24.map +294 -0
- segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_2_reloadable24/Release/0_2_reloadable24.sdr +125 -0
- segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_2_reloadable24/Release/0_2_reloadable24.srv +0 -0
- segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_2_reloadable24/Release/0_2_reloadable24.txt +0 -0
- segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_2_reloadable24/scripts/0_2_reloadable24.bcf +16 -0
- segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_2_reloadable24/scripts/0_2_reloadable24.prx +13 -0
- segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_2_reloadable24/src/0_2_reloadable24.cc +113 -0
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0/lcp/0_0_30.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:10fe86e880716f51f9b88c3bfd1f1a3a2a6bf5d80aa35a23fe02afc67a0bf8ce
|
3 |
+
size 384
|
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0/lcp/0_0_32.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c8fec3a09bf7510cd8ce1ab86c293d7b466805391ace22f6b975a073c96e6e03
|
3 |
+
size 296
|
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0/lcp/0_0_33.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:541b329c484a094eeac656452e18f0be0816bb2438bdfd19f8ad1e0a9b3b9cc3
|
3 |
+
size 296
|
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0/lcp/0_0_34.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6fb9253ded0289c5b796164e40201bd8f5d660b2373d91b5b58eb314375af7e7
|
3 |
+
size 296
|
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0/lcp/0_0_35.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4ae43a8dcc0cd99130f42249d4f2a9f1fc91c3c99699db65bb98ad360a326ef6
|
3 |
+
size 376
|
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0/lcp/0_0_36.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f160f47a8817f836489ba77f94fd815c17526fb3448a8ce9f2c7e6a14630ebe2
|
3 |
+
size 516
|
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_0/lcp/0_0_39.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e42c0244a6c7c553df9a202c9f4762ed90bbf1ab021b2d8875c10215fa23db09
|
3 |
+
size 296
|
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_2_reloadable21/Release/0_2_reloadable21.cmic2
ADDED
The diff for this file is too large to render.
See raw diff
|
|
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_2_reloadable21/Release/0_2_reloadable21.cmico
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
+Mdec
|
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_2_reloadable21/Release/0_2_reloadable21.lst
ADDED
The diff for this file is too large to render.
See raw diff
|
|
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_2_reloadable21/Release/0_2_reloadable21.map
ADDED
@@ -0,0 +1,270 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
|
2 |
+
// File generated by bridge version V-2024.06#84922c0d9f#241219, Fri Mar 21 03:57:04 2025
|
3 |
+
// Copyright 2014-2024 Synopsys, Inc. All rights reserved.
|
4 |
+
// bridge -o../Release/0_0_reloadable21 ../Release/0_0_reloadable21.o -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/isg -g -I/usr/local/lib/python3.10/dist-packages/include -I/app/vaiml_1.3_examples/camo/./segmentation_1_4_0_fp32_combined/vaiml_par_0/0/backend -I/usr/local/lib/python3.10/site-packages/include/aie_api -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/common -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/include/common -I/usr/local/lib/python3.10/dist-packages/vitis_mllib -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/misc -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/src/ml_adf -I/app/vaiml_1.3_examples/camo/segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/. -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libcxx-lite/include -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libs/libcxx-9.0.0/include-lite -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime/include -D__AIENGINE__ -D__AIE_ARCH__=21 -DDEPLOYMENT_ELF=1 -D__LOCK_FENCE_MODE__=0 -D__IO_BUFFER_FORCE_LIGHT_WEIGHT__ -DAIE_API_EMULATE_BFLOAT16_MMUL_WITH_BFP16=1 -DAIE_OPTION_SCALAR_FLOAT_ON_VECTOR -D__tct_tgt__=241219 -c0_0_reloadable21.bcf -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/softfloat/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libcxx-lite/lib/Release_LLVM -lme -lc -lm -lc++lite -lsoftfloat -S -export-locals -iconfig extra_memories.bcf -yTM -m -fC -fS -fH +m -T +work ../Release/chesswork5877 -pme
|
5 |
+
|
6 |
+
// Release: ipp V-2024.06-TGT-241219
|
7 |
+
|
8 |
+
Memory map for memory 'DM_stack':
|
9 |
+
|
10 |
+
Size = 1048576
|
11 |
+
Width = 8 bits
|
12 |
+
Offset = 0
|
13 |
+
Used = 2368
|
14 |
+
|
15 |
+
0x0007bac0..0x0007c3ff ( 2368 items) : Stack
|
16 |
+
|
17 |
+
Memory map for memory 'DMb':
|
18 |
+
|
19 |
+
Size = 1048576
|
20 |
+
Width = 8 bits
|
21 |
+
Offset = 0
|
22 |
+
Used = 3197
|
23 |
+
|
24 |
+
0x00000000..0x0007babf ( 506560 items) : Reserved
|
25 |
+
0x0007bac0..0x0007c3ff ( 2368 items) : Stack
|
26 |
+
0x0007c400..0x0007c43f ( 64 items) : Reserved
|
27 |
+
0x0007c440..0x0007c443 ( 4 items) : ../Release/0_0_reloadable21.o::_ZL9curr_iter (Data, Local, .bss.DMb.4)
|
28 |
+
0x0007c444..0x0007c447 ( 4 items) : ../Release/0_0_reloadable21.o::_ZL14num_depth_iter (Data, Local, .bss.DMb.4)
|
29 |
+
0x0007c448..0x0007c44b ( 4 items) : ../Release/0_0_reloadable21.o::_ZL10depth_iter (Data, Local, .bss.DMb.4)
|
30 |
+
0x0007c44c..0x0007c44f ( 4 items) : ../Release/0_0_reloadable21.o::_ZL11total_iters (Data, Local, .bss.DMb.4)
|
31 |
+
0x0007c450..0x0007c453 ( 4 items) : ../Release/0_0_reloadable21.o::_ZL8core_row (Data, Local, .bss.DMb.4)
|
32 |
+
0x0007c454..0x0007c457 ( 4 items) : ../Release/0_0_reloadable21.o::_ZL11ifm1_offset (Data, Local, .bss.DMb.4)
|
33 |
+
0x0007c458..0x0007c45b ( 4 items) : ../Release/0_0_reloadable21.o::_ZL11ifm2_offset (Data, Local, .bss.DMb.4)
|
34 |
+
0x0007c45c..0x0007c45f ( 4 items) : ../Release/0_0_reloadable21.o::_ZL8num_iter (Data, Local, .data.DMb.4)
|
35 |
+
0x0007c460..0x0007c463 ( 4 items) : me_defs.o(/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/Release/libme.a)::_ZN12me_primitive11control_satE (Data, Global, .bss.DMb.4)
|
36 |
+
0x0007c464..0x0007c464 ( 1 items) : me_defs.o(/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/Release/libme.a)::_ZN12me_primitive11control_rndE (Data, Global, .bss.DMb.1)
|
37 |
+
0x0007c480..0x0007c497 ( 24 items) : ../Release/0_0_reloadable21.o::_ZL20g_uniformKernelFuncs (Data, Local, .rodata.DMb.64)
|
38 |
+
|
39 |
+
Called functions : _Z14_b1638_wrapperPPv
|
40 |
+
_Z14_b1655_wrapperPPv
|
41 |
+
_Z13_b891_wrapperPPv
|
42 |
+
_Z13_b896_wrapperPPv
|
43 |
+
_Z14_b1672_wrapperPPv
|
44 |
+
_Z13_b886_wrapperPPv
|
45 |
+
|
46 |
+
0x0007c4c0..0x0007c4ff ( 64 items) : ../Release/0_0_reloadable21.o::add1d_params (Data, Global, .bss.DMb.64)
|
47 |
+
0x0007c500..0x0007c53f ( 64 items) : ../Release/0_0_reloadable21.o::mul1d_params (Data, Global, .bss.DMb.64)
|
48 |
+
0x0007c540..0x0007c57f ( 64 items) : ../Release/0_0_reloadable21.o::sub1d_params (Data, Global, .bss.DMb.64)
|
49 |
+
0x0007c580..0x0007c5bf ( 64 items) : ../Release/0_0_reloadable21.o::sigmoid1d_params (Data, Global, .bss.DMb.64)
|
50 |
+
0x0007c5c0..0x0007c5ff ( 64 items) : ../Release/0_0_reloadable21.o::tanh1d_params (Data, Global, .bss.DMb.64)
|
51 |
+
0x0007c600..0x0007c7bf ( 448 items) : ../Release/0_0_reloadable21.o::conv2d_params (Data, Global, .bss.DMb.64)
|
52 |
+
0x0007ccc0..0x000fffff ( 537408 items) : Reserved
|
53 |
+
|
54 |
+
Memory map for memory 'PM':
|
55 |
+
|
56 |
+
Size = 1048576
|
57 |
+
Width = 8 bits
|
58 |
+
Offset = 0
|
59 |
+
Used = 10946
|
60 |
+
|
61 |
+
0x00000000..0x0000092f ( 2352 items) : Reserved
|
62 |
+
0x00000930..0x00000ab5 ( 390 items) : ../Release/0_0_reloadable21.o::_Z13kernelWrapperPPvjjjj (Function, Global, .text) (stack frame size = 64)
|
63 |
+
|
64 |
+
Referenced symbols: _ZL20g_uniformKernelFuncs
|
65 |
+
|
66 |
+
0x00000ac0..0x00001055 ( 1430 items) : ../Release/0_0_reloadable21.o::_Z24setup_conv2d_bf16_paramsILb1ELb0EEvPKjR18conv2d_bf16_paramshh (Function, Weak, .text) (stack frame size = 64)
|
67 |
+
0x00001060..0x0000116d ( 270 items) : ../Release/0_0_reloadable21.o::_Z21convert_bf16_to_bfp16I8bfloat16Lb0EEvPT_PS0_RK13BfToBfpParams (Function, Weak, .text) (stack frame size = 0)
|
68 |
+
|
69 |
+
Referenced symbols: _ZN12me_primitive11control_rndE
|
70 |
+
|
71 |
+
0x00001170..0x00001ad9 ( 2410 items) : ../Release/0_0_reloadable21.o::_Z11conv2d_bf16ILh1EL5act_t0E8bfloat16S1_S1_N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_NS3_IS5_NS6_5asyncES9_SB_EELb0ELb0ELb1ELb0EEvRNS2_9io_bufferIT1_NS2_9direction2inET4_EERNSF_IT2_SI_T5_EERNSF_IT3_NSH_3outET6_EER18conv2d_bf16_params (Function, Weak, .text) (stack frame size = 128)
|
72 |
+
|
73 |
+
Called functions : _Z21convert_bf16_to_bfp16I8bfloat16Lb0EEvPT_PS0_RK13BfToBfpParams
|
74 |
+
|
75 |
+
Referenced symbols: _ZN12me_primitive11control_rndE
|
76 |
+
|
77 |
+
0x00001ae0..0x00001d17 ( 568 items) : ../Release/0_0_reloadable21.o::_Z14conv2d_maxpoolRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEESF_RA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE (Function, Global, .text) (stack frame size = 64)
|
78 |
+
|
79 |
+
Called functions : _Z24setup_conv2d_bf16_paramsILb1ELb0EEvPKjR18conv2d_bf16_paramshh
|
80 |
+
_Z11conv2d_bf16ILh1EL5act_t0E8bfloat16S1_S1_N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_NS3_IS5_NS6_5asyncES9_SB_EELb0ELb0ELb1ELb0EEvRNS2_9io_bufferIT1_NS2_9direction2inET4_EERNSF_IT2_SI_T5_EERNSF_IT3_NSH_3outET6_EER18conv2d_bf16_params
|
81 |
+
|
82 |
+
Referenced symbols: _ZL9curr_iter
|
83 |
+
conv2d_params
|
84 |
+
_ZN12me_primitive11control_rndE
|
85 |
+
_ZN12me_primitive11control_satE
|
86 |
+
_ZL14num_depth_iter
|
87 |
+
_ZL8num_iter
|
88 |
+
_ZL10depth_iter
|
89 |
+
_ZL11total_iters
|
90 |
+
|
91 |
+
0x00001d20..0x00001f35 ( 534 items) : ../Release/0_0_reloadable21.o::_ZL19shared_run_backboneI8bfloat16L5act_t0EEKvPT_S4_S4_R27elementwise_binary_params_tI15shared_params_tIS3_EE (Function, Local, .text) (stack frame size = 128)
|
92 |
+
|
93 |
+
Referenced symbols: _ZN12me_primitive11control_rndE
|
94 |
+
|
95 |
+
0x00001f40..0x00001f7d ( 62 items) : ../Release/0_0_reloadable21.o::_ZN17elementwise_unaryI8bfloat1619elementwise_sigmoidIS0_E26sigmoid_templated_params_tIS0_EE5setupER26elementwise_unary_params_tIS4_EPKv (Function, Weak, .text) (stack frame size = 0)
|
96 |
+
0x00001f80..0x000020f9 ( 378 items) : ../Release/0_0_reloadable21.o::_ZN17elementwise_unaryI8bfloat1619elementwise_sigmoidIS0_E26sigmoid_templated_params_tIS0_EE3runEPS0_S6_R26elementwise_unary_params_tIS4_E (Function, Weak, .text) (stack frame size = 0)
|
97 |
+
|
98 |
+
Referenced symbols: _ZN12me_primitive11control_rndE
|
99 |
+
|
100 |
+
0x00002100..0x000022e7 ( 488 items) : ../Release/0_0_reloadable21.o::_Z21superkernel_sigmoid1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE (Function, Global, .text) (stack frame size = 64)
|
101 |
+
|
102 |
+
Called functions : _ZN17elementwise_unaryI8bfloat1619elementwise_sigmoidIS0_E26sigmoid_templated_params_tIS0_EE5setupER26elementwise_unary_params_tIS4_EPKv
|
103 |
+
_ZN17elementwise_unaryI8bfloat1619elementwise_sigmoidIS0_E26sigmoid_templated_params_tIS0_EE3runEPS0_S6_R26elementwise_unary_params_tIS4_E
|
104 |
+
|
105 |
+
Referenced symbols: _ZL9curr_iter
|
106 |
+
_ZL8core_row
|
107 |
+
sigmoid1d_params
|
108 |
+
_ZN12me_primitive11control_rndE
|
109 |
+
_ZN12me_primitive11control_satE
|
110 |
+
_ZL11ifm1_offset
|
111 |
+
_ZL8num_iter
|
112 |
+
|
113 |
+
0x000022f0..0x0000232d ( 62 items) : ../Release/0_0_reloadable21.o::_ZN17elementwise_unaryI8bfloat1616elementwise_tanhIS0_E23tanh_templated_params_tIS0_EE5setupER26elementwise_unary_params_tIS4_EPKv (Function, Weak, .text) (stack frame size = 0)
|
114 |
+
0x00002330..0x000026f1 ( 962 items) : ../Release/0_0_reloadable21.o::_ZN17elementwise_unaryI8bfloat1616elementwise_tanhIS0_E23tanh_templated_params_tIS0_EE3runEPS0_S6_R26elementwise_unary_params_tIS4_E (Function, Weak, .text) (stack frame size = 384)
|
115 |
+
|
116 |
+
Referenced symbols: _ZN12me_primitive11control_rndE
|
117 |
+
|
118 |
+
0x00002700..0x000028e7 ( 488 items) : ../Release/0_0_reloadable21.o::_Z18superkernel_tanh1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE (Function, Global, .text) (stack frame size = 64)
|
119 |
+
|
120 |
+
Called functions : _ZN17elementwise_unaryI8bfloat1616elementwise_tanhIS0_E23tanh_templated_params_tIS0_EE5setupER26elementwise_unary_params_tIS4_EPKv
|
121 |
+
_ZN17elementwise_unaryI8bfloat1616elementwise_tanhIS0_E23tanh_templated_params_tIS0_EE3runEPS0_S6_R26elementwise_unary_params_tIS4_E
|
122 |
+
|
123 |
+
Referenced symbols: _ZL9curr_iter
|
124 |
+
_ZL8core_row
|
125 |
+
tanh1d_params
|
126 |
+
_ZN12me_primitive11control_rndE
|
127 |
+
_ZN12me_primitive11control_satE
|
128 |
+
_ZL11ifm1_offset
|
129 |
+
_ZL8num_iter
|
130 |
+
|
131 |
+
0x000028f0..0x00002963 ( 116 items) : ../Release/0_0_reloadable21.o::_ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE21shared_setup_backboneER27elementwise_binary_params_tIS5_EPKv (Function, Weak, .text) (stack frame size = 0)
|
132 |
+
0x00002970..0x000029d1 ( 98 items) : ../Release/0_0_reloadable21.o::_ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE5setupER27elementwise_binary_params_tIS5_EPKv (Function, Weak, .text) (stack frame size = 64)
|
133 |
+
|
134 |
+
Called functions : _ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE21shared_setup_backboneER27elementwise_binary_params_tIS5_EPKv
|
135 |
+
|
136 |
+
0x000029e0..0x000029ef ( 16 items) : ../Release/0_0_reloadable21.o::_ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE3runEPS0_S7_S7_R27elementwise_binary_params_tIS5_E (Function, Weak, .text) (stack frame size = 0)
|
137 |
+
|
138 |
+
Called functions : _ZL19shared_run_backboneI8bfloat16L5act_t0EEKvPT_S4_S4_R27elementwise_binary_params_tI15shared_params_tIS3_EE
|
139 |
+
|
140 |
+
0x000029f0..0x00002c49 ( 602 items) : ../Release/0_0_reloadable21.o::_Z17superkernel_add1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERNS0_IS1_NS2_3outESK_EE (Function, Global, .text) (stack frame size = 64)
|
141 |
+
|
142 |
+
Called functions : _ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE5setupER27elementwise_binary_params_tIS5_EPKv
|
143 |
+
_ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE3runEPS0_S7_S7_R27elementwise_binary_params_tIS5_E
|
144 |
+
|
145 |
+
Referenced symbols: _ZL9curr_iter
|
146 |
+
_ZL8core_row
|
147 |
+
add1d_params
|
148 |
+
_ZN12me_primitive11control_rndE
|
149 |
+
_ZN12me_primitive11control_satE
|
150 |
+
_ZL11ifm1_offset
|
151 |
+
_ZL11ifm2_offset
|
152 |
+
_ZL8num_iter
|
153 |
+
|
154 |
+
0x00002c50..0x00002c67 ( 24 items) : ../Release/0_0_reloadable21.o::_ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS4_E (Function, Weak, .text) (stack frame size = 0)
|
155 |
+
0x00002c70..0x00002cf9 ( 138 items) : ../Release/0_0_reloadable21.o::_ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS4_EPKv (Function, Weak, .text) (stack frame size = 64)
|
156 |
+
|
157 |
+
Called functions : _ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS4_E
|
158 |
+
|
159 |
+
0x00002d00..0x00002e23 ( 292 items) : ../Release/0_0_reloadable21.o::_ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE3runEPS0_S6_S6_R27elementwise_binary_params_tIS4_E (Function, Weak, .text) (stack frame size = 0)
|
160 |
+
|
161 |
+
Referenced symbols: _ZN12me_primitive11control_rndE
|
162 |
+
|
163 |
+
0x00002e30..0x00003089 ( 602 items) : ../Release/0_0_reloadable21.o::_Z17superkernel_mul1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERNS0_IS1_NS2_3outESK_EE (Function, Global, .text) (stack frame size = 64)
|
164 |
+
|
165 |
+
Called functions : _ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS4_EPKv
|
166 |
+
_ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE3runEPS0_S6_S6_R27elementwise_binary_params_tIS4_E
|
167 |
+
|
168 |
+
Referenced symbols: _ZL9curr_iter
|
169 |
+
_ZL8core_row
|
170 |
+
mul1d_params
|
171 |
+
_ZN12me_primitive11control_rndE
|
172 |
+
_ZN12me_primitive11control_satE
|
173 |
+
_ZL11ifm1_offset
|
174 |
+
_ZL11ifm2_offset
|
175 |
+
_ZL8num_iter
|
176 |
+
|
177 |
+
0x00003090..0x00003103 ( 116 items) : ../Release/0_0_reloadable21.o::_ZN25elementwise_binary_sharedI8bfloat168sub_implIS0_E15shared_params_tIS0_EL5act_t0EE21shared_setup_backboneER27elementwise_binary_params_tIS4_EPKv (Function, Weak, .text) (stack frame size = 0)
|
178 |
+
0x00003110..0x00003159 ( 74 items) : ../Release/0_0_reloadable21.o::_ZN25elementwise_binary_sharedI8bfloat168sub_implIS0_E15shared_params_tIS0_EL5act_t0EE5setupER27elementwise_binary_params_tIS4_EPKv (Function, Weak, .text) (stack frame size = 64)
|
179 |
+
|
180 |
+
Called functions : _ZN25elementwise_binary_sharedI8bfloat168sub_implIS0_E15shared_params_tIS0_EL5act_t0EE21shared_setup_backboneER27elementwise_binary_params_tIS4_EPKv
|
181 |
+
|
182 |
+
0x00003160..0x0000316f ( 16 items) : ../Release/0_0_reloadable21.o::_ZN25elementwise_binary_sharedI8bfloat168sub_implIS0_E15shared_params_tIS0_EL5act_t0EE3runEPS0_S7_S7_R27elementwise_binary_params_tIS4_E (Function, Weak, .text) (stack frame size = 0)
|
183 |
+
|
184 |
+
Called functions : _ZL19shared_run_backboneI8bfloat16L5act_t0EEKvPT_S4_S4_R27elementwise_binary_params_tI15shared_params_tIS3_EE
|
185 |
+
|
186 |
+
0x00003170..0x000033c9 ( 602 items) : ../Release/0_0_reloadable21.o::_Z17superkernel_sub1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERNS0_IS1_NS2_3outESK_EE (Function, Global, .text) (stack frame size = 64)
|
187 |
+
|
188 |
+
Called functions : _ZN25elementwise_binary_sharedI8bfloat168sub_implIS0_E15shared_params_tIS0_EL5act_t0EE5setupER27elementwise_binary_params_tIS4_EPKv
|
189 |
+
_ZN25elementwise_binary_sharedI8bfloat168sub_implIS0_E15shared_params_tIS0_EL5act_t0EE3runEPS0_S7_S7_R27elementwise_binary_params_tIS4_E
|
190 |
+
|
191 |
+
Referenced symbols: _ZL9curr_iter
|
192 |
+
_ZL8core_row
|
193 |
+
sub1d_params
|
194 |
+
_ZN12me_primitive11control_rndE
|
195 |
+
_ZN12me_primitive11control_satE
|
196 |
+
_ZL11ifm1_offset
|
197 |
+
_ZL11ifm2_offset
|
198 |
+
_ZL8num_iter
|
199 |
+
|
200 |
+
0x000033d0..0x000033ef ( 32 items) : ../Release/0_0_reloadable21.o::_Z14_b1638_wrapperPPv (Function, Global, .text) (stack frame size = 0)
|
201 |
+
|
202 |
+
Called functions : _Z21superkernel_sigmoid1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE
|
203 |
+
|
204 |
+
0x000033f0..0x00003413 ( 36 items) : ../Release/0_0_reloadable21.o::_Z14_b1655_wrapperPPv (Function, Global, .text) (stack frame size = 0)
|
205 |
+
|
206 |
+
Called functions : _Z17superkernel_sub1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERNS0_IS1_NS2_3outESK_EE
|
207 |
+
|
208 |
+
0x00003420..0x00003443 ( 36 items) : ../Release/0_0_reloadable21.o::_Z13_b891_wrapperPPv (Function, Global, .text) (stack frame size = 0)
|
209 |
+
|
210 |
+
Called functions : _Z17superkernel_mul1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERNS0_IS1_NS2_3outESK_EE
|
211 |
+
|
212 |
+
0x00003450..0x00003473 ( 36 items) : ../Release/0_0_reloadable21.o::_Z13_b896_wrapperPPv (Function, Global, .text) (stack frame size = 0)
|
213 |
+
|
214 |
+
Called functions : _Z14conv2d_maxpoolRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEESF_RA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE
|
215 |
+
|
216 |
+
0x00003480..0x0000349f ( 32 items) : ../Release/0_0_reloadable21.o::_Z14_b1672_wrapperPPv (Function, Global, .text) (stack frame size = 0)
|
217 |
+
|
218 |
+
Called functions : _Z18superkernel_tanh1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE
|
219 |
+
|
220 |
+
0x000034a0..0x000034c3 ( 36 items) : ../Release/0_0_reloadable21.o::_Z13_b886_wrapperPPv (Function, Global, .text) (stack frame size = 0)
|
221 |
+
|
222 |
+
Called functions : _Z17superkernel_add1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERNS0_IS1_NS2_3outESK_EE
|
223 |
+
|
224 |
+
|
225 |
+
External symbols:
|
226 |
+
|
227 |
+
__dso_handle = 0x0
|
228 |
+
_ctors_end = 0x0
|
229 |
+
_ctors_start = 0x0
|
230 |
+
_dtors_end = 0x0
|
231 |
+
_dtors_start = 0x0
|
232 |
+
_pc_end = 0x34c4
|
233 |
+
_pc_start = 0x930
|
234 |
+
_sp_end_DM_stack = 0x7c400
|
235 |
+
_sp_start_DM_stack = 0x7bac0
|
236 |
+
|
237 |
+
Section summary for memory 'DM_stack':
|
238 |
+
|
239 |
+
.stack File
|
240 |
+
---------- ----------
|
241 |
+
2368
|
242 |
+
---------- ----------
|
243 |
+
2368 Total
|
244 |
+
|
245 |
+
Section summary for memory 'DMb':
|
246 |
+
|
247 |
+
.bss .data .rodata File
|
248 |
+
---------- ---------- ---------- ----------
|
249 |
+
796 4 24 ../Release/0_0_reloadable21.o
|
250 |
+
5 0 0 me_defs.o(/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/Release/libme.a)
|
251 |
+
---------- ---------- ---------- ----------
|
252 |
+
801 4 24 Total
|
253 |
+
|
254 |
+
Section summary for memory 'PM':
|
255 |
+
|
256 |
+
.text File
|
257 |
+
---------- ----------
|
258 |
+
10946 ../Release/0_0_reloadable21.o
|
259 |
+
---------- ----------
|
260 |
+
10946 Total
|
261 |
+
|
262 |
+
File summary:
|
263 |
+
|
264 |
+
../Release/0_0_reloadable21.o
|
265 |
+
DMb 824
|
266 |
+
PM 10946
|
267 |
+
|
268 |
+
me_defs.o(/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/Release/libme.a)
|
269 |
+
DMb 5
|
270 |
+
|
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_2_reloadable21/Release/0_2_reloadable21.sdr
ADDED
@@ -0,0 +1,120 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
|
2 |
+
// File generated by bridge version V-2024.06#84922c0d9f#241219, Fri Mar 21 03:57:04 2025
|
3 |
+
// Copyright 2014-2024 Synopsys, Inc. All rights reserved.
|
4 |
+
// bridge -o../Release/0_0_reloadable21 ../Release/0_0_reloadable21.o -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/isg -g -I/usr/local/lib/python3.10/dist-packages/include -I/app/vaiml_1.3_examples/camo/./segmentation_1_4_0_fp32_combined/vaiml_par_0/0/backend -I/usr/local/lib/python3.10/site-packages/include/aie_api -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/common -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/include/common -I/usr/local/lib/python3.10/dist-packages/vitis_mllib -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/misc -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/src/ml_adf -I/app/vaiml_1.3_examples/camo/segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/. -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libcxx-lite/include -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libs/libcxx-9.0.0/include-lite -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime/include -D__AIENGINE__ -D__AIE_ARCH__=21 -DDEPLOYMENT_ELF=1 -D__LOCK_FENCE_MODE__=0 -D__IO_BUFFER_FORCE_LIGHT_WEIGHT__ -DAIE_API_EMULATE_BFLOAT16_MMUL_WITH_BFP16=1 -DAIE_OPTION_SCALAR_FLOAT_ON_VECTOR -D__tct_tgt__=241219 -c0_0_reloadable21.bcf -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/softfloat/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libcxx-lite/lib/Release_LLVM -lme -lc -lm -lc++lite -lsoftfloat -S -export-locals -iconfig extra_memories.bcf -yTM -m -fC -fS -fH +m -T +work ../Release/chesswork5877 -pme
|
5 |
+
|
6 |
+
// Release: ipp V-2024.06-TGT-241219
|
7 |
+
|
8 |
+
// Symbols in memory 'DM_bankA':
|
9 |
+
// Symbols in memory 'DM_bankAB':
|
10 |
+
// Symbols in memory 'DM_bankAC':
|
11 |
+
// Symbols in memory 'DM_bankAD':
|
12 |
+
// Symbols in memory 'DM_bankB':
|
13 |
+
// Symbols in memory 'DM_bankBC':
|
14 |
+
// Symbols in memory 'DM_bankBD':
|
15 |
+
// Symbols in memory 'DM_bankC':
|
16 |
+
// Symbols in memory 'DM_bankCD':
|
17 |
+
// Symbols in memory 'DM_bankD':
|
18 |
+
// Symbols in memory 'DM_stack':
|
19 |
+
// Symbols in memory 'DM_test':
|
20 |
+
// Symbols in memory 'DMb':
|
21 |
+
_symbol _ZN12me_primitive11control_satE 0x0007c460
|
22 |
+
_symbol _ZN12me_primitive11control_rndE 0x0007c464
|
23 |
+
_symbol add1d_params 0x0007c4c0
|
24 |
+
_symbol mul1d_params 0x0007c500
|
25 |
+
_symbol sub1d_params 0x0007c540
|
26 |
+
_symbol sigmoid1d_params 0x0007c580
|
27 |
+
_symbol tanh1d_params 0x0007c5c0
|
28 |
+
_symbol conv2d_params 0x0007c600
|
29 |
+
// Symbols in memory 'DMh':
|
30 |
+
// Symbols in memory 'DMh_bankA':
|
31 |
+
// Symbols in memory 'DMh_bankAB':
|
32 |
+
// Symbols in memory 'DMh_bankAC':
|
33 |
+
// Symbols in memory 'DMh_bankAD':
|
34 |
+
// Symbols in memory 'DMh_bankB':
|
35 |
+
// Symbols in memory 'DMh_bankBC':
|
36 |
+
// Symbols in memory 'DMh_bankBD':
|
37 |
+
// Symbols in memory 'DMh_bankC':
|
38 |
+
// Symbols in memory 'DMh_bankCD':
|
39 |
+
// Symbols in memory 'DMh_bankD':
|
40 |
+
// Symbols in memory 'DMh_stack':
|
41 |
+
// Symbols in memory 'DMs':
|
42 |
+
// Symbols in memory 'DMs_bankA':
|
43 |
+
// Symbols in memory 'DMs_bankAB':
|
44 |
+
// Symbols in memory 'DMs_bankAC':
|
45 |
+
// Symbols in memory 'DMs_bankAD':
|
46 |
+
// Symbols in memory 'DMs_bankB':
|
47 |
+
// Symbols in memory 'DMs_bankBC':
|
48 |
+
// Symbols in memory 'DMs_bankBD':
|
49 |
+
// Symbols in memory 'DMs_bankC':
|
50 |
+
// Symbols in memory 'DMs_bankCD':
|
51 |
+
// Symbols in memory 'DMs_bankD':
|
52 |
+
// Symbols in memory 'DMs_stack':
|
53 |
+
// Symbols in memory 'DMv':
|
54 |
+
// Symbols in memory 'DMv_bankA':
|
55 |
+
// Symbols in memory 'DMv_bankAB':
|
56 |
+
// Symbols in memory 'DMv_bankAC':
|
57 |
+
// Symbols in memory 'DMv_bankAD':
|
58 |
+
// Symbols in memory 'DMv_bankB':
|
59 |
+
// Symbols in memory 'DMv_bankBC':
|
60 |
+
// Symbols in memory 'DMv_bankBD':
|
61 |
+
// Symbols in memory 'DMv_bankC':
|
62 |
+
// Symbols in memory 'DMv_bankCD':
|
63 |
+
// Symbols in memory 'DMv_bankD':
|
64 |
+
// Symbols in memory 'DMv_stack':
|
65 |
+
// Symbols in memory 'DMw':
|
66 |
+
// Symbols in memory 'DMw_bankA':
|
67 |
+
// Symbols in memory 'DMw_bankAB':
|
68 |
+
// Symbols in memory 'DMw_bankAC':
|
69 |
+
// Symbols in memory 'DMw_bankAD':
|
70 |
+
// Symbols in memory 'DMw_bankB':
|
71 |
+
// Symbols in memory 'DMw_bankBC':
|
72 |
+
// Symbols in memory 'DMw_bankBD':
|
73 |
+
// Symbols in memory 'DMw_bankC':
|
74 |
+
// Symbols in memory 'DMw_bankCD':
|
75 |
+
// Symbols in memory 'DMw_bankD':
|
76 |
+
// Symbols in memory 'DMw_stack':
|
77 |
+
// Symbols in memory 'DMx':
|
78 |
+
// Symbols in memory 'DMx_bankA':
|
79 |
+
// Symbols in memory 'DMx_bankAB':
|
80 |
+
// Symbols in memory 'DMx_bankAC':
|
81 |
+
// Symbols in memory 'DMx_bankAD':
|
82 |
+
// Symbols in memory 'DMx_bankB':
|
83 |
+
// Symbols in memory 'DMx_bankBC':
|
84 |
+
// Symbols in memory 'DMx_bankBD':
|
85 |
+
// Symbols in memory 'DMx_bankC':
|
86 |
+
// Symbols in memory 'DMx_bankCD':
|
87 |
+
// Symbols in memory 'DMx_bankD':
|
88 |
+
// Symbols in memory 'DMx_stack':
|
89 |
+
// Symbols in memory 'PM':
|
90 |
+
_symbol _Z13kernelWrapperPPvjjjj 0x00000930
|
91 |
+
_symbol _Z24setup_conv2d_bf16_paramsILb1ELb0EEvPKjR18conv2d_bf16_paramshh 0x00000ac0
|
92 |
+
_symbol _Z21convert_bf16_to_bfp16I8bfloat16Lb0EEvPT_PS0_RK13BfToBfpParams 0x00001060
|
93 |
+
_symbol _Z11conv2d_bf16ILh1EL5act_t0E8bfloat16S1_S1_N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_NS3_IS5_NS6_5asyncES9_SB_EELb0ELb0ELb1ELb0EEvRNS2_9io_bufferIT1_NS2_9direction2inET4_EERNSF_IT2_SI_T5_EERNSF_IT3_NSH_3outET6_EER18conv2d_bf16_params 0x00001170
|
94 |
+
_symbol _Z14conv2d_maxpoolRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEESF_RA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE 0x00001ae0
|
95 |
+
_symbol _ZN17elementwise_unaryI8bfloat1619elementwise_sigmoidIS0_E26sigmoid_templated_params_tIS0_EE5setupER26elementwise_unary_params_tIS4_EPKv 0x00001f40
|
96 |
+
_symbol _ZN17elementwise_unaryI8bfloat1619elementwise_sigmoidIS0_E26sigmoid_templated_params_tIS0_EE3runEPS0_S6_R26elementwise_unary_params_tIS4_E 0x00001f80
|
97 |
+
_symbol _Z21superkernel_sigmoid1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE 0x00002100
|
98 |
+
_symbol _ZN17elementwise_unaryI8bfloat1616elementwise_tanhIS0_E23tanh_templated_params_tIS0_EE5setupER26elementwise_unary_params_tIS4_EPKv 0x000022f0
|
99 |
+
_symbol _ZN17elementwise_unaryI8bfloat1616elementwise_tanhIS0_E23tanh_templated_params_tIS0_EE3runEPS0_S6_R26elementwise_unary_params_tIS4_E 0x00002330
|
100 |
+
_symbol _Z18superkernel_tanh1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE 0x00002700
|
101 |
+
_symbol _ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE21shared_setup_backboneER27elementwise_binary_params_tIS5_EPKv 0x000028f0
|
102 |
+
_symbol _ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE5setupER27elementwise_binary_params_tIS5_EPKv 0x00002970
|
103 |
+
_symbol _ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE3runEPS0_S7_S7_R27elementwise_binary_params_tIS5_E 0x000029e0
|
104 |
+
_symbol _Z17superkernel_add1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERNS0_IS1_NS2_3outESK_EE 0x000029f0
|
105 |
+
_symbol _ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS4_E 0x00002c50
|
106 |
+
_symbol _ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS4_EPKv 0x00002c70
|
107 |
+
_symbol _ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE3runEPS0_S6_S6_R27elementwise_binary_params_tIS4_E 0x00002d00
|
108 |
+
_symbol _Z17superkernel_mul1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERNS0_IS1_NS2_3outESK_EE 0x00002e30
|
109 |
+
_symbol _ZN25elementwise_binary_sharedI8bfloat168sub_implIS0_E15shared_params_tIS0_EL5act_t0EE21shared_setup_backboneER27elementwise_binary_params_tIS4_EPKv 0x00003090
|
110 |
+
_symbol _ZN25elementwise_binary_sharedI8bfloat168sub_implIS0_E15shared_params_tIS0_EL5act_t0EE5setupER27elementwise_binary_params_tIS4_EPKv 0x00003110
|
111 |
+
_symbol _ZN25elementwise_binary_sharedI8bfloat168sub_implIS0_E15shared_params_tIS0_EL5act_t0EE3runEPS0_S7_S7_R27elementwise_binary_params_tIS4_E 0x00003160
|
112 |
+
_symbol _Z17superkernel_sub1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERNS0_IS1_NS2_3outESK_EE 0x00003170
|
113 |
+
_symbol _Z14_b1638_wrapperPPv 0x000033d0
|
114 |
+
_symbol _Z14_b1655_wrapperPPv 0x000033f0
|
115 |
+
_symbol _Z13_b891_wrapperPPv 0x00003420
|
116 |
+
_symbol _Z13_b896_wrapperPPv 0x00003450
|
117 |
+
_symbol _Z14_b1672_wrapperPPv 0x00003480
|
118 |
+
_symbol _Z13_b886_wrapperPPv 0x000034a0
|
119 |
+
// Symbols in memory 'PMw':
|
120 |
+
// Symbols in memory 'TM4':
|
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_2_reloadable21/Release/0_2_reloadable21.srv
ADDED
The diff for this file is too large to render.
See raw diff
|
|
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_2_reloadable21/Release/0_2_reloadable21.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_2_reloadable21/scripts/0_2_reloadable21.bcf
ADDED
@@ -0,0 +1,16 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
_reserved DMb 0x0 0x40000
|
2 |
+
|
3 |
+
_reserved PM 0x0 0x930 //reserved for main elf
|
4 |
+
|
5 |
+
_entry_point _Z13kernelWrapperPPvjjjj
|
6 |
+
_symbol _Z13kernelWrapperPPvjjjj 0x930
|
7 |
+
|
8 |
+
_reserved DMb 0x7b280 0x800 //reserved for lcp ping-pong buffers
|
9 |
+
_reserved DMb 0x7ba80 0x40 //reserved for sync buffer
|
10 |
+
_stack DM_stack 0x7bac0 0x940 //stack for core
|
11 |
+
_reserved DMb 0x7c400 0x40 //reserved for main elf heap
|
12 |
+
//space for synopsys compiler at 0x7c440 0x880//heap
|
13 |
+
_reserved DMb 0x40000 0x3b280
|
14 |
+
|
15 |
+
_reserved DMb 0x7ccc0 0x3340
|
16 |
+
_reserved DMb 0x80000 0x80000 // And everything else the core can't see
|
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_2_reloadable21/scripts/0_2_reloadable21.prx
ADDED
@@ -0,0 +1,13 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
<project name="Project" processor="me">
|
2 |
+
<issinit/>
|
3 |
+
<option id="cpp.define" value="__AIENGINE__ __AIE_ARCH__=21" inherit = "1"/>
|
4 |
+
<option id="llvm.xargs" value="-fno-jump-tables -fno-discard-value-names" inherit = "1"/>
|
5 |
+
<option id="llvm.lang" value="Follow file extension"/>
|
6 |
+
<option id="bridge.cfg" value="0_2_reloadable21.bcf"/>
|
7 |
+
<option id="bridge.alibs" value=" ../Release/0_2_reloadable21.o" inherit="1" cfg="Release_LLVM"/>
|
8 |
+
<option id="cpp.include" value="<XILINX_VITIS_AIETOOLS>/include /app/vaiml_1.3_examples/camo/./segmentation_1_4_0_fp32_combined/vaiml_par_0/0/backend /usr/local/lib/python3.10/site-packages/include/aie_api /usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/common /usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/include/common /usr/local/lib/python3.10/dist-packages/vitis_mllib /usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/misc /usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/src/ml_adf /app/vaiml_1.3_examples/camo/segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/<AIE_SRC_DIR> " inherit="1"/>
|
9 |
+
<option id="project.dir" value="<CONFIG>/0_2_reloadable21"/>
|
10 |
+
<option id="project.name" value="0_2_reloadable21"/>
|
11 |
+
<option id="project.type" value="exe"/>
|
12 |
+
<option id="simrun.issca" value="<XILINX_VITIS_AIETOOLS>/bin/unwrapped/lnx64.o/aie2p/ca_udm_dbg" inherit="0"/>
|
13 |
+
</project>
|
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_2_reloadable21/src/0_2_reloadable21.cc
ADDED
@@ -0,0 +1,99 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
// Automatically generated processor driver using AIEngine tool-chain
|
2 |
+
|
3 |
+
#include <stdio.h>
|
4 |
+
#include <memory>
|
5 |
+
#include <adf.h>
|
6 |
+
|
7 |
+
|
8 |
+
// Declare Kernel functions and initializers
|
9 |
+
void superkernel_sigmoid1d(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict,const unsigned int (&)[16],adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict);
|
10 |
+
void superkernel_sub1d(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict,const unsigned int (&)[16],adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict,adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict);
|
11 |
+
void superkernel_mul1d(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict,const unsigned int (&)[16],adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict,adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict);
|
12 |
+
void conv2d_maxpool(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict,adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict,const unsigned int (&)[16],adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict);
|
13 |
+
void superkernel_tanh1d(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict,const unsigned int (&)[16],adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict);
|
14 |
+
void superkernel_add1d(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict,const unsigned int (&)[16],adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict,adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict);
|
15 |
+
|
16 |
+
// Declare Kernel objects and external arrays
|
17 |
+
|
18 |
+
|
19 |
+
void _b1638_wrapper(void* args[])
|
20 |
+
{
|
21 |
+
superkernel_sigmoid1d(
|
22 |
+
*reinterpret_cast<adf::input_buffer_conf<bfloat16, adf::bpc_sync_0d>*>(args[0]),
|
23 |
+
*reinterpret_cast<uint32 const(*)[16]>(args[2]),
|
24 |
+
*reinterpret_cast<adf::output_buffer_conf<bfloat16, adf::bpc_async_0d>*>(args[1]));
|
25 |
+
}
|
26 |
+
|
27 |
+
void _b1655_wrapper(void* args[])
|
28 |
+
{
|
29 |
+
superkernel_sub1d(
|
30 |
+
*reinterpret_cast<adf::input_buffer_conf<bfloat16, adf::bpc_sync_0d>*>(args[0]),
|
31 |
+
*reinterpret_cast<uint32 const(*)[16]>(args[3]),
|
32 |
+
*reinterpret_cast<adf::input_buffer_conf<bfloat16, adf::bpc_async_0d>*>(args[1]),
|
33 |
+
*reinterpret_cast<adf::output_buffer_conf<bfloat16, adf::bpc_async_0d>*>(args[2]));
|
34 |
+
}
|
35 |
+
|
36 |
+
void _b891_wrapper(void* args[])
|
37 |
+
{
|
38 |
+
superkernel_mul1d(
|
39 |
+
*reinterpret_cast<adf::input_buffer_conf<bfloat16, adf::bpc_sync_0d>*>(args[0]),
|
40 |
+
*reinterpret_cast<uint32 const(*)[16]>(args[3]),
|
41 |
+
*reinterpret_cast<adf::input_buffer_conf<bfloat16, adf::bpc_async_0d>*>(args[1]),
|
42 |
+
*reinterpret_cast<adf::output_buffer_conf<bfloat16, adf::bpc_async_0d>*>(args[2]));
|
43 |
+
}
|
44 |
+
|
45 |
+
void _b896_wrapper(void* args[])
|
46 |
+
{
|
47 |
+
conv2d_maxpool(
|
48 |
+
*reinterpret_cast<adf::input_buffer_conf<bfloat16, adf::bpc_sync_0d>*>(args[0]),
|
49 |
+
*reinterpret_cast<adf::input_buffer_conf<bfloat16, adf::bpc_sync_0d>*>(args[1]),
|
50 |
+
*reinterpret_cast<uint32 const(*)[16]>(args[3]),
|
51 |
+
*reinterpret_cast<adf::output_buffer_conf<bfloat16, adf::bpc_async_0d>*>(args[2]));
|
52 |
+
}
|
53 |
+
|
54 |
+
void _b1672_wrapper(void* args[])
|
55 |
+
{
|
56 |
+
superkernel_tanh1d(
|
57 |
+
*reinterpret_cast<adf::input_buffer_conf<bfloat16, adf::bpc_sync_0d>*>(args[0]),
|
58 |
+
*reinterpret_cast<uint32 const(*)[16]>(args[2]),
|
59 |
+
*reinterpret_cast<adf::output_buffer_conf<bfloat16, adf::bpc_async_0d>*>(args[1]));
|
60 |
+
}
|
61 |
+
|
62 |
+
void _b886_wrapper(void* args[])
|
63 |
+
{
|
64 |
+
superkernel_add1d(
|
65 |
+
*reinterpret_cast<adf::input_buffer_conf<bfloat16, adf::bpc_sync_0d>*>(args[0]),
|
66 |
+
*reinterpret_cast<uint32 const(*)[16]>(args[3]),
|
67 |
+
*reinterpret_cast<adf::input_buffer_conf<bfloat16, adf::bpc_async_0d>*>(args[1]),
|
68 |
+
*reinterpret_cast<adf::output_buffer_conf<bfloat16, adf::bpc_async_0d>*>(args[2]));
|
69 |
+
}
|
70 |
+
|
71 |
+
using UniformKernelFunc = void (*)(void **);
|
72 |
+
|
73 |
+
static UniformKernelFunc g_uniformKernelFuncs[6] = {
|
74 |
+
_b1638_wrapper,
|
75 |
+
_b1655_wrapper,
|
76 |
+
_b891_wrapper,
|
77 |
+
_b896_wrapper,
|
78 |
+
_b1672_wrapper,
|
79 |
+
_b886_wrapper
|
80 |
+
};
|
81 |
+
|
82 |
+
__attribute__((always_inline)) void kernelWrapper(void* args[], uint32 kernelId, uint32 numSyncIn, uint32 numAsyncIn, uint32 numSyncOut)
|
83 |
+
{
|
84 |
+
uint32 idx = 0;
|
85 |
+
reinterpret_cast<adf::_io_buffer_light_weight_generic*>(args[idx])->acquire<adf::direction::in>(numSyncIn > 0);
|
86 |
+
idx += (numSyncIn > 0) ? 1 : 0;
|
87 |
+
reinterpret_cast<adf::_io_buffer_light_weight_generic*>(args[idx])->acquire<adf::direction::in>(numSyncIn > 1);
|
88 |
+
idx += (numSyncIn > 1) ? 1 : 0;
|
89 |
+
idx += numAsyncIn;
|
90 |
+
|
91 |
+
(*(g_uniformKernelFuncs[kernelId]))(args);
|
92 |
+
|
93 |
+
idx = 0;
|
94 |
+
reinterpret_cast<adf::_io_buffer_light_weight_generic*>(args[idx])->release<adf::direction::in>(numSyncIn > 0);
|
95 |
+
idx += (numSyncIn > 0) ? 1 : 0;
|
96 |
+
reinterpret_cast<adf::_io_buffer_light_weight_generic*>(args[idx])->release<adf::direction::in>(numSyncIn > 1);
|
97 |
+
idx += (numSyncIn > 1) ? 1 : 0;
|
98 |
+
idx += numAsyncIn;
|
99 |
+
}
|
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_2_reloadable22/Release/0_2_reloadable22.calltree
ADDED
@@ -0,0 +1,56 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
|
2 |
+
// File generated by bridge version V-2024.06#84922c0d9f#241219, Fri Mar 21 04:00:39 2025
|
3 |
+
// Copyright 2014-2024 Synopsys, Inc. All rights reserved.
|
4 |
+
// bridge -o../Release/0_0_reloadable22 ../Release/0_0_reloadable22.o -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/isg -g -I/usr/local/lib/python3.10/dist-packages/include -I/app/vaiml_1.3_examples/camo/./segmentation_1_4_0_fp32_combined/vaiml_par_0/0/backend -I/usr/local/lib/python3.10/site-packages/include/aie_api -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/common -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/include/common -I/usr/local/lib/python3.10/dist-packages/vitis_mllib -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/misc -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/src/ml_adf -I/app/vaiml_1.3_examples/camo/segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/. -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libcxx-lite/include -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libs/libcxx-9.0.0/include-lite -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime/include -D__AIENGINE__ -D__AIE_ARCH__=21 -DDEPLOYMENT_ELF=1 -D__LOCK_FENCE_MODE__=0 -D__IO_BUFFER_FORCE_LIGHT_WEIGHT__ -DAIE_API_EMULATE_BFLOAT16_MMUL_WITH_BFP16=1 -DAIE_OPTION_SCALAR_FLOAT_ON_VECTOR -D__tct_tgt__=241219 -c0_0_reloadable22.bcf -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/softfloat/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libcxx-lite/lib/Release_LLVM -lme -lc -lm -lc++lite -lsoftfloat -S -export-locals -iconfig extra_memories.bcf -yTM -m -fC -fS -fH +m -T +work ../Release/chesswork6223 -pme
|
5 |
+
|
6 |
+
|
7 |
+
// Release: ipp V-2024.06-TGT-241219
|
8 |
+
|
9 |
+
_Z13kernelWrapperPPvjjjj
|
10 |
+
_Z13_b787_wrapperPPv (referenced text)
|
11 |
+
_ZN12mllib_graphs18resize_adf_wrapperI8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_Li1ELi0ELi0EEEvRNS2_9io_bufferIT_NS2_9direction2inET0_EERNSD_ISE_NSF_3outET1_EERA16_Kj
|
12 |
+
_Z15resize_bilinearI8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_aS0_EEvPS1_S2_R29resize_common_internal_params
|
13 |
+
int32_to_float32
|
14 |
+
_ZL28normalizeRoundAndPackFloat32iij
|
15 |
+
_ZL19roundAndPackFloat32iij
|
16 |
+
_ZN12me_primitive10udiv_dstepEjjRjS0_
|
17 |
+
_Z13_b896_wrapperPPv (referenced text)
|
18 |
+
_Z14conv2d_maxpoolRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEESF_RA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE
|
19 |
+
_Z24setup_conv2d_bf16_paramsILb1ELb0EEvPKjR18conv2d_bf16_paramshh
|
20 |
+
_Z11conv2d_bf16ILh1EL5act_t0E8bfloat16S1_S1_N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_NS3_IS5_NS6_5asyncES9_SB_EELb0ELb0ELb1ELb0EEvRNS2_9io_bufferIT1_NS2_9direction2inET4_EERNSF_IT2_SI_T5_EERNSF_IT3_NSH_3outET6_EER18conv2d_bf16_params
|
21 |
+
_Z21convert_bf16_to_bfp16I8bfloat16Lb0EEvPT_PS0_RK13BfToBfpParams
|
22 |
+
_Z13_b806_wrapperPPv (referenced text)
|
23 |
+
_ZN12mllib_graphs17slice_adf_wrapperILi1E8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_EEvRNS2_9io_bufferIT0_NS2_9direction2inET1_EERNSD_ISE_NSF_3outET2_EERA7_Kj
|
24 |
+
_Z11slice_hcwc8I8bfloat16EvPT_S2_R18slice_hcwc8_params
|
25 |
+
_Z13_b820_wrapperPPv (referenced text)
|
26 |
+
_ZN12mllib_graphs18concat_adf_wrapperI8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_SC_EEvRNS2_9io_bufferIT_NS2_9direction2inET0_EERNSD_ISE_SG_T1_EERNSD_ISE_NSF_3outET2_EERA8_Kj
|
27 |
+
|
28 |
+
|
29 |
+
Call tree stack and functions sizes:
|
30 |
+
|
31 |
+
stack stack stack call func func function name
|
32 |
+
desc level level desc
|
33 |
+
----- ----- ----- ----- ----- ----- --------------------------------------------------------------
|
34 |
+
64 1920 0 0 546 13462 _Z13kernelWrapperPPvjjjj
|
35 |
+
0 1856 1 1 32 5860 _Z13_b787_wrapperPPv
|
36 |
+
64 1856 1 2 1374 5828 _ZN12mllib_graphs18resize_adf_wrapperI8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_Li1ELi0ELi0EEEvRNS2_9io_bufferIT_NS2_9direction2inET0_EERNSD_ISE_NSF_3outET1_EERA16_Kj <tail call>
|
37 |
+
1792 1792 2 3 3782 4312 _Z15resize_bilinearI8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_aS0_EEvPS1_S2_R29resize_common_internal_params
|
38 |
+
0 0 3 4 114 530 int32_to_float32
|
39 |
+
0 0 3 5 24 416 _ZL28normalizeRoundAndPackFloat32iij <tail call>
|
40 |
+
0 0 3 6 392 392 _ZL19roundAndPackFloat32iij <tail call>
|
41 |
+
0 0 2 3 142 142 _ZN12me_primitive10udiv_dstepEjjRjS0_
|
42 |
+
0 192 1 1 36 4714 _Z13_b896_wrapperPPv
|
43 |
+
64 192 1 2 568 4678 _Z14conv2d_maxpoolRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEESF_RA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE <tail call>
|
44 |
+
64 64 2 3 1430 1430 _Z24setup_conv2d_bf16_paramsILb1ELb0EEvPKjR18conv2d_bf16_paramshh
|
45 |
+
128 128 2 3 2410 2680 _Z11conv2d_bf16ILh1EL5act_t0E8bfloat16S1_S1_N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_NS3_IS5_NS6_5asyncES9_SB_EELb0ELb0ELb1ELb0EEvRNS2_9io_bufferIT1_NS2_9direction2inET4_EERNSF_IT2_SI_T5_EERNSF_IT3_NSH_3outET6_EER18conv2d_bf16_params
|
46 |
+
0 0 3 4 270 270 _Z21convert_bf16_to_bfp16I8bfloat16Lb0EEvPT_PS0_RK13BfToBfpParams
|
47 |
+
0 192 1 1 32 1488 _Z13_b806_wrapperPPv
|
48 |
+
192 192 1 2 674 1456 _ZN12mllib_graphs17slice_adf_wrapperILi1E8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_EEvRNS2_9io_bufferIT0_NS2_9direction2inET1_EERNSD_ISE_NSF_3outET2_EERA7_Kj <tail call>
|
49 |
+
0 0 2 3 782 782 _Z11slice_hcwc8I8bfloat16EvPT_S2_R18slice_hcwc8_params
|
50 |
+
0 0 1 1 36 854 _Z13_b820_wrapperPPv
|
51 |
+
0 0 1 2 818 818 _ZN12mllib_graphs18concat_adf_wrapperI8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_SC_EEvRNS2_9io_bufferIT_NS2_9direction2inET0_EERNSD_ISE_SG_T1_EERNSD_ISE_NSF_3outET2_EERA8_Kj <tail call>
|
52 |
+
|
53 |
+
|
54 |
+
Maximum call level : 6
|
55 |
+
Maximum stack level: 3
|
56 |
+
Maximum stack size : 1920
|
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_2_reloadable22/Release/0_2_reloadable22.cmic2
ADDED
The diff for this file is too large to render.
See raw diff
|
|
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_2_reloadable22/Release/0_2_reloadable22.cmico
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
+Mdec
|
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_2_reloadable22/Release/0_2_reloadable22.lst
ADDED
The diff for this file is too large to render.
See raw diff
|
|
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_2_reloadable22/Release/0_2_reloadable22.map
ADDED
@@ -0,0 +1,202 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
|
2 |
+
// File generated by bridge version V-2024.06#84922c0d9f#241219, Fri Mar 21 04:00:41 2025
|
3 |
+
// Copyright 2014-2024 Synopsys, Inc. All rights reserved.
|
4 |
+
// bridge -o../Release/0_0_reloadable22 ../Release/0_0_reloadable22.o -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/isg -g -I/usr/local/lib/python3.10/dist-packages/include -I/app/vaiml_1.3_examples/camo/./segmentation_1_4_0_fp32_combined/vaiml_par_0/0/backend -I/usr/local/lib/python3.10/site-packages/include/aie_api -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/common -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/include/common -I/usr/local/lib/python3.10/dist-packages/vitis_mllib -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/misc -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/src/ml_adf -I/app/vaiml_1.3_examples/camo/segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/. -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libcxx-lite/include -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libs/libcxx-9.0.0/include-lite -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime/include -D__AIENGINE__ -D__AIE_ARCH__=21 -DDEPLOYMENT_ELF=1 -D__LOCK_FENCE_MODE__=0 -D__IO_BUFFER_FORCE_LIGHT_WEIGHT__ -DAIE_API_EMULATE_BFLOAT16_MMUL_WITH_BFP16=1 -DAIE_OPTION_SCALAR_FLOAT_ON_VECTOR -D__tct_tgt__=241219 -c0_0_reloadable22.bcf -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/softfloat/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libcxx-lite/lib/Release_LLVM -lme -lc -lm -lc++lite -lsoftfloat -S -export-locals -iconfig extra_memories.bcf -yTM -m -fC -fS -fH +m -T +work ../Release/chesswork6223 -pme
|
5 |
+
|
6 |
+
// Release: ipp V-2024.06-TGT-241219
|
7 |
+
|
8 |
+
Memory map for memory 'DM_stack':
|
9 |
+
|
10 |
+
Size = 1048576
|
11 |
+
Width = 8 bits
|
12 |
+
Offset = 0
|
13 |
+
Used = 2368
|
14 |
+
|
15 |
+
0x0007bac0..0x0007c3ff ( 2368 items) : Stack
|
16 |
+
|
17 |
+
Memory map for memory 'DMb':
|
18 |
+
|
19 |
+
Size = 1048576
|
20 |
+
Width = 8 bits
|
21 |
+
Offset = 0
|
22 |
+
Used = 3005
|
23 |
+
|
24 |
+
0x00000000..0x0007babf ( 506560 items) : Reserved
|
25 |
+
0x0007bac0..0x0007c3ff ( 2368 items) : Stack
|
26 |
+
0x0007c400..0x0007c43f ( 64 items) : Reserved
|
27 |
+
0x0007c440..0x0007c443 ( 4 items) : ../Release/0_0_reloadable22.o::_ZL9curr_iter (Data, Local, .bss.DMb.4)
|
28 |
+
0x0007c444..0x0007c447 ( 4 items) : ../Release/0_0_reloadable22.o::_ZL14num_depth_iter (Data, Local, .bss.DMb.4)
|
29 |
+
0x0007c448..0x0007c44b ( 4 items) : ../Release/0_0_reloadable22.o::_ZL10depth_iter (Data, Local, .bss.DMb.4)
|
30 |
+
0x0007c44c..0x0007c44f ( 4 items) : ../Release/0_0_reloadable22.o::_ZL11total_iters (Data, Local, .bss.DMb.4)
|
31 |
+
0x0007c450..0x0007c453 ( 4 items) : ../Release/0_0_reloadable22.o::_ZN9ns_concatL11kernel_iterE (Data, Local, .bss.DMb.4)
|
32 |
+
0x0007c454..0x0007c457 ( 4 items) : ../Release/0_0_reloadable22.o::_ZN9ns_concatL8core_colE (Data, Local, .bss.DMb.4)
|
33 |
+
0x0007c458..0x0007c45b ( 4 items) : ../Release/0_0_reloadable22.o::_ZN9ns_concatL8core_rowE (Data, Local, .bss.DMb.4)
|
34 |
+
0x0007c45c..0x0007c45f ( 4 items) : ../Release/0_0_reloadable22.o::_ZZN12mllib_graphs18resize_adf_wrapperI8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_Li1ELi0ELi0EEEvRNS2_9io_bufferIT_NS2_9direction2inET0_EERNSD_ISE_NSF_3outET1_EERA16_KjE8cur_iter (Data, Weak, .bss.DMb.4)
|
35 |
+
0x0007c460..0x0007c463 ( 4 items) : ../Release/0_0_reloadable22.o::_ZL8num_iter (Data, Local, .data.DMb.4)
|
36 |
+
0x0007c464..0x0007c467 ( 4 items) : me_defs.o(/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/Release/libme.a)::_ZN12me_primitive11control_satE (Data, Global, .bss.DMb.4)
|
37 |
+
0x0007c468..0x0007c468 ( 1 items) : me_defs.o(/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/Release/libme.a)::_ZN12me_primitive11control_rndE (Data, Global, .bss.DMb.1)
|
38 |
+
0x0007c46c..0x0007c46f ( 4 items) : softfloat.o(/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/softfloat/lib/Release/libsoftfloat.a)::float_rounding_mode (Data, Global, .bss.DMb.4)
|
39 |
+
0x0007c480..0x0007c48f ( 16 items) : ../Release/0_0_reloadable22.o::_ZL20g_uniformKernelFuncs (Data, Local, .rodata.DMb.64)
|
40 |
+
|
41 |
+
Called functions : _Z13_b787_wrapperPPv
|
42 |
+
_Z13_b896_wrapperPPv
|
43 |
+
_Z13_b806_wrapperPPv
|
44 |
+
_Z13_b820_wrapperPPv
|
45 |
+
|
46 |
+
0x0007c4c0..0x0007c67f ( 448 items) : ../Release/0_0_reloadable22.o::conv2d_params (Data, Global, .bss.DMb.64)
|
47 |
+
0x0007c680..0x0007c6ff ( 128 items) : ../Release/0_0_reloadable22.o::_ZZN12mllib_graphs18resize_adf_wrapperI8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_Li1ELi0ELi0EEEvRNS2_9io_bufferIT_NS2_9direction2inET0_EERNSD_ISE_NSF_3outET1_EERA16_KjE6params (Data, Weak, .bss.DMb.64)
|
48 |
+
0x0007ccc0..0x000fffff ( 537408 items) : Reserved
|
49 |
+
|
50 |
+
Memory map for memory 'PM':
|
51 |
+
|
52 |
+
Size = 1048576
|
53 |
+
Width = 8 bits
|
54 |
+
Offset = 0
|
55 |
+
Used = 13462
|
56 |
+
|
57 |
+
0x00000000..0x0000092f ( 2352 items) : Reserved
|
58 |
+
0x00000930..0x00000b51 ( 546 items) : ../Release/0_0_reloadable22.o::_Z13kernelWrapperPPvjjjj (Function, Global, .text) (stack frame size = 64)
|
59 |
+
|
60 |
+
Referenced symbols: _ZL20g_uniformKernelFuncs
|
61 |
+
|
62 |
+
0x00000b60..0x000010f5 ( 1430 items) : ../Release/0_0_reloadable22.o::_Z24setup_conv2d_bf16_paramsILb1ELb0EEvPKjR18conv2d_bf16_paramshh (Function, Weak, .text) (stack frame size = 64)
|
63 |
+
0x00001100..0x0000120d ( 270 items) : ../Release/0_0_reloadable22.o::_Z21convert_bf16_to_bfp16I8bfloat16Lb0EEvPT_PS0_RK13BfToBfpParams (Function, Weak, .text) (stack frame size = 0)
|
64 |
+
|
65 |
+
Referenced symbols: _ZN12me_primitive11control_rndE
|
66 |
+
|
67 |
+
0x00001210..0x00001b79 ( 2410 items) : ../Release/0_0_reloadable22.o::_Z11conv2d_bf16ILh1EL5act_t0E8bfloat16S1_S1_N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_NS3_IS5_NS6_5asyncES9_SB_EELb0ELb0ELb1ELb0EEvRNS2_9io_bufferIT1_NS2_9direction2inET4_EERNSF_IT2_SI_T5_EERNSF_IT3_NSH_3outET6_EER18conv2d_bf16_params (Function, Weak, .text) (stack frame size = 128)
|
68 |
+
|
69 |
+
Called functions : _Z21convert_bf16_to_bfp16I8bfloat16Lb0EEvPT_PS0_RK13BfToBfpParams
|
70 |
+
|
71 |
+
Referenced symbols: _ZN12me_primitive11control_rndE
|
72 |
+
|
73 |
+
0x00001b80..0x00001db7 ( 568 items) : ../Release/0_0_reloadable22.o::_Z14conv2d_maxpoolRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEESF_RA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE (Function, Global, .text) (stack frame size = 64)
|
74 |
+
|
75 |
+
Called functions : _Z24setup_conv2d_bf16_paramsILb1ELb0EEvPKjR18conv2d_bf16_paramshh
|
76 |
+
_Z11conv2d_bf16ILh1EL5act_t0E8bfloat16S1_S1_N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_NS3_IS5_NS6_5asyncES9_SB_EELb0ELb0ELb1ELb0EEvRNS2_9io_bufferIT1_NS2_9direction2inET4_EERNSF_IT2_SI_T5_EERNSF_IT3_NSH_3outET6_EER18conv2d_bf16_params
|
77 |
+
|
78 |
+
Referenced symbols: _ZL9curr_iter
|
79 |
+
conv2d_params
|
80 |
+
_ZN12me_primitive11control_rndE
|
81 |
+
_ZN12me_primitive11control_satE
|
82 |
+
_ZL14num_depth_iter
|
83 |
+
_ZL8num_iter
|
84 |
+
_ZL10depth_iter
|
85 |
+
_ZL11total_iters
|
86 |
+
|
87 |
+
0x00001dc0..0x00002c85 ( 3782 items) : ../Release/0_0_reloadable22.o::_Z15resize_bilinearI8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_aS0_EEvPS1_S2_R29resize_common_internal_params (Function, Weak, .text) (stack frame size = 1792)
|
88 |
+
|
89 |
+
Called functions : int32_to_float32
|
90 |
+
|
91 |
+
Referenced symbols: _ZN12me_primitive11control_satE
|
92 |
+
_ZN12me_primitive11control_rndE
|
93 |
+
|
94 |
+
0x00002c90..0x000031ed ( 1374 items) : ../Release/0_0_reloadable22.o::_ZN12mllib_graphs18resize_adf_wrapperI8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_Li1ELi0ELi0EEEvRNS2_9io_bufferIT_NS2_9direction2inET0_EERNSD_ISE_NSF_3outET1_EERA16_Kj (Function, Weak, .text) (stack frame size = 64)
|
95 |
+
|
96 |
+
Called functions : _ZN12me_primitive10udiv_dstepEjjRjS0_
|
97 |
+
_Z15resize_bilinearI8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_aS0_EEvPS1_S2_R29resize_common_internal_params
|
98 |
+
|
99 |
+
Referenced symbols: _ZZN12mllib_graphs18resize_adf_wrapperI8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_Li1ELi0ELi0EEEvRNS2_9io_bufferIT_NS2_9direction2inET0_EERNSD_ISE_NSF_3outET1_EERA16_KjE8cur_iter
|
100 |
+
_ZN12me_primitive11control_satE
|
101 |
+
_ZN12me_primitive11control_rndE
|
102 |
+
_ZZN12mllib_graphs18resize_adf_wrapperI8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_Li1ELi0ELi0EEEvRNS2_9io_bufferIT_NS2_9direction2inET0_EERNSD_ISE_NSF_3outET1_EERA16_KjE6params
|
103 |
+
|
104 |
+
0x000031f0..0x0000320f ( 32 items) : ../Release/0_0_reloadable22.o::_Z13_b787_wrapperPPv (Function, Global, .text) (stack frame size = 0)
|
105 |
+
|
106 |
+
Called functions : _ZN12mllib_graphs18resize_adf_wrapperI8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_Li1ELi0ELi0EEEvRNS2_9io_bufferIT_NS2_9direction2inET0_EERNSD_ISE_NSF_3outET1_EERA16_Kj
|
107 |
+
|
108 |
+
0x00003210..0x00003233 ( 36 items) : ../Release/0_0_reloadable22.o::_Z13_b896_wrapperPPv (Function, Global, .text) (stack frame size = 0)
|
109 |
+
|
110 |
+
Called functions : _Z14conv2d_maxpoolRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEESF_RA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE
|
111 |
+
|
112 |
+
0x00003240..0x0000354d ( 782 items) : ../Release/0_0_reloadable22.o::_Z11slice_hcwc8I8bfloat16EvPT_S2_R18slice_hcwc8_params (Function, Weak, .text) (stack frame size = 0)
|
113 |
+
0x00003550..0x000037f1 ( 674 items) : ../Release/0_0_reloadable22.o::_ZN12mllib_graphs17slice_adf_wrapperILi1E8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_EEvRNS2_9io_bufferIT0_NS2_9direction2inET1_EERNSD_ISE_NSF_3outET2_EERA7_Kj (Function, Weak, .text) (stack frame size = 192)
|
114 |
+
|
115 |
+
Called functions : _Z11slice_hcwc8I8bfloat16EvPT_S2_R18slice_hcwc8_params
|
116 |
+
|
117 |
+
0x00003800..0x0000381f ( 32 items) : ../Release/0_0_reloadable22.o::_Z13_b806_wrapperPPv (Function, Global, .text) (stack frame size = 0)
|
118 |
+
|
119 |
+
Called functions : _ZN12mllib_graphs17slice_adf_wrapperILi1E8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_EEvRNS2_9io_bufferIT0_NS2_9direction2inET1_EERNSD_ISE_NSF_3outET2_EERA7_Kj
|
120 |
+
|
121 |
+
0x00003820..0x00003b51 ( 818 items) : ../Release/0_0_reloadable22.o::_ZN12mllib_graphs18concat_adf_wrapperI8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_SC_EEvRNS2_9io_bufferIT_NS2_9direction2inET0_EERNSD_ISE_SG_T1_EERNSD_ISE_NSF_3outET2_EERA8_Kj (Function, Weak, .text) (stack frame size = 0)
|
122 |
+
|
123 |
+
Referenced symbols: _ZN9ns_concatL11kernel_iterE
|
124 |
+
_ZN12me_primitive11control_rndE
|
125 |
+
_ZN9ns_concatL8core_rowE
|
126 |
+
_ZN12me_primitive11control_satE
|
127 |
+
_ZN9ns_concatL8core_colE
|
128 |
+
|
129 |
+
0x00003b60..0x00003b83 ( 36 items) : ../Release/0_0_reloadable22.o::_Z13_b820_wrapperPPv (Function, Global, .text) (stack frame size = 0)
|
130 |
+
|
131 |
+
Called functions : _ZN12mllib_graphs18concat_adf_wrapperI8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_SC_EEvRNS2_9io_bufferIT_NS2_9direction2inET0_EERNSD_ISE_SG_T1_EERNSD_ISE_NSF_3outET2_EERA8_Kj
|
132 |
+
|
133 |
+
0x00003b90..0x00003c1d ( 142 items) : me_div.o(/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/Release/libme.a)::_ZN12me_primitive10udiv_dstepEjjRjS0_ (Function, Global, .text) (stack frame size = 0)
|
134 |
+
0x00003c20..0x00003da7 ( 392 items) : softfloat.o(/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/softfloat/lib/Release/libsoftfloat.a)::_ZL19roundAndPackFloat32iij (Function, Local, .text) (stack frame size = 0)
|
135 |
+
|
136 |
+
Referenced symbols: float_rounding_mode
|
137 |
+
|
138 |
+
0x00003db0..0x00003dc7 ( 24 items) : softfloat.o(/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/softfloat/lib/Release/libsoftfloat.a)::_ZL28normalizeRoundAndPackFloat32iij (Function, Local, .text) (stack frame size = 0)
|
139 |
+
|
140 |
+
Called functions : _ZL19roundAndPackFloat32iij
|
141 |
+
|
142 |
+
0x00003dd0..0x00003e41 ( 114 items) : softfloat.o(/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/softfloat/lib/Release/libsoftfloat.a)::int32_to_float32 (Function, Global, .text) (stack frame size = 0)
|
143 |
+
|
144 |
+
Called functions : _ZL28normalizeRoundAndPackFloat32iij
|
145 |
+
|
146 |
+
|
147 |
+
External symbols:
|
148 |
+
|
149 |
+
__dso_handle = 0x0
|
150 |
+
_ctors_end = 0x0
|
151 |
+
_ctors_start = 0x0
|
152 |
+
_dtors_end = 0x0
|
153 |
+
_dtors_start = 0x0
|
154 |
+
_pc_end = 0x3e42
|
155 |
+
_pc_start = 0x930
|
156 |
+
_sp_end_DM_stack = 0x7c400
|
157 |
+
_sp_start_DM_stack = 0x7bac0
|
158 |
+
|
159 |
+
Section summary for memory 'DM_stack':
|
160 |
+
|
161 |
+
.stack File
|
162 |
+
---------- ----------
|
163 |
+
2368
|
164 |
+
---------- ----------
|
165 |
+
2368 Total
|
166 |
+
|
167 |
+
Section summary for memory 'DMb':
|
168 |
+
|
169 |
+
.bss .data .rodata File
|
170 |
+
---------- ---------- ---------- ----------
|
171 |
+
608 4 16 ../Release/0_0_reloadable22.o
|
172 |
+
4 0 0 softfloat.o(/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/softfloat/lib/Release/libsoftfloat.a)
|
173 |
+
5 0 0 me_defs.o(/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/Release/libme.a)
|
174 |
+
---------- ---------- ---------- ----------
|
175 |
+
617 4 16 Total
|
176 |
+
|
177 |
+
Section summary for memory 'PM':
|
178 |
+
|
179 |
+
.text File
|
180 |
+
---------- ----------
|
181 |
+
12790 ../Release/0_0_reloadable22.o
|
182 |
+
530 softfloat.o(/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/softfloat/lib/Release/libsoftfloat.a)
|
183 |
+
142 me_div.o(/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/Release/libme.a)
|
184 |
+
---------- ----------
|
185 |
+
13462 Total
|
186 |
+
|
187 |
+
File summary:
|
188 |
+
|
189 |
+
../Release/0_0_reloadable22.o
|
190 |
+
DMb 628
|
191 |
+
PM 12790
|
192 |
+
|
193 |
+
me_defs.o(/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/Release/libme.a)
|
194 |
+
DMb 5
|
195 |
+
|
196 |
+
softfloat.o(/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/softfloat/lib/Release/libsoftfloat.a)
|
197 |
+
DMb 4
|
198 |
+
PM 530
|
199 |
+
|
200 |
+
me_div.o(/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/Release/libme.a)
|
201 |
+
PM 142
|
202 |
+
|
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_2_reloadable22/Release/0_2_reloadable22.sdr
ADDED
@@ -0,0 +1,105 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
|
2 |
+
// File generated by bridge version V-2024.06#84922c0d9f#241219, Fri Mar 21 04:00:41 2025
|
3 |
+
// Copyright 2014-2024 Synopsys, Inc. All rights reserved.
|
4 |
+
// bridge -o../Release/0_0_reloadable22 ../Release/0_0_reloadable22.o -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/isg -g -I/usr/local/lib/python3.10/dist-packages/include -I/app/vaiml_1.3_examples/camo/./segmentation_1_4_0_fp32_combined/vaiml_par_0/0/backend -I/usr/local/lib/python3.10/site-packages/include/aie_api -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/common -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/include/common -I/usr/local/lib/python3.10/dist-packages/vitis_mllib -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/misc -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/src/ml_adf -I/app/vaiml_1.3_examples/camo/segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/. -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libcxx-lite/include -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libs/libcxx-9.0.0/include-lite -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime/include -D__AIENGINE__ -D__AIE_ARCH__=21 -DDEPLOYMENT_ELF=1 -D__LOCK_FENCE_MODE__=0 -D__IO_BUFFER_FORCE_LIGHT_WEIGHT__ -DAIE_API_EMULATE_BFLOAT16_MMUL_WITH_BFP16=1 -DAIE_OPTION_SCALAR_FLOAT_ON_VECTOR -D__tct_tgt__=241219 -c0_0_reloadable22.bcf -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/softfloat/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libcxx-lite/lib/Release_LLVM -lme -lc -lm -lc++lite -lsoftfloat -S -export-locals -iconfig extra_memories.bcf -yTM -m -fC -fS -fH +m -T +work ../Release/chesswork6223 -pme
|
5 |
+
|
6 |
+
// Release: ipp V-2024.06-TGT-241219
|
7 |
+
|
8 |
+
// Symbols in memory 'DM_bankA':
|
9 |
+
// Symbols in memory 'DM_bankAB':
|
10 |
+
// Symbols in memory 'DM_bankAC':
|
11 |
+
// Symbols in memory 'DM_bankAD':
|
12 |
+
// Symbols in memory 'DM_bankB':
|
13 |
+
// Symbols in memory 'DM_bankBC':
|
14 |
+
// Symbols in memory 'DM_bankBD':
|
15 |
+
// Symbols in memory 'DM_bankC':
|
16 |
+
// Symbols in memory 'DM_bankCD':
|
17 |
+
// Symbols in memory 'DM_bankD':
|
18 |
+
// Symbols in memory 'DM_stack':
|
19 |
+
// Symbols in memory 'DM_test':
|
20 |
+
// Symbols in memory 'DMb':
|
21 |
+
_symbol _ZZN12mllib_graphs18resize_adf_wrapperI8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_Li1ELi0ELi0EEEvRNS2_9io_bufferIT_NS2_9direction2inET0_EERNSD_ISE_NSF_3outET1_EERA16_KjE8cur_iter 0x0007c45c
|
22 |
+
_symbol _ZN12me_primitive11control_satE 0x0007c464
|
23 |
+
_symbol _ZN12me_primitive11control_rndE 0x0007c468
|
24 |
+
_symbol float_rounding_mode 0x0007c46c
|
25 |
+
_symbol conv2d_params 0x0007c4c0
|
26 |
+
_symbol _ZZN12mllib_graphs18resize_adf_wrapperI8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_Li1ELi0ELi0EEEvRNS2_9io_bufferIT_NS2_9direction2inET0_EERNSD_ISE_NSF_3outET1_EERA16_KjE6params 0x0007c680
|
27 |
+
// Symbols in memory 'DMh':
|
28 |
+
// Symbols in memory 'DMh_bankA':
|
29 |
+
// Symbols in memory 'DMh_bankAB':
|
30 |
+
// Symbols in memory 'DMh_bankAC':
|
31 |
+
// Symbols in memory 'DMh_bankAD':
|
32 |
+
// Symbols in memory 'DMh_bankB':
|
33 |
+
// Symbols in memory 'DMh_bankBC':
|
34 |
+
// Symbols in memory 'DMh_bankBD':
|
35 |
+
// Symbols in memory 'DMh_bankC':
|
36 |
+
// Symbols in memory 'DMh_bankCD':
|
37 |
+
// Symbols in memory 'DMh_bankD':
|
38 |
+
// Symbols in memory 'DMh_stack':
|
39 |
+
// Symbols in memory 'DMs':
|
40 |
+
// Symbols in memory 'DMs_bankA':
|
41 |
+
// Symbols in memory 'DMs_bankAB':
|
42 |
+
// Symbols in memory 'DMs_bankAC':
|
43 |
+
// Symbols in memory 'DMs_bankAD':
|
44 |
+
// Symbols in memory 'DMs_bankB':
|
45 |
+
// Symbols in memory 'DMs_bankBC':
|
46 |
+
// Symbols in memory 'DMs_bankBD':
|
47 |
+
// Symbols in memory 'DMs_bankC':
|
48 |
+
// Symbols in memory 'DMs_bankCD':
|
49 |
+
// Symbols in memory 'DMs_bankD':
|
50 |
+
// Symbols in memory 'DMs_stack':
|
51 |
+
// Symbols in memory 'DMv':
|
52 |
+
// Symbols in memory 'DMv_bankA':
|
53 |
+
// Symbols in memory 'DMv_bankAB':
|
54 |
+
// Symbols in memory 'DMv_bankAC':
|
55 |
+
// Symbols in memory 'DMv_bankAD':
|
56 |
+
// Symbols in memory 'DMv_bankB':
|
57 |
+
// Symbols in memory 'DMv_bankBC':
|
58 |
+
// Symbols in memory 'DMv_bankBD':
|
59 |
+
// Symbols in memory 'DMv_bankC':
|
60 |
+
// Symbols in memory 'DMv_bankCD':
|
61 |
+
// Symbols in memory 'DMv_bankD':
|
62 |
+
// Symbols in memory 'DMv_stack':
|
63 |
+
// Symbols in memory 'DMw':
|
64 |
+
// Symbols in memory 'DMw_bankA':
|
65 |
+
// Symbols in memory 'DMw_bankAB':
|
66 |
+
// Symbols in memory 'DMw_bankAC':
|
67 |
+
// Symbols in memory 'DMw_bankAD':
|
68 |
+
// Symbols in memory 'DMw_bankB':
|
69 |
+
// Symbols in memory 'DMw_bankBC':
|
70 |
+
// Symbols in memory 'DMw_bankBD':
|
71 |
+
// Symbols in memory 'DMw_bankC':
|
72 |
+
// Symbols in memory 'DMw_bankCD':
|
73 |
+
// Symbols in memory 'DMw_bankD':
|
74 |
+
// Symbols in memory 'DMw_stack':
|
75 |
+
// Symbols in memory 'DMx':
|
76 |
+
// Symbols in memory 'DMx_bankA':
|
77 |
+
// Symbols in memory 'DMx_bankAB':
|
78 |
+
// Symbols in memory 'DMx_bankAC':
|
79 |
+
// Symbols in memory 'DMx_bankAD':
|
80 |
+
// Symbols in memory 'DMx_bankB':
|
81 |
+
// Symbols in memory 'DMx_bankBC':
|
82 |
+
// Symbols in memory 'DMx_bankBD':
|
83 |
+
// Symbols in memory 'DMx_bankC':
|
84 |
+
// Symbols in memory 'DMx_bankCD':
|
85 |
+
// Symbols in memory 'DMx_bankD':
|
86 |
+
// Symbols in memory 'DMx_stack':
|
87 |
+
// Symbols in memory 'PM':
|
88 |
+
_symbol _Z13kernelWrapperPPvjjjj 0x00000930
|
89 |
+
_symbol _Z24setup_conv2d_bf16_paramsILb1ELb0EEvPKjR18conv2d_bf16_paramshh 0x00000b60
|
90 |
+
_symbol _Z21convert_bf16_to_bfp16I8bfloat16Lb0EEvPT_PS0_RK13BfToBfpParams 0x00001100
|
91 |
+
_symbol _Z11conv2d_bf16ILh1EL5act_t0E8bfloat16S1_S1_N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_NS3_IS5_NS6_5asyncES9_SB_EELb0ELb0ELb1ELb0EEvRNS2_9io_bufferIT1_NS2_9direction2inET4_EERNSF_IT2_SI_T5_EERNSF_IT3_NSH_3outET6_EER18conv2d_bf16_params 0x00001210
|
92 |
+
_symbol _Z14conv2d_maxpoolRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEESF_RA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE 0x00001b80
|
93 |
+
_symbol _Z15resize_bilinearI8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_aS0_EEvPS1_S2_R29resize_common_internal_params 0x00001dc0
|
94 |
+
_symbol _ZN12mllib_graphs18resize_adf_wrapperI8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_Li1ELi0ELi0EEEvRNS2_9io_bufferIT_NS2_9direction2inET0_EERNSD_ISE_NSF_3outET1_EERA16_Kj 0x00002c90
|
95 |
+
_symbol _Z13_b787_wrapperPPv 0x000031f0
|
96 |
+
_symbol _Z13_b896_wrapperPPv 0x00003210
|
97 |
+
_symbol _Z11slice_hcwc8I8bfloat16EvPT_S2_R18slice_hcwc8_params 0x00003240
|
98 |
+
_symbol _ZN12mllib_graphs17slice_adf_wrapperILi1E8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_EEvRNS2_9io_bufferIT0_NS2_9direction2inET1_EERNSD_ISE_NSF_3outET2_EERA7_Kj 0x00003550
|
99 |
+
_symbol _Z13_b806_wrapperPPv 0x00003800
|
100 |
+
_symbol _ZN12mllib_graphs18concat_adf_wrapperI8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_SC_EEvRNS2_9io_bufferIT_NS2_9direction2inET0_EERNSD_ISE_SG_T1_EERNSD_ISE_NSF_3outET2_EERA8_Kj 0x00003820
|
101 |
+
_symbol _Z13_b820_wrapperPPv 0x00003b60
|
102 |
+
_symbol _ZN12me_primitive10udiv_dstepEjjRjS0_ 0x00003b90
|
103 |
+
_symbol int32_to_float32 0x00003dd0
|
104 |
+
// Symbols in memory 'PMw':
|
105 |
+
// Symbols in memory 'TM4':
|
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_2_reloadable22/Release/0_2_reloadable22.srv
ADDED
The diff for this file is too large to render.
See raw diff
|
|
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_2_reloadable22/Release/0_2_reloadable22.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_2_reloadable22/scripts/0_2_reloadable22.bcf
ADDED
@@ -0,0 +1,16 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
_reserved DMb 0x0 0x40000
|
2 |
+
|
3 |
+
_reserved PM 0x0 0x930 //reserved for main elf
|
4 |
+
|
5 |
+
_entry_point _Z13kernelWrapperPPvjjjj
|
6 |
+
_symbol _Z13kernelWrapperPPvjjjj 0x930
|
7 |
+
|
8 |
+
_reserved DMb 0x7b280 0x800 //reserved for lcp ping-pong buffers
|
9 |
+
_reserved DMb 0x7ba80 0x40 //reserved for sync buffer
|
10 |
+
_stack DM_stack 0x7bac0 0x940 //stack for core
|
11 |
+
_reserved DMb 0x7c400 0x40 //reserved for main elf heap
|
12 |
+
//space for synopsys compiler at 0x7c440 0x880//heap
|
13 |
+
_reserved DMb 0x40000 0x3b280
|
14 |
+
|
15 |
+
_reserved DMb 0x7ccc0 0x3340
|
16 |
+
_reserved DMb 0x80000 0x80000 // And everything else the core can't see
|
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_2_reloadable22/scripts/0_2_reloadable22.prx
ADDED
@@ -0,0 +1,13 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
<project name="Project" processor="me">
|
2 |
+
<issinit/>
|
3 |
+
<option id="cpp.define" value="__AIENGINE__ __AIE_ARCH__=21" inherit = "1"/>
|
4 |
+
<option id="llvm.xargs" value="-fno-jump-tables -fno-discard-value-names" inherit = "1"/>
|
5 |
+
<option id="llvm.lang" value="Follow file extension"/>
|
6 |
+
<option id="bridge.cfg" value="0_2_reloadable22.bcf"/>
|
7 |
+
<option id="bridge.alibs" value=" ../Release/0_2_reloadable22.o" inherit="1" cfg="Release_LLVM"/>
|
8 |
+
<option id="cpp.include" value="<XILINX_VITIS_AIETOOLS>/include /app/vaiml_1.3_examples/camo/./segmentation_1_4_0_fp32_combined/vaiml_par_0/0/backend /usr/local/lib/python3.10/site-packages/include/aie_api /usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/common /usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/include/common /usr/local/lib/python3.10/dist-packages/vitis_mllib /usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/misc /usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/src/ml_adf /app/vaiml_1.3_examples/camo/segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/<AIE_SRC_DIR> " inherit="1"/>
|
9 |
+
<option id="project.dir" value="<CONFIG>/0_2_reloadable22"/>
|
10 |
+
<option id="project.name" value="0_2_reloadable22"/>
|
11 |
+
<option id="project.type" value="exe"/>
|
12 |
+
<option id="simrun.issca" value="<XILINX_VITIS_AIETOOLS>/bin/unwrapped/lnx64.o/aie2p/ca_udm_dbg" inherit="0"/>
|
13 |
+
</project>
|
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_2_reloadable22/src/0_2_reloadable22.cc
ADDED
@@ -0,0 +1,81 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
// Automatically generated processor driver using AIEngine tool-chain
|
2 |
+
|
3 |
+
#include <stdio.h>
|
4 |
+
#include <memory>
|
5 |
+
#include <adf.h>
|
6 |
+
|
7 |
+
|
8 |
+
// Declare Kernel functions and initializers
|
9 |
+
#include "resize_adf_wrapper.cpp"
|
10 |
+
void conv2d_maxpool(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict,adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict,const unsigned int (&)[16],adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict);
|
11 |
+
#include "slice_adf_wrapper.cpp"
|
12 |
+
#include "concat_adf_wrapper.cpp"
|
13 |
+
|
14 |
+
// Declare Kernel objects and external arrays
|
15 |
+
|
16 |
+
|
17 |
+
void _b787_wrapper(void* args[])
|
18 |
+
{
|
19 |
+
mllib_graphs::resize_adf_wrapper<bfloat16, adf::io_buffer_config<adf::extents<>>, adf::io_buffer_config<adf::extents<>>, 1, 0, 0>(
|
20 |
+
*reinterpret_cast<adf::input_buffer_conf<bfloat16, adf::bpc_sync_0d>*>(args[0]),
|
21 |
+
*reinterpret_cast<adf::output_buffer_conf<bfloat16, adf::bpc_sync_0d>*>(args[1]),
|
22 |
+
*reinterpret_cast<uint32 const(*)[16]>(args[2]));
|
23 |
+
}
|
24 |
+
|
25 |
+
void _b896_wrapper(void* args[])
|
26 |
+
{
|
27 |
+
conv2d_maxpool(
|
28 |
+
*reinterpret_cast<adf::input_buffer_conf<bfloat16, adf::bpc_sync_0d>*>(args[0]),
|
29 |
+
*reinterpret_cast<adf::input_buffer_conf<bfloat16, adf::bpc_sync_0d>*>(args[1]),
|
30 |
+
*reinterpret_cast<uint32 const(*)[16]>(args[3]),
|
31 |
+
*reinterpret_cast<adf::output_buffer_conf<bfloat16, adf::bpc_async_0d>*>(args[2]));
|
32 |
+
}
|
33 |
+
|
34 |
+
void _b806_wrapper(void* args[])
|
35 |
+
{
|
36 |
+
mllib_graphs::slice_adf_wrapper<1, bfloat16, adf::io_buffer_config<adf::extents<>>, adf::io_buffer_config<adf::extents<>>>(
|
37 |
+
*reinterpret_cast<adf::input_buffer_conf<bfloat16, adf::bpc_sync_0d>*>(args[0]),
|
38 |
+
*reinterpret_cast<adf::output_buffer_conf<bfloat16, adf::bpc_sync_0d>*>(args[1]),
|
39 |
+
*reinterpret_cast<uint32 const(*)[7]>(args[2]));
|
40 |
+
}
|
41 |
+
|
42 |
+
void _b820_wrapper(void* args[])
|
43 |
+
{
|
44 |
+
mllib_graphs::concat_adf_wrapper<bfloat16, adf::io_buffer_config<adf::extents<>>, adf::io_buffer_config<adf::extents<>>, adf::io_buffer_config<adf::extents<>>>(
|
45 |
+
*reinterpret_cast<adf::input_buffer_conf<bfloat16, adf::bpc_sync_0d>*>(args[0]),
|
46 |
+
*reinterpret_cast<adf::input_buffer_conf<bfloat16, adf::bpc_sync_0d>*>(args[1]),
|
47 |
+
*reinterpret_cast<adf::output_buffer_conf<bfloat16, adf::bpc_sync_0d>*>(args[2]),
|
48 |
+
*reinterpret_cast<uint32 const(*)[8]>(args[3]));
|
49 |
+
}
|
50 |
+
|
51 |
+
using UniformKernelFunc = void (*)(void **);
|
52 |
+
|
53 |
+
static UniformKernelFunc g_uniformKernelFuncs[4] = {
|
54 |
+
_b787_wrapper,
|
55 |
+
_b896_wrapper,
|
56 |
+
_b806_wrapper,
|
57 |
+
_b820_wrapper
|
58 |
+
};
|
59 |
+
|
60 |
+
__attribute__((always_inline)) void kernelWrapper(void* args[], uint32 kernelId, uint32 numSyncIn, uint32 numAsyncIn, uint32 numSyncOut)
|
61 |
+
{
|
62 |
+
uint32 idx = 0;
|
63 |
+
reinterpret_cast<adf::_io_buffer_light_weight_generic*>(args[idx])->acquire<adf::direction::in>(numSyncIn > 0);
|
64 |
+
idx += (numSyncIn > 0) ? 1 : 0;
|
65 |
+
reinterpret_cast<adf::_io_buffer_light_weight_generic*>(args[idx])->acquire<adf::direction::in>(numSyncIn > 1);
|
66 |
+
idx += (numSyncIn > 1) ? 1 : 0;
|
67 |
+
idx += numAsyncIn;
|
68 |
+
reinterpret_cast<adf::_io_buffer_light_weight_generic*>(args[idx])->acquire<adf::direction::out>(numSyncOut > 0);
|
69 |
+
idx += (numSyncOut > 0) ? 1 : 0;
|
70 |
+
|
71 |
+
(*(g_uniformKernelFuncs[kernelId]))(args);
|
72 |
+
|
73 |
+
idx = 0;
|
74 |
+
reinterpret_cast<adf::_io_buffer_light_weight_generic*>(args[idx])->release<adf::direction::in>(numSyncIn > 0);
|
75 |
+
idx += (numSyncIn > 0) ? 1 : 0;
|
76 |
+
reinterpret_cast<adf::_io_buffer_light_weight_generic*>(args[idx])->release<adf::direction::in>(numSyncIn > 1);
|
77 |
+
idx += (numSyncIn > 1) ? 1 : 0;
|
78 |
+
idx += numAsyncIn;
|
79 |
+
reinterpret_cast<adf::_io_buffer_light_weight_generic*>(args[idx])->release<adf::direction::out>(numSyncOut > 0);
|
80 |
+
idx += (numSyncOut > 0) ? 1 : 0;
|
81 |
+
}
|
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_2_reloadable23/Release/0_2_reloadable23.calltree
ADDED
@@ -0,0 +1,92 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
|
2 |
+
// File generated by bridge version V-2024.06#84922c0d9f#241219, Fri Mar 21 04:02:00 2025
|
3 |
+
// Copyright 2014-2024 Synopsys, Inc. All rights reserved.
|
4 |
+
// bridge -o../Release/0_0_reloadable23 ../Release/0_0_reloadable23.o -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/isg -g -I/usr/local/lib/python3.10/dist-packages/include -I/app/vaiml_1.3_examples/camo/./segmentation_1_4_0_fp32_combined/vaiml_par_0/0/backend -I/usr/local/lib/python3.10/site-packages/include/aie_api -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/common -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/include/common -I/usr/local/lib/python3.10/dist-packages/vitis_mllib -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/misc -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/src/ml_adf -I/app/vaiml_1.3_examples/camo/segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/. -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libcxx-lite/include -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libs/libcxx-9.0.0/include-lite -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime/include -D__AIENGINE__ -D__AIE_ARCH__=21 -DDEPLOYMENT_ELF=1 -D__LOCK_FENCE_MODE__=0 -D__IO_BUFFER_FORCE_LIGHT_WEIGHT__ -DAIE_API_EMULATE_BFLOAT16_MMUL_WITH_BFP16=1 -DAIE_OPTION_SCALAR_FLOAT_ON_VECTOR -D__tct_tgt__=241219 -c0_0_reloadable23.bcf -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/softfloat/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libcxx-lite/lib/Release_LLVM -lme -lc -lm -lc++lite -lsoftfloat -S -export-locals -iconfig extra_memories.bcf -yTM -m -fC -fS -fH +m -T +work ../Release/chesswork6583 -pme
|
5 |
+
|
6 |
+
|
7 |
+
// Release: ipp V-2024.06-TGT-241219
|
8 |
+
|
9 |
+
_Z13kernelWrapperPPvjjjj
|
10 |
+
_Z14_b1638_wrapperPPv (referenced text)
|
11 |
+
_Z21superkernel_sigmoid1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE
|
12 |
+
_ZN17elementwise_unaryI8bfloat1619elementwise_sigmoidIS0_E26sigmoid_templated_params_tIS0_EE5setupER26elementwise_unary_params_tIS4_EPKv
|
13 |
+
_ZN17elementwise_unaryI8bfloat1619elementwise_sigmoidIS0_E26sigmoid_templated_params_tIS0_EE3runEPS0_S6_R26elementwise_unary_params_tIS4_E
|
14 |
+
_Z13_b806_wrapperPPv (referenced text)
|
15 |
+
_ZN12mllib_graphs17slice_adf_wrapperILi1E8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_EEvRNS2_9io_bufferIT0_NS2_9direction2inET1_EERNSD_ISE_NSF_3outET2_EERA7_Kj
|
16 |
+
_Z11slice_hcwc8I8bfloat16EvPT_S2_R18slice_hcwc8_params
|
17 |
+
_Z14_b1655_wrapperPPv (referenced text)
|
18 |
+
_Z17superkernel_sub1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERNS0_IS1_NS2_3outESK_EE
|
19 |
+
_ZN25elementwise_binary_sharedI8bfloat168sub_implIS0_E15shared_params_tIS0_EL5act_t0EE5setupER27elementwise_binary_params_tIS4_EPKv
|
20 |
+
_ZN25elementwise_binary_sharedI8bfloat168sub_implIS0_E15shared_params_tIS0_EL5act_t0EE21shared_setup_backboneER27elementwise_binary_params_tIS4_EPKv
|
21 |
+
_ZN25elementwise_binary_sharedI8bfloat168sub_implIS0_E15shared_params_tIS0_EL5act_t0EE3runEPS0_S7_S7_R27elementwise_binary_params_tIS4_E
|
22 |
+
_ZL19shared_run_backboneI8bfloat16L5act_t0EEKvPT_S4_S4_R27elementwise_binary_params_tI15shared_params_tIS3_EE
|
23 |
+
_Z13_b891_wrapperPPv (referenced text)
|
24 |
+
_Z17superkernel_mul1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERNS0_IS1_NS2_3outESK_EE
|
25 |
+
_ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS4_EPKv
|
26 |
+
_ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS4_E
|
27 |
+
_ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE3runEPS0_S6_S6_R27elementwise_binary_params_tIS4_E
|
28 |
+
_Z13_b820_wrapperPPv (referenced text)
|
29 |
+
_ZN12mllib_graphs18concat_adf_wrapperI8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_SC_EEvRNS2_9io_bufferIT_NS2_9direction2inET0_EERNSD_ISE_SG_T1_EERNSD_ISE_NSF_3outET2_EERA8_Kj
|
30 |
+
_Z13_b896_wrapperPPv (referenced text)
|
31 |
+
_Z14conv2d_maxpoolRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEESF_RA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE
|
32 |
+
_Z24setup_conv2d_bf16_paramsILb1ELb0EEvPKjR18conv2d_bf16_paramshh
|
33 |
+
_Z11conv2d_bf16ILh1EL5act_t0E8bfloat16S1_S1_N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_NS3_IS5_NS6_5asyncES9_SB_EELb0ELb0ELb1ELb0EEvRNS2_9io_bufferIT1_NS2_9direction2inET4_EERNSF_IT2_SI_T5_EERNSF_IT3_NSH_3outET6_EER18conv2d_bf16_params
|
34 |
+
_Z21convert_bf16_to_bfp16I8bfloat16Lb0EEvPT_PS0_RK13BfToBfpParams
|
35 |
+
_Z14_b1672_wrapperPPv (referenced text)
|
36 |
+
_Z18superkernel_tanh1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE
|
37 |
+
_ZN17elementwise_unaryI8bfloat1616elementwise_tanhIS0_E23tanh_templated_params_tIS0_EE5setupER26elementwise_unary_params_tIS4_EPKv
|
38 |
+
_ZN17elementwise_unaryI8bfloat1616elementwise_tanhIS0_E23tanh_templated_params_tIS0_EE3runEPS0_S6_R26elementwise_unary_params_tIS4_E
|
39 |
+
_Z13_b886_wrapperPPv (referenced text)
|
40 |
+
_Z17superkernel_add1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERNS0_IS1_NS2_3outESK_EE
|
41 |
+
_ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE5setupER27elementwise_binary_params_tIS5_EPKv
|
42 |
+
_ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE21shared_setup_backboneER27elementwise_binary_params_tIS5_EPKv
|
43 |
+
_ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE3runEPS0_S7_S7_R27elementwise_binary_params_tIS5_E
|
44 |
+
_ZL19shared_run_backboneI8bfloat16L5act_t0EEKvPT_S4_S4_R27elementwise_binary_params_tI15shared_params_tIS3_EE (*)
|
45 |
+
|
46 |
+
|
47 |
+
Call tree stack and functions sizes:
|
48 |
+
|
49 |
+
stack stack stack call func func function name
|
50 |
+
desc level level desc
|
51 |
+
----- ----- ----- ----- ----- ----- --------------------------------------------------------------
|
52 |
+
64 512 0 0 546 13444 _Z13kernelWrapperPPvjjjj
|
53 |
+
0 64 1 1 32 960 _Z14_b1638_wrapperPPv
|
54 |
+
64 64 1 2 488 928 _Z21superkernel_sigmoid1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE <tail call>
|
55 |
+
0 0 2 3 62 62 _ZN17elementwise_unaryI8bfloat1619elementwise_sigmoidIS0_E26sigmoid_templated_params_tIS0_EE5setupER26elementwise_unary_params_tIS4_EPKv
|
56 |
+
0 0 2 3 378 378 _ZN17elementwise_unaryI8bfloat1619elementwise_sigmoidIS0_E26sigmoid_templated_params_tIS0_EE3runEPS0_S6_R26elementwise_unary_params_tIS4_E
|
57 |
+
0 192 1 1 32 1488 _Z13_b806_wrapperPPv
|
58 |
+
192 192 1 2 674 1456 _ZN12mllib_graphs17slice_adf_wrapperILi1E8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_EEvRNS2_9io_bufferIT0_NS2_9direction2inET1_EERNSD_ISE_NSF_3outET2_EERA7_Kj <tail call>
|
59 |
+
0 0 2 3 782 782 _Z11slice_hcwc8I8bfloat16EvPT_S2_R18slice_hcwc8_params
|
60 |
+
0 192 1 1 36 1378 _Z14_b1655_wrapperPPv
|
61 |
+
64 192 1 2 602 1342 _Z17superkernel_sub1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERNS0_IS1_NS2_3outESK_EE <tail call>
|
62 |
+
64 64 2 3 74 190 _ZN25elementwise_binary_sharedI8bfloat168sub_implIS0_E15shared_params_tIS0_EL5act_t0EE5setupER27elementwise_binary_params_tIS4_EPKv
|
63 |
+
0 0 3 4 116 116 _ZN25elementwise_binary_sharedI8bfloat168sub_implIS0_E15shared_params_tIS0_EL5act_t0EE21shared_setup_backboneER27elementwise_binary_params_tIS4_EPKv
|
64 |
+
0 128 2 3 16 550 _ZN25elementwise_binary_sharedI8bfloat168sub_implIS0_E15shared_params_tIS0_EL5act_t0EE3runEPS0_S7_S7_R27elementwise_binary_params_tIS4_E
|
65 |
+
128 128 2 4 534 534 _ZL19shared_run_backboneI8bfloat16L5act_t0EEKvPT_S4_S4_R27elementwise_binary_params_tI15shared_params_tIS3_EE <tail call>
|
66 |
+
0 128 1 1 36 1092 _Z13_b891_wrapperPPv
|
67 |
+
64 128 1 2 602 1056 _Z17superkernel_mul1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERNS0_IS1_NS2_3outESK_EE <tail call>
|
68 |
+
64 64 2 3 138 162 _ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS4_EPKv
|
69 |
+
0 0 3 4 24 24 _ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS4_E
|
70 |
+
0 0 2 3 292 292 _ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE3runEPS0_S6_S6_R27elementwise_binary_params_tIS4_E
|
71 |
+
0 0 1 1 36 854 _Z13_b820_wrapperPPv
|
72 |
+
0 0 1 2 818 818 _ZN12mllib_graphs18concat_adf_wrapperI8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_SC_EEvRNS2_9io_bufferIT_NS2_9direction2inET0_EERNSD_ISE_SG_T1_EERNSD_ISE_NSF_3outET2_EERA8_Kj <tail call>
|
73 |
+
0 192 1 1 36 4714 _Z13_b896_wrapperPPv
|
74 |
+
64 192 1 2 568 4678 _Z14conv2d_maxpoolRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEESF_RA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE <tail call>
|
75 |
+
64 64 2 3 1430 1430 _Z24setup_conv2d_bf16_paramsILb1ELb0EEvPKjR18conv2d_bf16_paramshh
|
76 |
+
128 128 2 3 2410 2680 _Z11conv2d_bf16ILh1EL5act_t0E8bfloat16S1_S1_N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_NS3_IS5_NS6_5asyncES9_SB_EELb0ELb0ELb1ELb0EEvRNS2_9io_bufferIT1_NS2_9direction2inET4_EERNSF_IT2_SI_T5_EERNSF_IT3_NSH_3outET6_EER18conv2d_bf16_params
|
77 |
+
0 0 3 4 270 270 _Z21convert_bf16_to_bfp16I8bfloat16Lb0EEvPT_PS0_RK13BfToBfpParams
|
78 |
+
0 448 1 1 32 1544 _Z14_b1672_wrapperPPv
|
79 |
+
64 448 1 2 488 1512 _Z18superkernel_tanh1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE <tail call>
|
80 |
+
0 0 2 3 62 62 _ZN17elementwise_unaryI8bfloat1616elementwise_tanhIS0_E23tanh_templated_params_tIS0_EE5setupER26elementwise_unary_params_tIS4_EPKv
|
81 |
+
384 384 2 3 962 962 _ZN17elementwise_unaryI8bfloat1616elementwise_tanhIS0_E23tanh_templated_params_tIS0_EE3runEPS0_S6_R26elementwise_unary_params_tIS4_E
|
82 |
+
0 192 1 1 36 1402 _Z13_b886_wrapperPPv
|
83 |
+
64 192 1 2 602 1366 _Z17superkernel_add1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERNS0_IS1_NS2_3outESK_EE <tail call>
|
84 |
+
64 64 2 3 98 214 _ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE5setupER27elementwise_binary_params_tIS5_EPKv
|
85 |
+
0 0 3 4 116 116 _ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE21shared_setup_backboneER27elementwise_binary_params_tIS5_EPKv
|
86 |
+
0 128 2 3 16 550 _ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE3runEPS0_S7_S7_R27elementwise_binary_params_tIS5_E
|
87 |
+
128 128 2 4 534 534 _ZL19shared_run_backboneI8bfloat16L5act_t0EEKvPT_S4_S4_R27elementwise_binary_params_tI15shared_params_tIS3_EE <tail call>
|
88 |
+
|
89 |
+
|
90 |
+
Maximum call level : 4
|
91 |
+
Maximum stack level: 3
|
92 |
+
Maximum stack size : 512
|
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_2_reloadable23/Release/0_2_reloadable23.cmic2
ADDED
The diff for this file is too large to render.
See raw diff
|
|
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_2_reloadable23/Release/0_2_reloadable23.cmico
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
+Mdec
|
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_2_reloadable23/Release/0_2_reloadable23.lst
ADDED
The diff for this file is too large to render.
See raw diff
|
|
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_2_reloadable23/Release/0_2_reloadable23.map
ADDED
@@ -0,0 +1,296 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
|
2 |
+
// File generated by bridge version V-2024.06#84922c0d9f#241219, Fri Mar 21 04:02:00 2025
|
3 |
+
// Copyright 2014-2024 Synopsys, Inc. All rights reserved.
|
4 |
+
// bridge -o../Release/0_0_reloadable23 ../Release/0_0_reloadable23.o -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/isg -g -I/usr/local/lib/python3.10/dist-packages/include -I/app/vaiml_1.3_examples/camo/./segmentation_1_4_0_fp32_combined/vaiml_par_0/0/backend -I/usr/local/lib/python3.10/site-packages/include/aie_api -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/common -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/include/common -I/usr/local/lib/python3.10/dist-packages/vitis_mllib -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/misc -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/src/ml_adf -I/app/vaiml_1.3_examples/camo/segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/. -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libcxx-lite/include -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libs/libcxx-9.0.0/include-lite -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime/include -D__AIENGINE__ -D__AIE_ARCH__=21 -DDEPLOYMENT_ELF=1 -D__LOCK_FENCE_MODE__=0 -D__IO_BUFFER_FORCE_LIGHT_WEIGHT__ -DAIE_API_EMULATE_BFLOAT16_MMUL_WITH_BFP16=1 -DAIE_OPTION_SCALAR_FLOAT_ON_VECTOR -D__tct_tgt__=241219 -c0_0_reloadable23.bcf -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/softfloat/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libcxx-lite/lib/Release_LLVM -lme -lc -lm -lc++lite -lsoftfloat -S -export-locals -iconfig extra_memories.bcf -yTM -m -fC -fS -fH +m -T +work ../Release/chesswork6583 -pme
|
5 |
+
|
6 |
+
// Release: ipp V-2024.06-TGT-241219
|
7 |
+
|
8 |
+
Memory map for memory 'DM_stack':
|
9 |
+
|
10 |
+
Size = 1048576
|
11 |
+
Width = 8 bits
|
12 |
+
Offset = 0
|
13 |
+
Used = 2368
|
14 |
+
|
15 |
+
0x0007bac0..0x0007c3ff ( 2368 items) : Stack
|
16 |
+
|
17 |
+
Memory map for memory 'DMb':
|
18 |
+
|
19 |
+
Size = 1048576
|
20 |
+
Width = 8 bits
|
21 |
+
Offset = 0
|
22 |
+
Used = 3217
|
23 |
+
|
24 |
+
0x00000000..0x0007babf ( 506560 items) : Reserved
|
25 |
+
0x0007bac0..0x0007c3ff ( 2368 items) : Stack
|
26 |
+
0x0007c400..0x0007c43f ( 64 items) : Reserved
|
27 |
+
0x0007c440..0x0007c443 ( 4 items) : ../Release/0_0_reloadable23.o::_ZL9curr_iter (Data, Local, .bss.DMb.4)
|
28 |
+
0x0007c444..0x0007c447 ( 4 items) : ../Release/0_0_reloadable23.o::_ZL14num_depth_iter (Data, Local, .bss.DMb.4)
|
29 |
+
0x0007c448..0x0007c44b ( 4 items) : ../Release/0_0_reloadable23.o::_ZL10depth_iter (Data, Local, .bss.DMb.4)
|
30 |
+
0x0007c44c..0x0007c44f ( 4 items) : ../Release/0_0_reloadable23.o::_ZL11total_iters (Data, Local, .bss.DMb.4)
|
31 |
+
0x0007c450..0x0007c453 ( 4 items) : ../Release/0_0_reloadable23.o::_ZL8core_row (Data, Local, .bss.DMb.4)
|
32 |
+
0x0007c454..0x0007c457 ( 4 items) : ../Release/0_0_reloadable23.o::_ZL11ifm1_offset (Data, Local, .bss.DMb.4)
|
33 |
+
0x0007c458..0x0007c45b ( 4 items) : ../Release/0_0_reloadable23.o::_ZL11ifm2_offset (Data, Local, .bss.DMb.4)
|
34 |
+
0x0007c45c..0x0007c45f ( 4 items) : ../Release/0_0_reloadable23.o::_ZN9ns_concatL11kernel_iterE (Data, Local, .bss.DMb.4)
|
35 |
+
0x0007c460..0x0007c463 ( 4 items) : ../Release/0_0_reloadable23.o::_ZN9ns_concatL8core_colE (Data, Local, .bss.DMb.4)
|
36 |
+
0x0007c464..0x0007c467 ( 4 items) : ../Release/0_0_reloadable23.o::_ZN9ns_concatL8core_rowE (Data, Local, .bss.DMb.4)
|
37 |
+
0x0007c468..0x0007c46b ( 4 items) : ../Release/0_0_reloadable23.o::_ZL8num_iter (Data, Local, .data.DMb.4)
|
38 |
+
0x0007c46c..0x0007c46f ( 4 items) : me_defs.o(/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/Release/libme.a)::_ZN12me_primitive11control_satE (Data, Global, .bss.DMb.4)
|
39 |
+
0x0007c470..0x0007c470 ( 1 items) : me_defs.o(/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/Release/libme.a)::_ZN12me_primitive11control_rndE (Data, Global, .bss.DMb.1)
|
40 |
+
0x0007c480..0x0007c49f ( 32 items) : ../Release/0_0_reloadable23.o::_ZL20g_uniformKernelFuncs (Data, Local, .rodata.DMb.64)
|
41 |
+
|
42 |
+
Called functions : _Z14_b1638_wrapperPPv
|
43 |
+
_Z13_b806_wrapperPPv
|
44 |
+
_Z14_b1655_wrapperPPv
|
45 |
+
_Z13_b891_wrapperPPv
|
46 |
+
_Z13_b820_wrapperPPv
|
47 |
+
_Z13_b896_wrapperPPv
|
48 |
+
_Z14_b1672_wrapperPPv
|
49 |
+
_Z13_b886_wrapperPPv
|
50 |
+
|
51 |
+
0x0007c4c0..0x0007c4ff ( 64 items) : ../Release/0_0_reloadable23.o::add1d_params (Data, Global, .bss.DMb.64)
|
52 |
+
0x0007c500..0x0007c53f ( 64 items) : ../Release/0_0_reloadable23.o::mul1d_params (Data, Global, .bss.DMb.64)
|
53 |
+
0x0007c540..0x0007c57f ( 64 items) : ../Release/0_0_reloadable23.o::sub1d_params (Data, Global, .bss.DMb.64)
|
54 |
+
0x0007c580..0x0007c5bf ( 64 items) : ../Release/0_0_reloadable23.o::sigmoid1d_params (Data, Global, .bss.DMb.64)
|
55 |
+
0x0007c5c0..0x0007c5ff ( 64 items) : ../Release/0_0_reloadable23.o::tanh1d_params (Data, Global, .bss.DMb.64)
|
56 |
+
0x0007c600..0x0007c7bf ( 448 items) : ../Release/0_0_reloadable23.o::conv2d_params (Data, Global, .bss.DMb.64)
|
57 |
+
0x0007ccc0..0x000fffff ( 537408 items) : Reserved
|
58 |
+
|
59 |
+
Memory map for memory 'PM':
|
60 |
+
|
61 |
+
Size = 1048576
|
62 |
+
Width = 8 bits
|
63 |
+
Offset = 0
|
64 |
+
Used = 13444
|
65 |
+
|
66 |
+
0x00000000..0x0000092f ( 2352 items) : Reserved
|
67 |
+
0x00000930..0x00000b51 ( 546 items) : ../Release/0_0_reloadable23.o::_Z13kernelWrapperPPvjjjj (Function, Global, .text) (stack frame size = 64)
|
68 |
+
|
69 |
+
Referenced symbols: _ZL20g_uniformKernelFuncs
|
70 |
+
|
71 |
+
0x00000b60..0x000010f5 ( 1430 items) : ../Release/0_0_reloadable23.o::_Z24setup_conv2d_bf16_paramsILb1ELb0EEvPKjR18conv2d_bf16_paramshh (Function, Weak, .text) (stack frame size = 64)
|
72 |
+
0x00001100..0x0000120d ( 270 items) : ../Release/0_0_reloadable23.o::_Z21convert_bf16_to_bfp16I8bfloat16Lb0EEvPT_PS0_RK13BfToBfpParams (Function, Weak, .text) (stack frame size = 0)
|
73 |
+
|
74 |
+
Referenced symbols: _ZN12me_primitive11control_rndE
|
75 |
+
|
76 |
+
0x00001210..0x00001b79 ( 2410 items) : ../Release/0_0_reloadable23.o::_Z11conv2d_bf16ILh1EL5act_t0E8bfloat16S1_S1_N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_NS3_IS5_NS6_5asyncES9_SB_EELb0ELb0ELb1ELb0EEvRNS2_9io_bufferIT1_NS2_9direction2inET4_EERNSF_IT2_SI_T5_EERNSF_IT3_NSH_3outET6_EER18conv2d_bf16_params (Function, Weak, .text) (stack frame size = 128)
|
77 |
+
|
78 |
+
Called functions : _Z21convert_bf16_to_bfp16I8bfloat16Lb0EEvPT_PS0_RK13BfToBfpParams
|
79 |
+
|
80 |
+
Referenced symbols: _ZN12me_primitive11control_rndE
|
81 |
+
|
82 |
+
0x00001b80..0x00001db7 ( 568 items) : ../Release/0_0_reloadable23.o::_Z14conv2d_maxpoolRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEESF_RA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE (Function, Global, .text) (stack frame size = 64)
|
83 |
+
|
84 |
+
Called functions : _Z24setup_conv2d_bf16_paramsILb1ELb0EEvPKjR18conv2d_bf16_paramshh
|
85 |
+
_Z11conv2d_bf16ILh1EL5act_t0E8bfloat16S1_S1_N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_NS3_IS5_NS6_5asyncES9_SB_EELb0ELb0ELb1ELb0EEvRNS2_9io_bufferIT1_NS2_9direction2inET4_EERNSF_IT2_SI_T5_EERNSF_IT3_NSH_3outET6_EER18conv2d_bf16_params
|
86 |
+
|
87 |
+
Referenced symbols: _ZL9curr_iter
|
88 |
+
conv2d_params
|
89 |
+
_ZN12me_primitive11control_rndE
|
90 |
+
_ZN12me_primitive11control_satE
|
91 |
+
_ZL14num_depth_iter
|
92 |
+
_ZL8num_iter
|
93 |
+
_ZL10depth_iter
|
94 |
+
_ZL11total_iters
|
95 |
+
|
96 |
+
0x00001dc0..0x00001fd5 ( 534 items) : ../Release/0_0_reloadable23.o::_ZL19shared_run_backboneI8bfloat16L5act_t0EEKvPT_S4_S4_R27elementwise_binary_params_tI15shared_params_tIS3_EE (Function, Local, .text) (stack frame size = 128)
|
97 |
+
|
98 |
+
Referenced symbols: _ZN12me_primitive11control_rndE
|
99 |
+
|
100 |
+
0x00001fe0..0x0000201d ( 62 items) : ../Release/0_0_reloadable23.o::_ZN17elementwise_unaryI8bfloat1619elementwise_sigmoidIS0_E26sigmoid_templated_params_tIS0_EE5setupER26elementwise_unary_params_tIS4_EPKv (Function, Weak, .text) (stack frame size = 0)
|
101 |
+
0x00002020..0x00002199 ( 378 items) : ../Release/0_0_reloadable23.o::_ZN17elementwise_unaryI8bfloat1619elementwise_sigmoidIS0_E26sigmoid_templated_params_tIS0_EE3runEPS0_S6_R26elementwise_unary_params_tIS4_E (Function, Weak, .text) (stack frame size = 0)
|
102 |
+
|
103 |
+
Referenced symbols: _ZN12me_primitive11control_rndE
|
104 |
+
|
105 |
+
0x000021a0..0x00002387 ( 488 items) : ../Release/0_0_reloadable23.o::_Z21superkernel_sigmoid1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE (Function, Global, .text) (stack frame size = 64)
|
106 |
+
|
107 |
+
Called functions : _ZN17elementwise_unaryI8bfloat1619elementwise_sigmoidIS0_E26sigmoid_templated_params_tIS0_EE5setupER26elementwise_unary_params_tIS4_EPKv
|
108 |
+
_ZN17elementwise_unaryI8bfloat1619elementwise_sigmoidIS0_E26sigmoid_templated_params_tIS0_EE3runEPS0_S6_R26elementwise_unary_params_tIS4_E
|
109 |
+
|
110 |
+
Referenced symbols: _ZL9curr_iter
|
111 |
+
_ZL8core_row
|
112 |
+
sigmoid1d_params
|
113 |
+
_ZN12me_primitive11control_rndE
|
114 |
+
_ZN12me_primitive11control_satE
|
115 |
+
_ZL11ifm1_offset
|
116 |
+
_ZL8num_iter
|
117 |
+
|
118 |
+
0x00002390..0x000023cd ( 62 items) : ../Release/0_0_reloadable23.o::_ZN17elementwise_unaryI8bfloat1616elementwise_tanhIS0_E23tanh_templated_params_tIS0_EE5setupER26elementwise_unary_params_tIS4_EPKv (Function, Weak, .text) (stack frame size = 0)
|
119 |
+
0x000023d0..0x00002791 ( 962 items) : ../Release/0_0_reloadable23.o::_ZN17elementwise_unaryI8bfloat1616elementwise_tanhIS0_E23tanh_templated_params_tIS0_EE3runEPS0_S6_R26elementwise_unary_params_tIS4_E (Function, Weak, .text) (stack frame size = 384)
|
120 |
+
|
121 |
+
Referenced symbols: _ZN12me_primitive11control_rndE
|
122 |
+
|
123 |
+
0x000027a0..0x00002987 ( 488 items) : ../Release/0_0_reloadable23.o::_Z18superkernel_tanh1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE (Function, Global, .text) (stack frame size = 64)
|
124 |
+
|
125 |
+
Called functions : _ZN17elementwise_unaryI8bfloat1616elementwise_tanhIS0_E23tanh_templated_params_tIS0_EE5setupER26elementwise_unary_params_tIS4_EPKv
|
126 |
+
_ZN17elementwise_unaryI8bfloat1616elementwise_tanhIS0_E23tanh_templated_params_tIS0_EE3runEPS0_S6_R26elementwise_unary_params_tIS4_E
|
127 |
+
|
128 |
+
Referenced symbols: _ZL9curr_iter
|
129 |
+
_ZL8core_row
|
130 |
+
tanh1d_params
|
131 |
+
_ZN12me_primitive11control_rndE
|
132 |
+
_ZN12me_primitive11control_satE
|
133 |
+
_ZL11ifm1_offset
|
134 |
+
_ZL8num_iter
|
135 |
+
|
136 |
+
0x00002990..0x00002a03 ( 116 items) : ../Release/0_0_reloadable23.o::_ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE21shared_setup_backboneER27elementwise_binary_params_tIS5_EPKv (Function, Weak, .text) (stack frame size = 0)
|
137 |
+
0x00002a10..0x00002a71 ( 98 items) : ../Release/0_0_reloadable23.o::_ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE5setupER27elementwise_binary_params_tIS5_EPKv (Function, Weak, .text) (stack frame size = 64)
|
138 |
+
|
139 |
+
Called functions : _ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE21shared_setup_backboneER27elementwise_binary_params_tIS5_EPKv
|
140 |
+
|
141 |
+
0x00002a80..0x00002a8f ( 16 items) : ../Release/0_0_reloadable23.o::_ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE3runEPS0_S7_S7_R27elementwise_binary_params_tIS5_E (Function, Weak, .text) (stack frame size = 0)
|
142 |
+
|
143 |
+
Called functions : _ZL19shared_run_backboneI8bfloat16L5act_t0EEKvPT_S4_S4_R27elementwise_binary_params_tI15shared_params_tIS3_EE
|
144 |
+
|
145 |
+
0x00002a90..0x00002ce9 ( 602 items) : ../Release/0_0_reloadable23.o::_Z17superkernel_add1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERNS0_IS1_NS2_3outESK_EE (Function, Global, .text) (stack frame size = 64)
|
146 |
+
|
147 |
+
Called functions : _ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE5setupER27elementwise_binary_params_tIS5_EPKv
|
148 |
+
_ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE3runEPS0_S7_S7_R27elementwise_binary_params_tIS5_E
|
149 |
+
|
150 |
+
Referenced symbols: _ZL9curr_iter
|
151 |
+
_ZL8core_row
|
152 |
+
add1d_params
|
153 |
+
_ZN12me_primitive11control_rndE
|
154 |
+
_ZN12me_primitive11control_satE
|
155 |
+
_ZL11ifm1_offset
|
156 |
+
_ZL11ifm2_offset
|
157 |
+
_ZL8num_iter
|
158 |
+
|
159 |
+
0x00002cf0..0x00002d07 ( 24 items) : ../Release/0_0_reloadable23.o::_ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS4_E (Function, Weak, .text) (stack frame size = 0)
|
160 |
+
0x00002d10..0x00002d99 ( 138 items) : ../Release/0_0_reloadable23.o::_ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS4_EPKv (Function, Weak, .text) (stack frame size = 64)
|
161 |
+
|
162 |
+
Called functions : _ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS4_E
|
163 |
+
|
164 |
+
0x00002da0..0x00002ec3 ( 292 items) : ../Release/0_0_reloadable23.o::_ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE3runEPS0_S6_S6_R27elementwise_binary_params_tIS4_E (Function, Weak, .text) (stack frame size = 0)
|
165 |
+
|
166 |
+
Referenced symbols: _ZN12me_primitive11control_rndE
|
167 |
+
|
168 |
+
0x00002ed0..0x00003129 ( 602 items) : ../Release/0_0_reloadable23.o::_Z17superkernel_mul1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERNS0_IS1_NS2_3outESK_EE (Function, Global, .text) (stack frame size = 64)
|
169 |
+
|
170 |
+
Called functions : _ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS4_EPKv
|
171 |
+
_ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE3runEPS0_S6_S6_R27elementwise_binary_params_tIS4_E
|
172 |
+
|
173 |
+
Referenced symbols: _ZL9curr_iter
|
174 |
+
_ZL8core_row
|
175 |
+
mul1d_params
|
176 |
+
_ZN12me_primitive11control_rndE
|
177 |
+
_ZN12me_primitive11control_satE
|
178 |
+
_ZL11ifm1_offset
|
179 |
+
_ZL11ifm2_offset
|
180 |
+
_ZL8num_iter
|
181 |
+
|
182 |
+
0x00003130..0x000031a3 ( 116 items) : ../Release/0_0_reloadable23.o::_ZN25elementwise_binary_sharedI8bfloat168sub_implIS0_E15shared_params_tIS0_EL5act_t0EE21shared_setup_backboneER27elementwise_binary_params_tIS4_EPKv (Function, Weak, .text) (stack frame size = 0)
|
183 |
+
0x000031b0..0x000031f9 ( 74 items) : ../Release/0_0_reloadable23.o::_ZN25elementwise_binary_sharedI8bfloat168sub_implIS0_E15shared_params_tIS0_EL5act_t0EE5setupER27elementwise_binary_params_tIS4_EPKv (Function, Weak, .text) (stack frame size = 64)
|
184 |
+
|
185 |
+
Called functions : _ZN25elementwise_binary_sharedI8bfloat168sub_implIS0_E15shared_params_tIS0_EL5act_t0EE21shared_setup_backboneER27elementwise_binary_params_tIS4_EPKv
|
186 |
+
|
187 |
+
0x00003200..0x0000320f ( 16 items) : ../Release/0_0_reloadable23.o::_ZN25elementwise_binary_sharedI8bfloat168sub_implIS0_E15shared_params_tIS0_EL5act_t0EE3runEPS0_S7_S7_R27elementwise_binary_params_tIS4_E (Function, Weak, .text) (stack frame size = 0)
|
188 |
+
|
189 |
+
Called functions : _ZL19shared_run_backboneI8bfloat16L5act_t0EEKvPT_S4_S4_R27elementwise_binary_params_tI15shared_params_tIS3_EE
|
190 |
+
|
191 |
+
0x00003210..0x00003469 ( 602 items) : ../Release/0_0_reloadable23.o::_Z17superkernel_sub1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERNS0_IS1_NS2_3outESK_EE (Function, Global, .text) (stack frame size = 64)
|
192 |
+
|
193 |
+
Called functions : _ZN25elementwise_binary_sharedI8bfloat168sub_implIS0_E15shared_params_tIS0_EL5act_t0EE5setupER27elementwise_binary_params_tIS4_EPKv
|
194 |
+
_ZN25elementwise_binary_sharedI8bfloat168sub_implIS0_E15shared_params_tIS0_EL5act_t0EE3runEPS0_S7_S7_R27elementwise_binary_params_tIS4_E
|
195 |
+
|
196 |
+
Referenced symbols: _ZL9curr_iter
|
197 |
+
_ZL8core_row
|
198 |
+
sub1d_params
|
199 |
+
_ZN12me_primitive11control_rndE
|
200 |
+
_ZN12me_primitive11control_satE
|
201 |
+
_ZL11ifm1_offset
|
202 |
+
_ZL11ifm2_offset
|
203 |
+
_ZL8num_iter
|
204 |
+
|
205 |
+
0x00003470..0x0000348f ( 32 items) : ../Release/0_0_reloadable23.o::_Z14_b1638_wrapperPPv (Function, Global, .text) (stack frame size = 0)
|
206 |
+
|
207 |
+
Called functions : _Z21superkernel_sigmoid1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE
|
208 |
+
|
209 |
+
0x00003490..0x0000379d ( 782 items) : ../Release/0_0_reloadable23.o::_Z11slice_hcwc8I8bfloat16EvPT_S2_R18slice_hcwc8_params (Function, Weak, .text) (stack frame size = 0)
|
210 |
+
0x000037a0..0x00003a41 ( 674 items) : ../Release/0_0_reloadable23.o::_ZN12mllib_graphs17slice_adf_wrapperILi1E8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_EEvRNS2_9io_bufferIT0_NS2_9direction2inET1_EERNSD_ISE_NSF_3outET2_EERA7_Kj (Function, Weak, .text) (stack frame size = 192)
|
211 |
+
|
212 |
+
Called functions : _Z11slice_hcwc8I8bfloat16EvPT_S2_R18slice_hcwc8_params
|
213 |
+
|
214 |
+
0x00003a50..0x00003a6f ( 32 items) : ../Release/0_0_reloadable23.o::_Z13_b806_wrapperPPv (Function, Global, .text) (stack frame size = 0)
|
215 |
+
|
216 |
+
Called functions : _ZN12mllib_graphs17slice_adf_wrapperILi1E8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_EEvRNS2_9io_bufferIT0_NS2_9direction2inET1_EERNSD_ISE_NSF_3outET2_EERA7_Kj
|
217 |
+
|
218 |
+
0x00003a70..0x00003a93 ( 36 items) : ../Release/0_0_reloadable23.o::_Z14_b1655_wrapperPPv (Function, Global, .text) (stack frame size = 0)
|
219 |
+
|
220 |
+
Called functions : _Z17superkernel_sub1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERNS0_IS1_NS2_3outESK_EE
|
221 |
+
|
222 |
+
0x00003aa0..0x00003ac3 ( 36 items) : ../Release/0_0_reloadable23.o::_Z13_b891_wrapperPPv (Function, Global, .text) (stack frame size = 0)
|
223 |
+
|
224 |
+
Called functions : _Z17superkernel_mul1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERNS0_IS1_NS2_3outESK_EE
|
225 |
+
|
226 |
+
0x00003ad0..0x00003e01 ( 818 items) : ../Release/0_0_reloadable23.o::_ZN12mllib_graphs18concat_adf_wrapperI8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_SC_EEvRNS2_9io_bufferIT_NS2_9direction2inET0_EERNSD_ISE_SG_T1_EERNSD_ISE_NSF_3outET2_EERA8_Kj (Function, Weak, .text) (stack frame size = 0)
|
227 |
+
|
228 |
+
Referenced symbols: _ZN9ns_concatL11kernel_iterE
|
229 |
+
_ZN12me_primitive11control_rndE
|
230 |
+
_ZN9ns_concatL8core_rowE
|
231 |
+
_ZN12me_primitive11control_satE
|
232 |
+
_ZN9ns_concatL8core_colE
|
233 |
+
|
234 |
+
0x00003e10..0x00003e33 ( 36 items) : ../Release/0_0_reloadable23.o::_Z13_b820_wrapperPPv (Function, Global, .text) (stack frame size = 0)
|
235 |
+
|
236 |
+
Called functions : _ZN12mllib_graphs18concat_adf_wrapperI8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_SC_EEvRNS2_9io_bufferIT_NS2_9direction2inET0_EERNSD_ISE_SG_T1_EERNSD_ISE_NSF_3outET2_EERA8_Kj
|
237 |
+
|
238 |
+
0x00003e40..0x00003e63 ( 36 items) : ../Release/0_0_reloadable23.o::_Z13_b896_wrapperPPv (Function, Global, .text) (stack frame size = 0)
|
239 |
+
|
240 |
+
Called functions : _Z14conv2d_maxpoolRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEESF_RA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE
|
241 |
+
|
242 |
+
0x00003e70..0x00003e8f ( 32 items) : ../Release/0_0_reloadable23.o::_Z14_b1672_wrapperPPv (Function, Global, .text) (stack frame size = 0)
|
243 |
+
|
244 |
+
Called functions : _Z18superkernel_tanh1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE
|
245 |
+
|
246 |
+
0x00003e90..0x00003eb3 ( 36 items) : ../Release/0_0_reloadable23.o::_Z13_b886_wrapperPPv (Function, Global, .text) (stack frame size = 0)
|
247 |
+
|
248 |
+
Called functions : _Z17superkernel_add1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERNS0_IS1_NS2_3outESK_EE
|
249 |
+
|
250 |
+
|
251 |
+
External symbols:
|
252 |
+
|
253 |
+
__dso_handle = 0x0
|
254 |
+
_ctors_end = 0x0
|
255 |
+
_ctors_start = 0x0
|
256 |
+
_dtors_end = 0x0
|
257 |
+
_dtors_start = 0x0
|
258 |
+
_pc_end = 0x3eb4
|
259 |
+
_pc_start = 0x930
|
260 |
+
_sp_end_DM_stack = 0x7c400
|
261 |
+
_sp_start_DM_stack = 0x7bac0
|
262 |
+
|
263 |
+
Section summary for memory 'DM_stack':
|
264 |
+
|
265 |
+
.stack File
|
266 |
+
---------- ----------
|
267 |
+
2368
|
268 |
+
---------- ----------
|
269 |
+
2368 Total
|
270 |
+
|
271 |
+
Section summary for memory 'DMb':
|
272 |
+
|
273 |
+
.bss .data .rodata File
|
274 |
+
---------- ---------- ---------- ----------
|
275 |
+
808 4 32 ../Release/0_0_reloadable23.o
|
276 |
+
5 0 0 me_defs.o(/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/Release/libme.a)
|
277 |
+
---------- ---------- ---------- ----------
|
278 |
+
813 4 32 Total
|
279 |
+
|
280 |
+
Section summary for memory 'PM':
|
281 |
+
|
282 |
+
.text File
|
283 |
+
---------- ----------
|
284 |
+
13444 ../Release/0_0_reloadable23.o
|
285 |
+
---------- ----------
|
286 |
+
13444 Total
|
287 |
+
|
288 |
+
File summary:
|
289 |
+
|
290 |
+
../Release/0_0_reloadable23.o
|
291 |
+
DMb 844
|
292 |
+
PM 13444
|
293 |
+
|
294 |
+
me_defs.o(/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/Release/libme.a)
|
295 |
+
DMb 5
|
296 |
+
|
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_2_reloadable23/Release/0_2_reloadable23.sdr
ADDED
@@ -0,0 +1,125 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
|
2 |
+
// File generated by bridge version V-2024.06#84922c0d9f#241219, Fri Mar 21 04:02:00 2025
|
3 |
+
// Copyright 2014-2024 Synopsys, Inc. All rights reserved.
|
4 |
+
// bridge -o../Release/0_0_reloadable23 ../Release/0_0_reloadable23.o -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/isg -g -I/usr/local/lib/python3.10/dist-packages/include -I/app/vaiml_1.3_examples/camo/./segmentation_1_4_0_fp32_combined/vaiml_par_0/0/backend -I/usr/local/lib/python3.10/site-packages/include/aie_api -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/common -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/include/common -I/usr/local/lib/python3.10/dist-packages/vitis_mllib -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/misc -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/src/ml_adf -I/app/vaiml_1.3_examples/camo/segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/. -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libcxx-lite/include -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libs/libcxx-9.0.0/include-lite -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime/include -D__AIENGINE__ -D__AIE_ARCH__=21 -DDEPLOYMENT_ELF=1 -D__LOCK_FENCE_MODE__=0 -D__IO_BUFFER_FORCE_LIGHT_WEIGHT__ -DAIE_API_EMULATE_BFLOAT16_MMUL_WITH_BFP16=1 -DAIE_OPTION_SCALAR_FLOAT_ON_VECTOR -D__tct_tgt__=241219 -c0_0_reloadable23.bcf -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/softfloat/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libcxx-lite/lib/Release_LLVM -lme -lc -lm -lc++lite -lsoftfloat -S -export-locals -iconfig extra_memories.bcf -yTM -m -fC -fS -fH +m -T +work ../Release/chesswork6583 -pme
|
5 |
+
|
6 |
+
// Release: ipp V-2024.06-TGT-241219
|
7 |
+
|
8 |
+
// Symbols in memory 'DM_bankA':
|
9 |
+
// Symbols in memory 'DM_bankAB':
|
10 |
+
// Symbols in memory 'DM_bankAC':
|
11 |
+
// Symbols in memory 'DM_bankAD':
|
12 |
+
// Symbols in memory 'DM_bankB':
|
13 |
+
// Symbols in memory 'DM_bankBC':
|
14 |
+
// Symbols in memory 'DM_bankBD':
|
15 |
+
// Symbols in memory 'DM_bankC':
|
16 |
+
// Symbols in memory 'DM_bankCD':
|
17 |
+
// Symbols in memory 'DM_bankD':
|
18 |
+
// Symbols in memory 'DM_stack':
|
19 |
+
// Symbols in memory 'DM_test':
|
20 |
+
// Symbols in memory 'DMb':
|
21 |
+
_symbol _ZN12me_primitive11control_satE 0x0007c46c
|
22 |
+
_symbol _ZN12me_primitive11control_rndE 0x0007c470
|
23 |
+
_symbol add1d_params 0x0007c4c0
|
24 |
+
_symbol mul1d_params 0x0007c500
|
25 |
+
_symbol sub1d_params 0x0007c540
|
26 |
+
_symbol sigmoid1d_params 0x0007c580
|
27 |
+
_symbol tanh1d_params 0x0007c5c0
|
28 |
+
_symbol conv2d_params 0x0007c600
|
29 |
+
// Symbols in memory 'DMh':
|
30 |
+
// Symbols in memory 'DMh_bankA':
|
31 |
+
// Symbols in memory 'DMh_bankAB':
|
32 |
+
// Symbols in memory 'DMh_bankAC':
|
33 |
+
// Symbols in memory 'DMh_bankAD':
|
34 |
+
// Symbols in memory 'DMh_bankB':
|
35 |
+
// Symbols in memory 'DMh_bankBC':
|
36 |
+
// Symbols in memory 'DMh_bankBD':
|
37 |
+
// Symbols in memory 'DMh_bankC':
|
38 |
+
// Symbols in memory 'DMh_bankCD':
|
39 |
+
// Symbols in memory 'DMh_bankD':
|
40 |
+
// Symbols in memory 'DMh_stack':
|
41 |
+
// Symbols in memory 'DMs':
|
42 |
+
// Symbols in memory 'DMs_bankA':
|
43 |
+
// Symbols in memory 'DMs_bankAB':
|
44 |
+
// Symbols in memory 'DMs_bankAC':
|
45 |
+
// Symbols in memory 'DMs_bankAD':
|
46 |
+
// Symbols in memory 'DMs_bankB':
|
47 |
+
// Symbols in memory 'DMs_bankBC':
|
48 |
+
// Symbols in memory 'DMs_bankBD':
|
49 |
+
// Symbols in memory 'DMs_bankC':
|
50 |
+
// Symbols in memory 'DMs_bankCD':
|
51 |
+
// Symbols in memory 'DMs_bankD':
|
52 |
+
// Symbols in memory 'DMs_stack':
|
53 |
+
// Symbols in memory 'DMv':
|
54 |
+
// Symbols in memory 'DMv_bankA':
|
55 |
+
// Symbols in memory 'DMv_bankAB':
|
56 |
+
// Symbols in memory 'DMv_bankAC':
|
57 |
+
// Symbols in memory 'DMv_bankAD':
|
58 |
+
// Symbols in memory 'DMv_bankB':
|
59 |
+
// Symbols in memory 'DMv_bankBC':
|
60 |
+
// Symbols in memory 'DMv_bankBD':
|
61 |
+
// Symbols in memory 'DMv_bankC':
|
62 |
+
// Symbols in memory 'DMv_bankCD':
|
63 |
+
// Symbols in memory 'DMv_bankD':
|
64 |
+
// Symbols in memory 'DMv_stack':
|
65 |
+
// Symbols in memory 'DMw':
|
66 |
+
// Symbols in memory 'DMw_bankA':
|
67 |
+
// Symbols in memory 'DMw_bankAB':
|
68 |
+
// Symbols in memory 'DMw_bankAC':
|
69 |
+
// Symbols in memory 'DMw_bankAD':
|
70 |
+
// Symbols in memory 'DMw_bankB':
|
71 |
+
// Symbols in memory 'DMw_bankBC':
|
72 |
+
// Symbols in memory 'DMw_bankBD':
|
73 |
+
// Symbols in memory 'DMw_bankC':
|
74 |
+
// Symbols in memory 'DMw_bankCD':
|
75 |
+
// Symbols in memory 'DMw_bankD':
|
76 |
+
// Symbols in memory 'DMw_stack':
|
77 |
+
// Symbols in memory 'DMx':
|
78 |
+
// Symbols in memory 'DMx_bankA':
|
79 |
+
// Symbols in memory 'DMx_bankAB':
|
80 |
+
// Symbols in memory 'DMx_bankAC':
|
81 |
+
// Symbols in memory 'DMx_bankAD':
|
82 |
+
// Symbols in memory 'DMx_bankB':
|
83 |
+
// Symbols in memory 'DMx_bankBC':
|
84 |
+
// Symbols in memory 'DMx_bankBD':
|
85 |
+
// Symbols in memory 'DMx_bankC':
|
86 |
+
// Symbols in memory 'DMx_bankCD':
|
87 |
+
// Symbols in memory 'DMx_bankD':
|
88 |
+
// Symbols in memory 'DMx_stack':
|
89 |
+
// Symbols in memory 'PM':
|
90 |
+
_symbol _Z13kernelWrapperPPvjjjj 0x00000930
|
91 |
+
_symbol _Z24setup_conv2d_bf16_paramsILb1ELb0EEvPKjR18conv2d_bf16_paramshh 0x00000b60
|
92 |
+
_symbol _Z21convert_bf16_to_bfp16I8bfloat16Lb0EEvPT_PS0_RK13BfToBfpParams 0x00001100
|
93 |
+
_symbol _Z11conv2d_bf16ILh1EL5act_t0E8bfloat16S1_S1_N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_NS3_IS5_NS6_5asyncES9_SB_EELb0ELb0ELb1ELb0EEvRNS2_9io_bufferIT1_NS2_9direction2inET4_EERNSF_IT2_SI_T5_EERNSF_IT3_NSH_3outET6_EER18conv2d_bf16_params 0x00001210
|
94 |
+
_symbol _Z14conv2d_maxpoolRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEESF_RA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE 0x00001b80
|
95 |
+
_symbol _ZN17elementwise_unaryI8bfloat1619elementwise_sigmoidIS0_E26sigmoid_templated_params_tIS0_EE5setupER26elementwise_unary_params_tIS4_EPKv 0x00001fe0
|
96 |
+
_symbol _ZN17elementwise_unaryI8bfloat1619elementwise_sigmoidIS0_E26sigmoid_templated_params_tIS0_EE3runEPS0_S6_R26elementwise_unary_params_tIS4_E 0x00002020
|
97 |
+
_symbol _Z21superkernel_sigmoid1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE 0x000021a0
|
98 |
+
_symbol _ZN17elementwise_unaryI8bfloat1616elementwise_tanhIS0_E23tanh_templated_params_tIS0_EE5setupER26elementwise_unary_params_tIS4_EPKv 0x00002390
|
99 |
+
_symbol _ZN17elementwise_unaryI8bfloat1616elementwise_tanhIS0_E23tanh_templated_params_tIS0_EE3runEPS0_S6_R26elementwise_unary_params_tIS4_E 0x000023d0
|
100 |
+
_symbol _Z18superkernel_tanh1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE 0x000027a0
|
101 |
+
_symbol _ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE21shared_setup_backboneER27elementwise_binary_params_tIS5_EPKv 0x00002990
|
102 |
+
_symbol _ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE5setupER27elementwise_binary_params_tIS5_EPKv 0x00002a10
|
103 |
+
_symbol _ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE3runEPS0_S7_S7_R27elementwise_binary_params_tIS5_E 0x00002a80
|
104 |
+
_symbol _Z17superkernel_add1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERNS0_IS1_NS2_3outESK_EE 0x00002a90
|
105 |
+
_symbol _ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS4_E 0x00002cf0
|
106 |
+
_symbol _ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS4_EPKv 0x00002d10
|
107 |
+
_symbol _ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE3runEPS0_S6_S6_R27elementwise_binary_params_tIS4_E 0x00002da0
|
108 |
+
_symbol _Z17superkernel_mul1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERNS0_IS1_NS2_3outESK_EE 0x00002ed0
|
109 |
+
_symbol _ZN25elementwise_binary_sharedI8bfloat168sub_implIS0_E15shared_params_tIS0_EL5act_t0EE21shared_setup_backboneER27elementwise_binary_params_tIS4_EPKv 0x00003130
|
110 |
+
_symbol _ZN25elementwise_binary_sharedI8bfloat168sub_implIS0_E15shared_params_tIS0_EL5act_t0EE5setupER27elementwise_binary_params_tIS4_EPKv 0x000031b0
|
111 |
+
_symbol _ZN25elementwise_binary_sharedI8bfloat168sub_implIS0_E15shared_params_tIS0_EL5act_t0EE3runEPS0_S7_S7_R27elementwise_binary_params_tIS4_E 0x00003200
|
112 |
+
_symbol _Z17superkernel_sub1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERNS0_IS1_NS2_3outESK_EE 0x00003210
|
113 |
+
_symbol _Z14_b1638_wrapperPPv 0x00003470
|
114 |
+
_symbol _Z11slice_hcwc8I8bfloat16EvPT_S2_R18slice_hcwc8_params 0x00003490
|
115 |
+
_symbol _ZN12mllib_graphs17slice_adf_wrapperILi1E8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_EEvRNS2_9io_bufferIT0_NS2_9direction2inET1_EERNSD_ISE_NSF_3outET2_EERA7_Kj 0x000037a0
|
116 |
+
_symbol _Z13_b806_wrapperPPv 0x00003a50
|
117 |
+
_symbol _Z14_b1655_wrapperPPv 0x00003a70
|
118 |
+
_symbol _Z13_b891_wrapperPPv 0x00003aa0
|
119 |
+
_symbol _ZN12mllib_graphs18concat_adf_wrapperI8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_SC_EEvRNS2_9io_bufferIT_NS2_9direction2inET0_EERNSD_ISE_SG_T1_EERNSD_ISE_NSF_3outET2_EERA8_Kj 0x00003ad0
|
120 |
+
_symbol _Z13_b820_wrapperPPv 0x00003e10
|
121 |
+
_symbol _Z13_b896_wrapperPPv 0x00003e40
|
122 |
+
_symbol _Z14_b1672_wrapperPPv 0x00003e70
|
123 |
+
_symbol _Z13_b886_wrapperPPv 0x00003e90
|
124 |
+
// Symbols in memory 'PMw':
|
125 |
+
// Symbols in memory 'TM4':
|
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_2_reloadable23/Release/0_2_reloadable23.srv
ADDED
The diff for this file is too large to render.
See raw diff
|
|
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_2_reloadable23/Release/0_2_reloadable23.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_2_reloadable23/scripts/0_2_reloadable23.bcf
ADDED
@@ -0,0 +1,16 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
_reserved DMb 0x0 0x40000
|
2 |
+
|
3 |
+
_reserved PM 0x0 0x930 //reserved for main elf
|
4 |
+
|
5 |
+
_entry_point _Z13kernelWrapperPPvjjjj
|
6 |
+
_symbol _Z13kernelWrapperPPvjjjj 0x930
|
7 |
+
|
8 |
+
_reserved DMb 0x7b280 0x800 //reserved for lcp ping-pong buffers
|
9 |
+
_reserved DMb 0x7ba80 0x40 //reserved for sync buffer
|
10 |
+
_stack DM_stack 0x7bac0 0x940 //stack for core
|
11 |
+
_reserved DMb 0x7c400 0x40 //reserved for main elf heap
|
12 |
+
//space for synopsys compiler at 0x7c440 0x880//heap
|
13 |
+
_reserved DMb 0x40000 0x3b280
|
14 |
+
|
15 |
+
_reserved DMb 0x7ccc0 0x3340
|
16 |
+
_reserved DMb 0x80000 0x80000 // And everything else the core can't see
|
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_2_reloadable23/scripts/0_2_reloadable23.prx
ADDED
@@ -0,0 +1,13 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
<project name="Project" processor="me">
|
2 |
+
<issinit/>
|
3 |
+
<option id="cpp.define" value="__AIENGINE__ __AIE_ARCH__=21" inherit = "1"/>
|
4 |
+
<option id="llvm.xargs" value="-fno-jump-tables -fno-discard-value-names" inherit = "1"/>
|
5 |
+
<option id="llvm.lang" value="Follow file extension"/>
|
6 |
+
<option id="bridge.cfg" value="0_2_reloadable23.bcf"/>
|
7 |
+
<option id="bridge.alibs" value=" ../Release/0_2_reloadable23.o" inherit="1" cfg="Release_LLVM"/>
|
8 |
+
<option id="cpp.include" value="<XILINX_VITIS_AIETOOLS>/include /app/vaiml_1.3_examples/camo/./segmentation_1_4_0_fp32_combined/vaiml_par_0/0/backend /usr/local/lib/python3.10/site-packages/include/aie_api /usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/common /usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/include/common /usr/local/lib/python3.10/dist-packages/vitis_mllib /usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/misc /usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/src/ml_adf /app/vaiml_1.3_examples/camo/segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/<AIE_SRC_DIR> " inherit="1"/>
|
9 |
+
<option id="project.dir" value="<CONFIG>/0_2_reloadable23"/>
|
10 |
+
<option id="project.name" value="0_2_reloadable23"/>
|
11 |
+
<option id="project.type" value="exe"/>
|
12 |
+
<option id="simrun.issca" value="<XILINX_VITIS_AIETOOLS>/bin/unwrapped/lnx64.o/aie2p/ca_udm_dbg" inherit="0"/>
|
13 |
+
</project>
|
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_2_reloadable23/src/0_2_reloadable23.cc
ADDED
@@ -0,0 +1,124 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
// Automatically generated processor driver using AIEngine tool-chain
|
2 |
+
|
3 |
+
#include <stdio.h>
|
4 |
+
#include <memory>
|
5 |
+
#include <adf.h>
|
6 |
+
|
7 |
+
|
8 |
+
// Declare Kernel functions and initializers
|
9 |
+
void superkernel_sigmoid1d(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict,const unsigned int (&)[16],adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict);
|
10 |
+
#include "slice_adf_wrapper.cpp"
|
11 |
+
void superkernel_sub1d(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict,const unsigned int (&)[16],adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict,adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict);
|
12 |
+
void superkernel_mul1d(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict,const unsigned int (&)[16],adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict,adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict);
|
13 |
+
#include "concat_adf_wrapper.cpp"
|
14 |
+
void conv2d_maxpool(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict,adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict,const unsigned int (&)[16],adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict);
|
15 |
+
void superkernel_tanh1d(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict,const unsigned int (&)[16],adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict);
|
16 |
+
void superkernel_add1d(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict,const unsigned int (&)[16],adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict,adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict);
|
17 |
+
|
18 |
+
// Declare Kernel objects and external arrays
|
19 |
+
|
20 |
+
|
21 |
+
void _b1638_wrapper(void* args[])
|
22 |
+
{
|
23 |
+
superkernel_sigmoid1d(
|
24 |
+
*reinterpret_cast<adf::input_buffer_conf<bfloat16, adf::bpc_sync_0d>*>(args[0]),
|
25 |
+
*reinterpret_cast<uint32 const(*)[16]>(args[2]),
|
26 |
+
*reinterpret_cast<adf::output_buffer_conf<bfloat16, adf::bpc_async_0d>*>(args[1]));
|
27 |
+
}
|
28 |
+
|
29 |
+
void _b806_wrapper(void* args[])
|
30 |
+
{
|
31 |
+
mllib_graphs::slice_adf_wrapper<1, bfloat16, adf::io_buffer_config<adf::extents<>>, adf::io_buffer_config<adf::extents<>>>(
|
32 |
+
*reinterpret_cast<adf::input_buffer_conf<bfloat16, adf::bpc_sync_0d>*>(args[0]),
|
33 |
+
*reinterpret_cast<adf::output_buffer_conf<bfloat16, adf::bpc_sync_0d>*>(args[1]),
|
34 |
+
*reinterpret_cast<uint32 const(*)[7]>(args[2]));
|
35 |
+
}
|
36 |
+
|
37 |
+
void _b1655_wrapper(void* args[])
|
38 |
+
{
|
39 |
+
superkernel_sub1d(
|
40 |
+
*reinterpret_cast<adf::input_buffer_conf<bfloat16, adf::bpc_sync_0d>*>(args[0]),
|
41 |
+
*reinterpret_cast<uint32 const(*)[16]>(args[3]),
|
42 |
+
*reinterpret_cast<adf::input_buffer_conf<bfloat16, adf::bpc_async_0d>*>(args[1]),
|
43 |
+
*reinterpret_cast<adf::output_buffer_conf<bfloat16, adf::bpc_async_0d>*>(args[2]));
|
44 |
+
}
|
45 |
+
|
46 |
+
void _b891_wrapper(void* args[])
|
47 |
+
{
|
48 |
+
superkernel_mul1d(
|
49 |
+
*reinterpret_cast<adf::input_buffer_conf<bfloat16, adf::bpc_sync_0d>*>(args[0]),
|
50 |
+
*reinterpret_cast<uint32 const(*)[16]>(args[3]),
|
51 |
+
*reinterpret_cast<adf::input_buffer_conf<bfloat16, adf::bpc_async_0d>*>(args[1]),
|
52 |
+
*reinterpret_cast<adf::output_buffer_conf<bfloat16, adf::bpc_async_0d>*>(args[2]));
|
53 |
+
}
|
54 |
+
|
55 |
+
void _b820_wrapper(void* args[])
|
56 |
+
{
|
57 |
+
mllib_graphs::concat_adf_wrapper<bfloat16, adf::io_buffer_config<adf::extents<>>, adf::io_buffer_config<adf::extents<>>, adf::io_buffer_config<adf::extents<>>>(
|
58 |
+
*reinterpret_cast<adf::input_buffer_conf<bfloat16, adf::bpc_sync_0d>*>(args[0]),
|
59 |
+
*reinterpret_cast<adf::input_buffer_conf<bfloat16, adf::bpc_sync_0d>*>(args[1]),
|
60 |
+
*reinterpret_cast<adf::output_buffer_conf<bfloat16, adf::bpc_sync_0d>*>(args[2]),
|
61 |
+
*reinterpret_cast<uint32 const(*)[8]>(args[3]));
|
62 |
+
}
|
63 |
+
|
64 |
+
void _b896_wrapper(void* args[])
|
65 |
+
{
|
66 |
+
conv2d_maxpool(
|
67 |
+
*reinterpret_cast<adf::input_buffer_conf<bfloat16, adf::bpc_sync_0d>*>(args[0]),
|
68 |
+
*reinterpret_cast<adf::input_buffer_conf<bfloat16, adf::bpc_sync_0d>*>(args[1]),
|
69 |
+
*reinterpret_cast<uint32 const(*)[16]>(args[3]),
|
70 |
+
*reinterpret_cast<adf::output_buffer_conf<bfloat16, adf::bpc_async_0d>*>(args[2]));
|
71 |
+
}
|
72 |
+
|
73 |
+
void _b1672_wrapper(void* args[])
|
74 |
+
{
|
75 |
+
superkernel_tanh1d(
|
76 |
+
*reinterpret_cast<adf::input_buffer_conf<bfloat16, adf::bpc_sync_0d>*>(args[0]),
|
77 |
+
*reinterpret_cast<uint32 const(*)[16]>(args[2]),
|
78 |
+
*reinterpret_cast<adf::output_buffer_conf<bfloat16, adf::bpc_async_0d>*>(args[1]));
|
79 |
+
}
|
80 |
+
|
81 |
+
void _b886_wrapper(void* args[])
|
82 |
+
{
|
83 |
+
superkernel_add1d(
|
84 |
+
*reinterpret_cast<adf::input_buffer_conf<bfloat16, adf::bpc_sync_0d>*>(args[0]),
|
85 |
+
*reinterpret_cast<uint32 const(*)[16]>(args[3]),
|
86 |
+
*reinterpret_cast<adf::input_buffer_conf<bfloat16, adf::bpc_async_0d>*>(args[1]),
|
87 |
+
*reinterpret_cast<adf::output_buffer_conf<bfloat16, adf::bpc_async_0d>*>(args[2]));
|
88 |
+
}
|
89 |
+
|
90 |
+
using UniformKernelFunc = void (*)(void **);
|
91 |
+
|
92 |
+
static UniformKernelFunc g_uniformKernelFuncs[8] = {
|
93 |
+
_b1638_wrapper,
|
94 |
+
_b806_wrapper,
|
95 |
+
_b1655_wrapper,
|
96 |
+
_b891_wrapper,
|
97 |
+
_b820_wrapper,
|
98 |
+
_b896_wrapper,
|
99 |
+
_b1672_wrapper,
|
100 |
+
_b886_wrapper
|
101 |
+
};
|
102 |
+
|
103 |
+
__attribute__((always_inline)) void kernelWrapper(void* args[], uint32 kernelId, uint32 numSyncIn, uint32 numAsyncIn, uint32 numSyncOut)
|
104 |
+
{
|
105 |
+
uint32 idx = 0;
|
106 |
+
reinterpret_cast<adf::_io_buffer_light_weight_generic*>(args[idx])->acquire<adf::direction::in>(numSyncIn > 0);
|
107 |
+
idx += (numSyncIn > 0) ? 1 : 0;
|
108 |
+
reinterpret_cast<adf::_io_buffer_light_weight_generic*>(args[idx])->acquire<adf::direction::in>(numSyncIn > 1);
|
109 |
+
idx += (numSyncIn > 1) ? 1 : 0;
|
110 |
+
idx += numAsyncIn;
|
111 |
+
reinterpret_cast<adf::_io_buffer_light_weight_generic*>(args[idx])->acquire<adf::direction::out>(numSyncOut > 0);
|
112 |
+
idx += (numSyncOut > 0) ? 1 : 0;
|
113 |
+
|
114 |
+
(*(g_uniformKernelFuncs[kernelId]))(args);
|
115 |
+
|
116 |
+
idx = 0;
|
117 |
+
reinterpret_cast<adf::_io_buffer_light_weight_generic*>(args[idx])->release<adf::direction::in>(numSyncIn > 0);
|
118 |
+
idx += (numSyncIn > 0) ? 1 : 0;
|
119 |
+
reinterpret_cast<adf::_io_buffer_light_weight_generic*>(args[idx])->release<adf::direction::in>(numSyncIn > 1);
|
120 |
+
idx += (numSyncIn > 1) ? 1 : 0;
|
121 |
+
idx += numAsyncIn;
|
122 |
+
reinterpret_cast<adf::_io_buffer_light_weight_generic*>(args[idx])->release<adf::direction::out>(numSyncOut > 0);
|
123 |
+
idx += (numSyncOut > 0) ? 1 : 0;
|
124 |
+
}
|
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_2_reloadable24/Release/0_2_reloadable24.calltree
ADDED
@@ -0,0 +1,88 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
|
2 |
+
// File generated by bridge version V-2024.06#84922c0d9f#241219, Fri Mar 21 04:03:19 2025
|
3 |
+
// Copyright 2014-2024 Synopsys, Inc. All rights reserved.
|
4 |
+
// bridge -o../Release/0_0_reloadable24 ../Release/0_0_reloadable24.o -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/isg -g -I/usr/local/lib/python3.10/dist-packages/include -I/app/vaiml_1.3_examples/camo/./segmentation_1_4_0_fp32_combined/vaiml_par_0/0/backend -I/usr/local/lib/python3.10/site-packages/include/aie_api -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/common -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/include/common -I/usr/local/lib/python3.10/dist-packages/vitis_mllib -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/misc -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/src/ml_adf -I/app/vaiml_1.3_examples/camo/segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/. -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libcxx-lite/include -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libs/libcxx-9.0.0/include-lite -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime/include -D__AIENGINE__ -D__AIE_ARCH__=21 -DDEPLOYMENT_ELF=1 -D__LOCK_FENCE_MODE__=0 -D__IO_BUFFER_FORCE_LIGHT_WEIGHT__ -DAIE_API_EMULATE_BFLOAT16_MMUL_WITH_BFP16=1 -DAIE_OPTION_SCALAR_FLOAT_ON_VECTOR -D__tct_tgt__=241219 -c0_0_reloadable24.bcf -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/softfloat/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libcxx-lite/lib/Release_LLVM -lme -lc -lm -lc++lite -lsoftfloat -S -export-locals -iconfig extra_memories.bcf -yTM -m -fC -fS -fH +m -T +work ../Release/chesswork6947 -pme
|
5 |
+
|
6 |
+
|
7 |
+
// Release: ipp V-2024.06-TGT-241219
|
8 |
+
|
9 |
+
_Z13kernelWrapperPPvjjjj
|
10 |
+
_Z13_b853_wrapperPPv (referenced text)
|
11 |
+
_ZN12mllib_graphs18resize_adf_wrapperI8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_Li1ELi0ELi2EEEvRNS2_9io_bufferIT_NS2_9direction2inET0_EERNSD_ISE_NSF_3outET1_EERA16_Kj
|
12 |
+
_Z23resize_bilinear_scale_2I8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_S0_EEvPS1_PfS2_jjjj
|
13 |
+
_Z13_b896_wrapperPPv (referenced text)
|
14 |
+
_Z14conv2d_maxpoolRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEESF_RA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE
|
15 |
+
_Z24setup_conv2d_bf16_paramsILb1ELb0EEvPKjR18conv2d_bf16_paramshh
|
16 |
+
_Z11conv2d_bf16ILh1EL5act_t0E8bfloat16S1_S1_N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_NS3_IS5_NS6_5asyncES9_SB_EELb0ELb0ELb1ELb0EEvRNS2_9io_bufferIT1_NS2_9direction2inET4_EERNSF_IT2_SI_T5_EERNSF_IT3_NSH_3outET6_EER18conv2d_bf16_params
|
17 |
+
_Z21convert_bf16_to_bfp16I8bfloat16Lb0EEvPT_PS0_RK13BfToBfpParams
|
18 |
+
_Z14_b1638_wrapperPPv (referenced text)
|
19 |
+
_Z21superkernel_sigmoid1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE
|
20 |
+
_ZN17elementwise_unaryI8bfloat1619elementwise_sigmoidIS0_E26sigmoid_templated_params_tIS0_EE5setupER26elementwise_unary_params_tIS4_EPKv
|
21 |
+
_ZN17elementwise_unaryI8bfloat1619elementwise_sigmoidIS0_E26sigmoid_templated_params_tIS0_EE3runEPS0_S6_R26elementwise_unary_params_tIS4_E
|
22 |
+
_Z14_b1655_wrapperPPv (referenced text)
|
23 |
+
_Z17superkernel_sub1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERNS0_IS1_NS2_3outESK_EE
|
24 |
+
_ZN25elementwise_binary_sharedI8bfloat168sub_implIS0_E15shared_params_tIS0_EL5act_t0EE5setupER27elementwise_binary_params_tIS4_EPKv
|
25 |
+
_ZN25elementwise_binary_sharedI8bfloat168sub_implIS0_E15shared_params_tIS0_EL5act_t0EE21shared_setup_backboneER27elementwise_binary_params_tIS4_EPKv
|
26 |
+
_ZN25elementwise_binary_sharedI8bfloat168sub_implIS0_E15shared_params_tIS0_EL5act_t0EE3runEPS0_S7_S7_R27elementwise_binary_params_tIS4_E
|
27 |
+
_ZL19shared_run_backboneI8bfloat16L5act_t0EEKvPT_S4_S4_R27elementwise_binary_params_tI15shared_params_tIS3_EE
|
28 |
+
_Z13_b891_wrapperPPv (referenced text)
|
29 |
+
_Z17superkernel_mul1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERNS0_IS1_NS2_3outESK_EE
|
30 |
+
_ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS4_EPKv
|
31 |
+
_ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS4_E
|
32 |
+
_ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE3runEPS0_S6_S6_R27elementwise_binary_params_tIS4_E
|
33 |
+
_Z14_b1672_wrapperPPv (referenced text)
|
34 |
+
_Z18superkernel_tanh1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE
|
35 |
+
_ZN17elementwise_unaryI8bfloat1616elementwise_tanhIS0_E23tanh_templated_params_tIS0_EE5setupER26elementwise_unary_params_tIS4_EPKv
|
36 |
+
_ZN17elementwise_unaryI8bfloat1616elementwise_tanhIS0_E23tanh_templated_params_tIS0_EE3runEPS0_S6_R26elementwise_unary_params_tIS4_E
|
37 |
+
_Z13_b886_wrapperPPv (referenced text)
|
38 |
+
_Z17superkernel_add1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERNS0_IS1_NS2_3outESK_EE
|
39 |
+
_ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE5setupER27elementwise_binary_params_tIS5_EPKv
|
40 |
+
_ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE21shared_setup_backboneER27elementwise_binary_params_tIS5_EPKv
|
41 |
+
_ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE3runEPS0_S7_S7_R27elementwise_binary_params_tIS5_E
|
42 |
+
_ZL19shared_run_backboneI8bfloat16L5act_t0EEKvPT_S4_S4_R27elementwise_binary_params_tI15shared_params_tIS3_EE (*)
|
43 |
+
|
44 |
+
|
45 |
+
Call tree stack and functions sizes:
|
46 |
+
|
47 |
+
stack stack stack call func func function name
|
48 |
+
desc level level desc
|
49 |
+
----- ----- ----- ----- ----- ----- --------------------------------------------------------------
|
50 |
+
64 512 0 0 546 13188 _Z13kernelWrapperPPvjjjj
|
51 |
+
0 0 1 1 32 2086 _Z13_b853_wrapperPPv
|
52 |
+
0 0 1 2 470 2054 _ZN12mllib_graphs18resize_adf_wrapperI8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_Li1ELi0ELi2EEEvRNS2_9io_bufferIT_NS2_9direction2inET0_EERNSD_ISE_NSF_3outET1_EERA16_Kj <tail call>
|
53 |
+
0 0 1 3 1584 1584 _Z23resize_bilinear_scale_2I8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_S0_EEvPS1_PfS2_jjjj <tail call>
|
54 |
+
0 192 1 1 36 4714 _Z13_b896_wrapperPPv
|
55 |
+
64 192 1 2 568 4678 _Z14conv2d_maxpoolRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEESF_RA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE <tail call>
|
56 |
+
64 64 2 3 1430 1430 _Z24setup_conv2d_bf16_paramsILb1ELb0EEvPKjR18conv2d_bf16_paramshh
|
57 |
+
128 128 2 3 2410 2680 _Z11conv2d_bf16ILh1EL5act_t0E8bfloat16S1_S1_N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_NS3_IS5_NS6_5asyncES9_SB_EELb0ELb0ELb1ELb0EEvRNS2_9io_bufferIT1_NS2_9direction2inET4_EERNSF_IT2_SI_T5_EERNSF_IT3_NSH_3outET6_EER18conv2d_bf16_params
|
58 |
+
0 0 3 4 270 270 _Z21convert_bf16_to_bfp16I8bfloat16Lb0EEvPT_PS0_RK13BfToBfpParams
|
59 |
+
0 64 1 1 32 960 _Z14_b1638_wrapperPPv
|
60 |
+
64 64 1 2 488 928 _Z21superkernel_sigmoid1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE <tail call>
|
61 |
+
0 0 2 3 62 62 _ZN17elementwise_unaryI8bfloat1619elementwise_sigmoidIS0_E26sigmoid_templated_params_tIS0_EE5setupER26elementwise_unary_params_tIS4_EPKv
|
62 |
+
0 0 2 3 378 378 _ZN17elementwise_unaryI8bfloat1619elementwise_sigmoidIS0_E26sigmoid_templated_params_tIS0_EE3runEPS0_S6_R26elementwise_unary_params_tIS4_E
|
63 |
+
0 192 1 1 36 1378 _Z14_b1655_wrapperPPv
|
64 |
+
64 192 1 2 602 1342 _Z17superkernel_sub1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERNS0_IS1_NS2_3outESK_EE <tail call>
|
65 |
+
64 64 2 3 74 190 _ZN25elementwise_binary_sharedI8bfloat168sub_implIS0_E15shared_params_tIS0_EL5act_t0EE5setupER27elementwise_binary_params_tIS4_EPKv
|
66 |
+
0 0 3 4 116 116 _ZN25elementwise_binary_sharedI8bfloat168sub_implIS0_E15shared_params_tIS0_EL5act_t0EE21shared_setup_backboneER27elementwise_binary_params_tIS4_EPKv
|
67 |
+
0 128 2 3 16 550 _ZN25elementwise_binary_sharedI8bfloat168sub_implIS0_E15shared_params_tIS0_EL5act_t0EE3runEPS0_S7_S7_R27elementwise_binary_params_tIS4_E
|
68 |
+
128 128 2 4 534 534 _ZL19shared_run_backboneI8bfloat16L5act_t0EEKvPT_S4_S4_R27elementwise_binary_params_tI15shared_params_tIS3_EE <tail call>
|
69 |
+
0 128 1 1 36 1092 _Z13_b891_wrapperPPv
|
70 |
+
64 128 1 2 602 1056 _Z17superkernel_mul1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERNS0_IS1_NS2_3outESK_EE <tail call>
|
71 |
+
64 64 2 3 138 162 _ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS4_EPKv
|
72 |
+
0 0 3 4 24 24 _ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS4_E
|
73 |
+
0 0 2 3 292 292 _ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE3runEPS0_S6_S6_R27elementwise_binary_params_tIS4_E
|
74 |
+
0 448 1 1 32 1544 _Z14_b1672_wrapperPPv
|
75 |
+
64 448 1 2 488 1512 _Z18superkernel_tanh1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE <tail call>
|
76 |
+
0 0 2 3 62 62 _ZN17elementwise_unaryI8bfloat1616elementwise_tanhIS0_E23tanh_templated_params_tIS0_EE5setupER26elementwise_unary_params_tIS4_EPKv
|
77 |
+
384 384 2 3 962 962 _ZN17elementwise_unaryI8bfloat1616elementwise_tanhIS0_E23tanh_templated_params_tIS0_EE3runEPS0_S6_R26elementwise_unary_params_tIS4_E
|
78 |
+
0 192 1 1 36 1402 _Z13_b886_wrapperPPv
|
79 |
+
64 192 1 2 602 1366 _Z17superkernel_add1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERNS0_IS1_NS2_3outESK_EE <tail call>
|
80 |
+
64 64 2 3 98 214 _ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE5setupER27elementwise_binary_params_tIS5_EPKv
|
81 |
+
0 0 3 4 116 116 _ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE21shared_setup_backboneER27elementwise_binary_params_tIS5_EPKv
|
82 |
+
0 128 2 3 16 550 _ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE3runEPS0_S7_S7_R27elementwise_binary_params_tIS5_E
|
83 |
+
128 128 2 4 534 534 _ZL19shared_run_backboneI8bfloat16L5act_t0EEKvPT_S4_S4_R27elementwise_binary_params_tI15shared_params_tIS3_EE <tail call>
|
84 |
+
|
85 |
+
|
86 |
+
Maximum call level : 4
|
87 |
+
Maximum stack level: 3
|
88 |
+
Maximum stack size : 512
|
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_2_reloadable24/Release/0_2_reloadable24.cmic2
ADDED
The diff for this file is too large to render.
See raw diff
|
|
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_2_reloadable24/Release/0_2_reloadable24.cmico
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
+Mdec
|
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_2_reloadable24/Release/0_2_reloadable24.lst
ADDED
The diff for this file is too large to render.
See raw diff
|
|
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_2_reloadable24/Release/0_2_reloadable24.map
ADDED
@@ -0,0 +1,294 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
|
2 |
+
// File generated by bridge version V-2024.06#84922c0d9f#241219, Fri Mar 21 04:03:20 2025
|
3 |
+
// Copyright 2014-2024 Synopsys, Inc. All rights reserved.
|
4 |
+
// bridge -o../Release/0_0_reloadable24 ../Release/0_0_reloadable24.o -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/isg -g -I/usr/local/lib/python3.10/dist-packages/include -I/app/vaiml_1.3_examples/camo/./segmentation_1_4_0_fp32_combined/vaiml_par_0/0/backend -I/usr/local/lib/python3.10/site-packages/include/aie_api -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/common -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/include/common -I/usr/local/lib/python3.10/dist-packages/vitis_mllib -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/misc -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/src/ml_adf -I/app/vaiml_1.3_examples/camo/segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/. -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libcxx-lite/include -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libs/libcxx-9.0.0/include-lite -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime/include -D__AIENGINE__ -D__AIE_ARCH__=21 -DDEPLOYMENT_ELF=1 -D__LOCK_FENCE_MODE__=0 -D__IO_BUFFER_FORCE_LIGHT_WEIGHT__ -DAIE_API_EMULATE_BFLOAT16_MMUL_WITH_BFP16=1 -DAIE_OPTION_SCALAR_FLOAT_ON_VECTOR -D__tct_tgt__=241219 -c0_0_reloadable24.bcf -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/softfloat/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libcxx-lite/lib/Release_LLVM -lme -lc -lm -lc++lite -lsoftfloat -S -export-locals -iconfig extra_memories.bcf -yTM -m -fC -fS -fH +m -T +work ../Release/chesswork6947 -pme
|
5 |
+
|
6 |
+
// Release: ipp V-2024.06-TGT-241219
|
7 |
+
|
8 |
+
Memory map for memory 'DM_stack':
|
9 |
+
|
10 |
+
Size = 1048576
|
11 |
+
Width = 8 bits
|
12 |
+
Offset = 0
|
13 |
+
Used = 2368
|
14 |
+
|
15 |
+
0x0007bac0..0x0007c3ff ( 2368 items) : Stack
|
16 |
+
|
17 |
+
Memory map for memory 'DMb':
|
18 |
+
|
19 |
+
Size = 1048576
|
20 |
+
Width = 8 bits
|
21 |
+
Offset = 0
|
22 |
+
Used = 3397
|
23 |
+
|
24 |
+
0x00000000..0x0007babf ( 506560 items) : Reserved
|
25 |
+
0x0007bac0..0x0007c3ff ( 2368 items) : Stack
|
26 |
+
0x0007c400..0x0007c43f ( 64 items) : Reserved
|
27 |
+
0x0007c440..0x0007c443 ( 4 items) : ../Release/0_0_reloadable24.o::_ZL9curr_iter (Data, Local, .bss.DMb.4)
|
28 |
+
0x0007c444..0x0007c447 ( 4 items) : ../Release/0_0_reloadable24.o::_ZL14num_depth_iter (Data, Local, .bss.DMb.4)
|
29 |
+
0x0007c448..0x0007c44b ( 4 items) : ../Release/0_0_reloadable24.o::_ZL10depth_iter (Data, Local, .bss.DMb.4)
|
30 |
+
0x0007c44c..0x0007c44f ( 4 items) : ../Release/0_0_reloadable24.o::_ZL11total_iters (Data, Local, .bss.DMb.4)
|
31 |
+
0x0007c450..0x0007c453 ( 4 items) : ../Release/0_0_reloadable24.o::_ZL8core_row (Data, Local, .bss.DMb.4)
|
32 |
+
0x0007c454..0x0007c457 ( 4 items) : ../Release/0_0_reloadable24.o::_ZL11ifm1_offset (Data, Local, .bss.DMb.4)
|
33 |
+
0x0007c458..0x0007c45b ( 4 items) : ../Release/0_0_reloadable24.o::_ZL11ifm2_offset (Data, Local, .bss.DMb.4)
|
34 |
+
0x0007c45c..0x0007c45f ( 4 items) : ../Release/0_0_reloadable24.o::_ZZN12mllib_graphs18resize_adf_wrapperI8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_Li1ELi0ELi2EEEvRNS2_9io_bufferIT_NS2_9direction2inET0_EERNSD_ISE_NSF_3outET1_EERA16_KjE8cur_iter (Data, Weak, .bss.DMb.4)
|
35 |
+
0x0007c460..0x0007c463 ( 4 items) : ../Release/0_0_reloadable24.o::_ZL8num_iter (Data, Local, .data.DMb.4)
|
36 |
+
0x0007c464..0x0007c467 ( 4 items) : me_defs.o(/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/Release/libme.a)::_ZN12me_primitive11control_satE (Data, Global, .bss.DMb.4)
|
37 |
+
0x0007c468..0x0007c468 ( 1 items) : me_defs.o(/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/Release/libme.a)::_ZN12me_primitive11control_rndE (Data, Global, .bss.DMb.1)
|
38 |
+
0x0007c480..0x0007c49b ( 28 items) : ../Release/0_0_reloadable24.o::_ZL20g_uniformKernelFuncs (Data, Local, .rodata.DMb.64)
|
39 |
+
|
40 |
+
Called functions : _Z13_b853_wrapperPPv
|
41 |
+
_Z13_b896_wrapperPPv
|
42 |
+
_Z14_b1638_wrapperPPv
|
43 |
+
_Z14_b1655_wrapperPPv
|
44 |
+
_Z13_b891_wrapperPPv
|
45 |
+
_Z14_b1672_wrapperPPv
|
46 |
+
_Z13_b886_wrapperPPv
|
47 |
+
|
48 |
+
0x0007c4c0..0x0007c4df ( 32 items) : ../Release/0_0_reloadable24.o::__const____Z23resize_bilinear_scale_2I8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_S0_EEvPS1_PfS2_jjjj___coeffs (Data, Local, .rodata.DMb.64)
|
49 |
+
0x0007c500..0x0007c51f ( 32 items) : ../Release/0_0_reloadable24.o::__const____Z23resize_bilinear_scale_2I8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_S0_EEvPS1_PfS2_jjjj___coeffs_asymmetric (Data, Local, .rodata.DMb.64)
|
50 |
+
0x0007c540..0x0007c57f ( 64 items) : ../Release/0_0_reloadable24.o::add1d_params (Data, Global, .bss.DMb.64)
|
51 |
+
0x0007c580..0x0007c5bf ( 64 items) : ../Release/0_0_reloadable24.o::mul1d_params (Data, Global, .bss.DMb.64)
|
52 |
+
0x0007c5c0..0x0007c5ff ( 64 items) : ../Release/0_0_reloadable24.o::sub1d_params (Data, Global, .bss.DMb.64)
|
53 |
+
0x0007c600..0x0007c63f ( 64 items) : ../Release/0_0_reloadable24.o::sigmoid1d_params (Data, Global, .bss.DMb.64)
|
54 |
+
0x0007c640..0x0007c67f ( 64 items) : ../Release/0_0_reloadable24.o::tanh1d_params (Data, Global, .bss.DMb.64)
|
55 |
+
0x0007c680..0x0007c83f ( 448 items) : ../Release/0_0_reloadable24.o::conv2d_params (Data, Global, .bss.DMb.64)
|
56 |
+
0x0007c840..0x0007c8bf ( 128 items) : ../Release/0_0_reloadable24.o::_ZZN12mllib_graphs18resize_adf_wrapperI8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_Li1ELi0ELi2EEEvRNS2_9io_bufferIT_NS2_9direction2inET0_EERNSD_ISE_NSF_3outET1_EERA16_KjE6params (Data, Weak, .bss.DMb.64)
|
57 |
+
0x0007ccc0..0x000fffff ( 537408 items) : Reserved
|
58 |
+
|
59 |
+
Memory map for memory 'PM':
|
60 |
+
|
61 |
+
Size = 1048576
|
62 |
+
Width = 8 bits
|
63 |
+
Offset = 0
|
64 |
+
Used = 13188
|
65 |
+
|
66 |
+
0x00000000..0x0000092f ( 2352 items) : Reserved
|
67 |
+
0x00000930..0x00000b51 ( 546 items) : ../Release/0_0_reloadable24.o::_Z13kernelWrapperPPvjjjj (Function, Global, .text) (stack frame size = 64)
|
68 |
+
|
69 |
+
Referenced symbols: _ZL20g_uniformKernelFuncs
|
70 |
+
|
71 |
+
0x00000b60..0x000010f5 ( 1430 items) : ../Release/0_0_reloadable24.o::_Z24setup_conv2d_bf16_paramsILb1ELb0EEvPKjR18conv2d_bf16_paramshh (Function, Weak, .text) (stack frame size = 64)
|
72 |
+
0x00001100..0x0000120d ( 270 items) : ../Release/0_0_reloadable24.o::_Z21convert_bf16_to_bfp16I8bfloat16Lb0EEvPT_PS0_RK13BfToBfpParams (Function, Weak, .text) (stack frame size = 0)
|
73 |
+
|
74 |
+
Referenced symbols: _ZN12me_primitive11control_rndE
|
75 |
+
|
76 |
+
0x00001210..0x00001b79 ( 2410 items) : ../Release/0_0_reloadable24.o::_Z11conv2d_bf16ILh1EL5act_t0E8bfloat16S1_S1_N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_NS3_IS5_NS6_5asyncES9_SB_EELb0ELb0ELb1ELb0EEvRNS2_9io_bufferIT1_NS2_9direction2inET4_EERNSF_IT2_SI_T5_EERNSF_IT3_NSH_3outET6_EER18conv2d_bf16_params (Function, Weak, .text) (stack frame size = 128)
|
77 |
+
|
78 |
+
Called functions : _Z21convert_bf16_to_bfp16I8bfloat16Lb0EEvPT_PS0_RK13BfToBfpParams
|
79 |
+
|
80 |
+
Referenced symbols: _ZN12me_primitive11control_rndE
|
81 |
+
|
82 |
+
0x00001b80..0x00001db7 ( 568 items) : ../Release/0_0_reloadable24.o::_Z14conv2d_maxpoolRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEESF_RA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE (Function, Global, .text) (stack frame size = 64)
|
83 |
+
|
84 |
+
Called functions : _Z24setup_conv2d_bf16_paramsILb1ELb0EEvPKjR18conv2d_bf16_paramshh
|
85 |
+
_Z11conv2d_bf16ILh1EL5act_t0E8bfloat16S1_S1_N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_NS3_IS5_NS6_5asyncES9_SB_EELb0ELb0ELb1ELb0EEvRNS2_9io_bufferIT1_NS2_9direction2inET4_EERNSF_IT2_SI_T5_EERNSF_IT3_NSH_3outET6_EER18conv2d_bf16_params
|
86 |
+
|
87 |
+
Referenced symbols: _ZL9curr_iter
|
88 |
+
conv2d_params
|
89 |
+
_ZN12me_primitive11control_rndE
|
90 |
+
_ZN12me_primitive11control_satE
|
91 |
+
_ZL14num_depth_iter
|
92 |
+
_ZL8num_iter
|
93 |
+
_ZL10depth_iter
|
94 |
+
_ZL11total_iters
|
95 |
+
|
96 |
+
0x00001dc0..0x00001fd5 ( 534 items) : ../Release/0_0_reloadable24.o::_ZL19shared_run_backboneI8bfloat16L5act_t0EEKvPT_S4_S4_R27elementwise_binary_params_tI15shared_params_tIS3_EE (Function, Local, .text) (stack frame size = 128)
|
97 |
+
|
98 |
+
Referenced symbols: _ZN12me_primitive11control_rndE
|
99 |
+
|
100 |
+
0x00001fe0..0x0000201d ( 62 items) : ../Release/0_0_reloadable24.o::_ZN17elementwise_unaryI8bfloat1619elementwise_sigmoidIS0_E26sigmoid_templated_params_tIS0_EE5setupER26elementwise_unary_params_tIS4_EPKv (Function, Weak, .text) (stack frame size = 0)
|
101 |
+
0x00002020..0x00002199 ( 378 items) : ../Release/0_0_reloadable24.o::_ZN17elementwise_unaryI8bfloat1619elementwise_sigmoidIS0_E26sigmoid_templated_params_tIS0_EE3runEPS0_S6_R26elementwise_unary_params_tIS4_E (Function, Weak, .text) (stack frame size = 0)
|
102 |
+
|
103 |
+
Referenced symbols: _ZN12me_primitive11control_rndE
|
104 |
+
|
105 |
+
0x000021a0..0x00002387 ( 488 items) : ../Release/0_0_reloadable24.o::_Z21superkernel_sigmoid1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE (Function, Global, .text) (stack frame size = 64)
|
106 |
+
|
107 |
+
Called functions : _ZN17elementwise_unaryI8bfloat1619elementwise_sigmoidIS0_E26sigmoid_templated_params_tIS0_EE5setupER26elementwise_unary_params_tIS4_EPKv
|
108 |
+
_ZN17elementwise_unaryI8bfloat1619elementwise_sigmoidIS0_E26sigmoid_templated_params_tIS0_EE3runEPS0_S6_R26elementwise_unary_params_tIS4_E
|
109 |
+
|
110 |
+
Referenced symbols: _ZL9curr_iter
|
111 |
+
_ZL8core_row
|
112 |
+
sigmoid1d_params
|
113 |
+
_ZN12me_primitive11control_rndE
|
114 |
+
_ZN12me_primitive11control_satE
|
115 |
+
_ZL11ifm1_offset
|
116 |
+
_ZL8num_iter
|
117 |
+
|
118 |
+
0x00002390..0x000023cd ( 62 items) : ../Release/0_0_reloadable24.o::_ZN17elementwise_unaryI8bfloat1616elementwise_tanhIS0_E23tanh_templated_params_tIS0_EE5setupER26elementwise_unary_params_tIS4_EPKv (Function, Weak, .text) (stack frame size = 0)
|
119 |
+
0x000023d0..0x00002791 ( 962 items) : ../Release/0_0_reloadable24.o::_ZN17elementwise_unaryI8bfloat1616elementwise_tanhIS0_E23tanh_templated_params_tIS0_EE3runEPS0_S6_R26elementwise_unary_params_tIS4_E (Function, Weak, .text) (stack frame size = 384)
|
120 |
+
|
121 |
+
Referenced symbols: _ZN12me_primitive11control_rndE
|
122 |
+
|
123 |
+
0x000027a0..0x00002987 ( 488 items) : ../Release/0_0_reloadable24.o::_Z18superkernel_tanh1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE (Function, Global, .text) (stack frame size = 64)
|
124 |
+
|
125 |
+
Called functions : _ZN17elementwise_unaryI8bfloat1616elementwise_tanhIS0_E23tanh_templated_params_tIS0_EE5setupER26elementwise_unary_params_tIS4_EPKv
|
126 |
+
_ZN17elementwise_unaryI8bfloat1616elementwise_tanhIS0_E23tanh_templated_params_tIS0_EE3runEPS0_S6_R26elementwise_unary_params_tIS4_E
|
127 |
+
|
128 |
+
Referenced symbols: _ZL9curr_iter
|
129 |
+
_ZL8core_row
|
130 |
+
tanh1d_params
|
131 |
+
_ZN12me_primitive11control_rndE
|
132 |
+
_ZN12me_primitive11control_satE
|
133 |
+
_ZL11ifm1_offset
|
134 |
+
_ZL8num_iter
|
135 |
+
|
136 |
+
0x00002990..0x00002a03 ( 116 items) : ../Release/0_0_reloadable24.o::_ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE21shared_setup_backboneER27elementwise_binary_params_tIS5_EPKv (Function, Weak, .text) (stack frame size = 0)
|
137 |
+
0x00002a10..0x00002a71 ( 98 items) : ../Release/0_0_reloadable24.o::_ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE5setupER27elementwise_binary_params_tIS5_EPKv (Function, Weak, .text) (stack frame size = 64)
|
138 |
+
|
139 |
+
Called functions : _ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE21shared_setup_backboneER27elementwise_binary_params_tIS5_EPKv
|
140 |
+
|
141 |
+
0x00002a80..0x00002a8f ( 16 items) : ../Release/0_0_reloadable24.o::_ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE3runEPS0_S7_S7_R27elementwise_binary_params_tIS5_E (Function, Weak, .text) (stack frame size = 0)
|
142 |
+
|
143 |
+
Called functions : _ZL19shared_run_backboneI8bfloat16L5act_t0EEKvPT_S4_S4_R27elementwise_binary_params_tI15shared_params_tIS3_EE
|
144 |
+
|
145 |
+
0x00002a90..0x00002ce9 ( 602 items) : ../Release/0_0_reloadable24.o::_Z17superkernel_add1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERNS0_IS1_NS2_3outESK_EE (Function, Global, .text) (stack frame size = 64)
|
146 |
+
|
147 |
+
Called functions : _ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE5setupER27elementwise_binary_params_tIS5_EPKv
|
148 |
+
_ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE3runEPS0_S7_S7_R27elementwise_binary_params_tIS5_E
|
149 |
+
|
150 |
+
Referenced symbols: _ZL9curr_iter
|
151 |
+
_ZL8core_row
|
152 |
+
add1d_params
|
153 |
+
_ZN12me_primitive11control_rndE
|
154 |
+
_ZN12me_primitive11control_satE
|
155 |
+
_ZL11ifm1_offset
|
156 |
+
_ZL11ifm2_offset
|
157 |
+
_ZL8num_iter
|
158 |
+
|
159 |
+
0x00002cf0..0x00002d07 ( 24 items) : ../Release/0_0_reloadable24.o::_ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS4_E (Function, Weak, .text) (stack frame size = 0)
|
160 |
+
0x00002d10..0x00002d99 ( 138 items) : ../Release/0_0_reloadable24.o::_ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS4_EPKv (Function, Weak, .text) (stack frame size = 64)
|
161 |
+
|
162 |
+
Called functions : _ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS4_E
|
163 |
+
|
164 |
+
0x00002da0..0x00002ec3 ( 292 items) : ../Release/0_0_reloadable24.o::_ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE3runEPS0_S6_S6_R27elementwise_binary_params_tIS4_E (Function, Weak, .text) (stack frame size = 0)
|
165 |
+
|
166 |
+
Referenced symbols: _ZN12me_primitive11control_rndE
|
167 |
+
|
168 |
+
0x00002ed0..0x00003129 ( 602 items) : ../Release/0_0_reloadable24.o::_Z17superkernel_mul1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERNS0_IS1_NS2_3outESK_EE (Function, Global, .text) (stack frame size = 64)
|
169 |
+
|
170 |
+
Called functions : _ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS4_EPKv
|
171 |
+
_ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE3runEPS0_S6_S6_R27elementwise_binary_params_tIS4_E
|
172 |
+
|
173 |
+
Referenced symbols: _ZL9curr_iter
|
174 |
+
_ZL8core_row
|
175 |
+
mul1d_params
|
176 |
+
_ZN12me_primitive11control_rndE
|
177 |
+
_ZN12me_primitive11control_satE
|
178 |
+
_ZL11ifm1_offset
|
179 |
+
_ZL11ifm2_offset
|
180 |
+
_ZL8num_iter
|
181 |
+
|
182 |
+
0x00003130..0x000031a3 ( 116 items) : ../Release/0_0_reloadable24.o::_ZN25elementwise_binary_sharedI8bfloat168sub_implIS0_E15shared_params_tIS0_EL5act_t0EE21shared_setup_backboneER27elementwise_binary_params_tIS4_EPKv (Function, Weak, .text) (stack frame size = 0)
|
183 |
+
0x000031b0..0x000031f9 ( 74 items) : ../Release/0_0_reloadable24.o::_ZN25elementwise_binary_sharedI8bfloat168sub_implIS0_E15shared_params_tIS0_EL5act_t0EE5setupER27elementwise_binary_params_tIS4_EPKv (Function, Weak, .text) (stack frame size = 64)
|
184 |
+
|
185 |
+
Called functions : _ZN25elementwise_binary_sharedI8bfloat168sub_implIS0_E15shared_params_tIS0_EL5act_t0EE21shared_setup_backboneER27elementwise_binary_params_tIS4_EPKv
|
186 |
+
|
187 |
+
0x00003200..0x0000320f ( 16 items) : ../Release/0_0_reloadable24.o::_ZN25elementwise_binary_sharedI8bfloat168sub_implIS0_E15shared_params_tIS0_EL5act_t0EE3runEPS0_S7_S7_R27elementwise_binary_params_tIS4_E (Function, Weak, .text) (stack frame size = 0)
|
188 |
+
|
189 |
+
Called functions : _ZL19shared_run_backboneI8bfloat16L5act_t0EEKvPT_S4_S4_R27elementwise_binary_params_tI15shared_params_tIS3_EE
|
190 |
+
|
191 |
+
0x00003210..0x00003469 ( 602 items) : ../Release/0_0_reloadable24.o::_Z17superkernel_sub1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERNS0_IS1_NS2_3outESK_EE (Function, Global, .text) (stack frame size = 64)
|
192 |
+
|
193 |
+
Called functions : _ZN25elementwise_binary_sharedI8bfloat168sub_implIS0_E15shared_params_tIS0_EL5act_t0EE5setupER27elementwise_binary_params_tIS4_EPKv
|
194 |
+
_ZN25elementwise_binary_sharedI8bfloat168sub_implIS0_E15shared_params_tIS0_EL5act_t0EE3runEPS0_S7_S7_R27elementwise_binary_params_tIS4_E
|
195 |
+
|
196 |
+
Referenced symbols: _ZL9curr_iter
|
197 |
+
_ZL8core_row
|
198 |
+
sub1d_params
|
199 |
+
_ZN12me_primitive11control_rndE
|
200 |
+
_ZN12me_primitive11control_satE
|
201 |
+
_ZL11ifm1_offset
|
202 |
+
_ZL11ifm2_offset
|
203 |
+
_ZL8num_iter
|
204 |
+
|
205 |
+
0x00003470..0x00003a9f ( 1584 items) : ../Release/0_0_reloadable24.o::_Z23resize_bilinear_scale_2I8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_S0_EEvPS1_PfS2_jjjj (Function, Weak, .text) (stack frame size = 0)
|
206 |
+
|
207 |
+
Referenced symbols: __const____Z23resize_bilinear_scale_2I8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_S0_EEvPS1_PfS2_jjjj___coeffs
|
208 |
+
__const____Z23resize_bilinear_scale_2I8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_S0_EEvPS1_PfS2_jjjj___coeffs_asymmetric
|
209 |
+
_ZN12me_primitive11control_rndE
|
210 |
+
|
211 |
+
0x00003aa0..0x00003c75 ( 470 items) : ../Release/0_0_reloadable24.o::_ZN12mllib_graphs18resize_adf_wrapperI8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_Li1ELi0ELi2EEEvRNS2_9io_bufferIT_NS2_9direction2inET0_EERNSD_ISE_NSF_3outET1_EERA16_Kj (Function, Weak, .text) (stack frame size = 0)
|
212 |
+
|
213 |
+
Called functions : _Z23resize_bilinear_scale_2I8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_S0_EEvPS1_PfS2_jjjj
|
214 |
+
|
215 |
+
Referenced symbols: _ZZN12mllib_graphs18resize_adf_wrapperI8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_Li1ELi0ELi2EEEvRNS2_9io_bufferIT_NS2_9direction2inET0_EERNSD_ISE_NSF_3outET1_EERA16_KjE8cur_iter
|
216 |
+
_ZN12me_primitive11control_satE
|
217 |
+
_ZN12me_primitive11control_rndE
|
218 |
+
_ZZN12mllib_graphs18resize_adf_wrapperI8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_Li1ELi0ELi2EEEvRNS2_9io_bufferIT_NS2_9direction2inET0_EERNSD_ISE_NSF_3outET1_EERA16_KjE6params
|
219 |
+
|
220 |
+
0x00003c80..0x00003c9f ( 32 items) : ../Release/0_0_reloadable24.o::_Z13_b853_wrapperPPv (Function, Global, .text) (stack frame size = 0)
|
221 |
+
|
222 |
+
Called functions : _ZN12mllib_graphs18resize_adf_wrapperI8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_Li1ELi0ELi2EEEvRNS2_9io_bufferIT_NS2_9direction2inET0_EERNSD_ISE_NSF_3outET1_EERA16_Kj
|
223 |
+
|
224 |
+
0x00003ca0..0x00003cc3 ( 36 items) : ../Release/0_0_reloadable24.o::_Z13_b896_wrapperPPv (Function, Global, .text) (stack frame size = 0)
|
225 |
+
|
226 |
+
Called functions : _Z14conv2d_maxpoolRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEESF_RA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE
|
227 |
+
|
228 |
+
0x00003cd0..0x00003cef ( 32 items) : ../Release/0_0_reloadable24.o::_Z14_b1638_wrapperPPv (Function, Global, .text) (stack frame size = 0)
|
229 |
+
|
230 |
+
Called functions : _Z21superkernel_sigmoid1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE
|
231 |
+
|
232 |
+
0x00003cf0..0x00003d13 ( 36 items) : ../Release/0_0_reloadable24.o::_Z14_b1655_wrapperPPv (Function, Global, .text) (stack frame size = 0)
|
233 |
+
|
234 |
+
Called functions : _Z17superkernel_sub1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERNS0_IS1_NS2_3outESK_EE
|
235 |
+
|
236 |
+
0x00003d20..0x00003d43 ( 36 items) : ../Release/0_0_reloadable24.o::_Z13_b891_wrapperPPv (Function, Global, .text) (stack frame size = 0)
|
237 |
+
|
238 |
+
Called functions : _Z17superkernel_mul1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERNS0_IS1_NS2_3outESK_EE
|
239 |
+
|
240 |
+
0x00003d50..0x00003d6f ( 32 items) : ../Release/0_0_reloadable24.o::_Z14_b1672_wrapperPPv (Function, Global, .text) (stack frame size = 0)
|
241 |
+
|
242 |
+
Called functions : _Z18superkernel_tanh1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE
|
243 |
+
|
244 |
+
0x00003d70..0x00003d93 ( 36 items) : ../Release/0_0_reloadable24.o::_Z13_b886_wrapperPPv (Function, Global, .text) (stack frame size = 0)
|
245 |
+
|
246 |
+
Called functions : _Z17superkernel_add1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERNS0_IS1_NS2_3outESK_EE
|
247 |
+
|
248 |
+
|
249 |
+
External symbols:
|
250 |
+
|
251 |
+
__dso_handle = 0x0
|
252 |
+
_ctors_end = 0x0
|
253 |
+
_ctors_start = 0x0
|
254 |
+
_dtors_end = 0x0
|
255 |
+
_dtors_start = 0x0
|
256 |
+
_pc_end = 0x3d94
|
257 |
+
_pc_start = 0x930
|
258 |
+
_sp_end_DM_stack = 0x7c400
|
259 |
+
_sp_start_DM_stack = 0x7bac0
|
260 |
+
|
261 |
+
Section summary for memory 'DM_stack':
|
262 |
+
|
263 |
+
.stack File
|
264 |
+
---------- ----------
|
265 |
+
2368
|
266 |
+
---------- ----------
|
267 |
+
2368 Total
|
268 |
+
|
269 |
+
Section summary for memory 'DMb':
|
270 |
+
|
271 |
+
.bss .data .rodata File
|
272 |
+
---------- ---------- ---------- ----------
|
273 |
+
928 4 92 ../Release/0_0_reloadable24.o
|
274 |
+
5 0 0 me_defs.o(/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/Release/libme.a)
|
275 |
+
---------- ---------- ---------- ----------
|
276 |
+
933 4 92 Total
|
277 |
+
|
278 |
+
Section summary for memory 'PM':
|
279 |
+
|
280 |
+
.text File
|
281 |
+
---------- ----------
|
282 |
+
13188 ../Release/0_0_reloadable24.o
|
283 |
+
---------- ----------
|
284 |
+
13188 Total
|
285 |
+
|
286 |
+
File summary:
|
287 |
+
|
288 |
+
../Release/0_0_reloadable24.o
|
289 |
+
DMb 1024
|
290 |
+
PM 13188
|
291 |
+
|
292 |
+
me_defs.o(/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/Release/libme.a)
|
293 |
+
DMb 5
|
294 |
+
|
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_2_reloadable24/Release/0_2_reloadable24.sdr
ADDED
@@ -0,0 +1,125 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
|
2 |
+
// File generated by bridge version V-2024.06#84922c0d9f#241219, Fri Mar 21 04:03:20 2025
|
3 |
+
// Copyright 2014-2024 Synopsys, Inc. All rights reserved.
|
4 |
+
// bridge -o../Release/0_0_reloadable24 ../Release/0_0_reloadable24.o -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/isg -g -I/usr/local/lib/python3.10/dist-packages/include -I/app/vaiml_1.3_examples/camo/./segmentation_1_4_0_fp32_combined/vaiml_par_0/0/backend -I/usr/local/lib/python3.10/site-packages/include/aie_api -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/common -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/include/common -I/usr/local/lib/python3.10/dist-packages/vitis_mllib -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/misc -I/usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/src/ml_adf -I/app/vaiml_1.3_examples/camo/segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/. -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libcxx-lite/include -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libs/libcxx-9.0.0/include-lite -I/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime/include -D__AIENGINE__ -D__AIE_ARCH__=21 -DDEPLOYMENT_ELF=1 -D__LOCK_FENCE_MODE__=0 -D__IO_BUFFER_FORCE_LIGHT_WEIGHT__ -DAIE_API_EMULATE_BFLOAT16_MMUL_WITH_BFP16=1 -DAIE_OPTION_SCALAR_FLOAT_ON_VECTOR -D__tct_tgt__=241219 -c0_0_reloadable24.bcf -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/softfloat/lib/Release -L/usr/local/lib/python3.10/dist-packages/data/aie2p/lib/runtime_cxx/libcxx-lite/lib/Release_LLVM -lme -lc -lm -lc++lite -lsoftfloat -S -export-locals -iconfig extra_memories.bcf -yTM -m -fC -fS -fH +m -T +work ../Release/chesswork6947 -pme
|
5 |
+
|
6 |
+
// Release: ipp V-2024.06-TGT-241219
|
7 |
+
|
8 |
+
// Symbols in memory 'DM_bankA':
|
9 |
+
// Symbols in memory 'DM_bankAB':
|
10 |
+
// Symbols in memory 'DM_bankAC':
|
11 |
+
// Symbols in memory 'DM_bankAD':
|
12 |
+
// Symbols in memory 'DM_bankB':
|
13 |
+
// Symbols in memory 'DM_bankBC':
|
14 |
+
// Symbols in memory 'DM_bankBD':
|
15 |
+
// Symbols in memory 'DM_bankC':
|
16 |
+
// Symbols in memory 'DM_bankCD':
|
17 |
+
// Symbols in memory 'DM_bankD':
|
18 |
+
// Symbols in memory 'DM_stack':
|
19 |
+
// Symbols in memory 'DM_test':
|
20 |
+
// Symbols in memory 'DMb':
|
21 |
+
_symbol _ZZN12mllib_graphs18resize_adf_wrapperI8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_Li1ELi0ELi2EEEvRNS2_9io_bufferIT_NS2_9direction2inET0_EERNSD_ISE_NSF_3outET1_EERA16_KjE8cur_iter 0x0007c45c
|
22 |
+
_symbol _ZN12me_primitive11control_satE 0x0007c464
|
23 |
+
_symbol _ZN12me_primitive11control_rndE 0x0007c468
|
24 |
+
_symbol add1d_params 0x0007c540
|
25 |
+
_symbol mul1d_params 0x0007c580
|
26 |
+
_symbol sub1d_params 0x0007c5c0
|
27 |
+
_symbol sigmoid1d_params 0x0007c600
|
28 |
+
_symbol tanh1d_params 0x0007c640
|
29 |
+
_symbol conv2d_params 0x0007c680
|
30 |
+
_symbol _ZZN12mllib_graphs18resize_adf_wrapperI8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_Li1ELi0ELi2EEEvRNS2_9io_bufferIT_NS2_9direction2inET0_EERNSD_ISE_NSF_3outET1_EERA16_KjE6params 0x0007c840
|
31 |
+
// Symbols in memory 'DMh':
|
32 |
+
// Symbols in memory 'DMh_bankA':
|
33 |
+
// Symbols in memory 'DMh_bankAB':
|
34 |
+
// Symbols in memory 'DMh_bankAC':
|
35 |
+
// Symbols in memory 'DMh_bankAD':
|
36 |
+
// Symbols in memory 'DMh_bankB':
|
37 |
+
// Symbols in memory 'DMh_bankBC':
|
38 |
+
// Symbols in memory 'DMh_bankBD':
|
39 |
+
// Symbols in memory 'DMh_bankC':
|
40 |
+
// Symbols in memory 'DMh_bankCD':
|
41 |
+
// Symbols in memory 'DMh_bankD':
|
42 |
+
// Symbols in memory 'DMh_stack':
|
43 |
+
// Symbols in memory 'DMs':
|
44 |
+
// Symbols in memory 'DMs_bankA':
|
45 |
+
// Symbols in memory 'DMs_bankAB':
|
46 |
+
// Symbols in memory 'DMs_bankAC':
|
47 |
+
// Symbols in memory 'DMs_bankAD':
|
48 |
+
// Symbols in memory 'DMs_bankB':
|
49 |
+
// Symbols in memory 'DMs_bankBC':
|
50 |
+
// Symbols in memory 'DMs_bankBD':
|
51 |
+
// Symbols in memory 'DMs_bankC':
|
52 |
+
// Symbols in memory 'DMs_bankCD':
|
53 |
+
// Symbols in memory 'DMs_bankD':
|
54 |
+
// Symbols in memory 'DMs_stack':
|
55 |
+
// Symbols in memory 'DMv':
|
56 |
+
// Symbols in memory 'DMv_bankA':
|
57 |
+
// Symbols in memory 'DMv_bankAB':
|
58 |
+
// Symbols in memory 'DMv_bankAC':
|
59 |
+
// Symbols in memory 'DMv_bankAD':
|
60 |
+
// Symbols in memory 'DMv_bankB':
|
61 |
+
// Symbols in memory 'DMv_bankBC':
|
62 |
+
// Symbols in memory 'DMv_bankBD':
|
63 |
+
// Symbols in memory 'DMv_bankC':
|
64 |
+
// Symbols in memory 'DMv_bankCD':
|
65 |
+
// Symbols in memory 'DMv_bankD':
|
66 |
+
// Symbols in memory 'DMv_stack':
|
67 |
+
// Symbols in memory 'DMw':
|
68 |
+
// Symbols in memory 'DMw_bankA':
|
69 |
+
// Symbols in memory 'DMw_bankAB':
|
70 |
+
// Symbols in memory 'DMw_bankAC':
|
71 |
+
// Symbols in memory 'DMw_bankAD':
|
72 |
+
// Symbols in memory 'DMw_bankB':
|
73 |
+
// Symbols in memory 'DMw_bankBC':
|
74 |
+
// Symbols in memory 'DMw_bankBD':
|
75 |
+
// Symbols in memory 'DMw_bankC':
|
76 |
+
// Symbols in memory 'DMw_bankCD':
|
77 |
+
// Symbols in memory 'DMw_bankD':
|
78 |
+
// Symbols in memory 'DMw_stack':
|
79 |
+
// Symbols in memory 'DMx':
|
80 |
+
// Symbols in memory 'DMx_bankA':
|
81 |
+
// Symbols in memory 'DMx_bankAB':
|
82 |
+
// Symbols in memory 'DMx_bankAC':
|
83 |
+
// Symbols in memory 'DMx_bankAD':
|
84 |
+
// Symbols in memory 'DMx_bankB':
|
85 |
+
// Symbols in memory 'DMx_bankBC':
|
86 |
+
// Symbols in memory 'DMx_bankBD':
|
87 |
+
// Symbols in memory 'DMx_bankC':
|
88 |
+
// Symbols in memory 'DMx_bankCD':
|
89 |
+
// Symbols in memory 'DMx_bankD':
|
90 |
+
// Symbols in memory 'DMx_stack':
|
91 |
+
// Symbols in memory 'PM':
|
92 |
+
_symbol _Z13kernelWrapperPPvjjjj 0x00000930
|
93 |
+
_symbol _Z24setup_conv2d_bf16_paramsILb1ELb0EEvPKjR18conv2d_bf16_paramshh 0x00000b60
|
94 |
+
_symbol _Z21convert_bf16_to_bfp16I8bfloat16Lb0EEvPT_PS0_RK13BfToBfpParams 0x00001100
|
95 |
+
_symbol _Z11conv2d_bf16ILh1EL5act_t0E8bfloat16S1_S1_N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_NS3_IS5_NS6_5asyncES9_SB_EELb0ELb0ELb1ELb0EEvRNS2_9io_bufferIT1_NS2_9direction2inET4_EERNSF_IT2_SI_T5_EERNSF_IT3_NSH_3outET6_EER18conv2d_bf16_params 0x00001210
|
96 |
+
_symbol _Z14conv2d_maxpoolRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEESF_RA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE 0x00001b80
|
97 |
+
_symbol _ZN17elementwise_unaryI8bfloat1619elementwise_sigmoidIS0_E26sigmoid_templated_params_tIS0_EE5setupER26elementwise_unary_params_tIS4_EPKv 0x00001fe0
|
98 |
+
_symbol _ZN17elementwise_unaryI8bfloat1619elementwise_sigmoidIS0_E26sigmoid_templated_params_tIS0_EE3runEPS0_S6_R26elementwise_unary_params_tIS4_E 0x00002020
|
99 |
+
_symbol _Z21superkernel_sigmoid1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE 0x000021a0
|
100 |
+
_symbol _ZN17elementwise_unaryI8bfloat1616elementwise_tanhIS0_E23tanh_templated_params_tIS0_EE5setupER26elementwise_unary_params_tIS4_EPKv 0x00002390
|
101 |
+
_symbol _ZN17elementwise_unaryI8bfloat1616elementwise_tanhIS0_E23tanh_templated_params_tIS0_EE3runEPS0_S6_R26elementwise_unary_params_tIS4_E 0x000023d0
|
102 |
+
_symbol _Z18superkernel_tanh1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_NS2_3outENS4_IS6_NS7_5asyncESA_SC_EEEE 0x000027a0
|
103 |
+
_symbol _ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE21shared_setup_backboneER27elementwise_binary_params_tIS5_EPKv 0x00002990
|
104 |
+
_symbol _ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE5setupER27elementwise_binary_params_tIS5_EPKv 0x00002a10
|
105 |
+
_symbol _ZN25elementwise_binary_sharedI8bfloat168add_implIS0_L5act_t0EE15shared_params_tIS0_ELS2_0EE3runEPS0_S7_S7_R27elementwise_binary_params_tIS5_E 0x00002a80
|
106 |
+
_symbol _Z17superkernel_add1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERNS0_IS1_NS2_3outESK_EE 0x00002a90
|
107 |
+
_symbol _ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS4_E 0x00002cf0
|
108 |
+
_symbol _ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE5setupER27elementwise_binary_params_tIS4_EPKv 0x00002d10
|
109 |
+
_symbol _ZN18elementwise_binaryIJ8bfloat168mul_implIS0_E15shared_params_tIS0_EEE3runEPS0_S6_S6_R27elementwise_binary_params_tIS4_E 0x00002da0
|
110 |
+
_symbol _Z17superkernel_mul1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERNS0_IS1_NS2_3outESK_EE 0x00002ed0
|
111 |
+
_symbol _ZN25elementwise_binary_sharedI8bfloat168sub_implIS0_E15shared_params_tIS0_EL5act_t0EE21shared_setup_backboneER27elementwise_binary_params_tIS4_EPKv 0x00003130
|
112 |
+
_symbol _ZN25elementwise_binary_sharedI8bfloat168sub_implIS0_E15shared_params_tIS0_EL5act_t0EE5setupER27elementwise_binary_params_tIS4_EPKv 0x000031b0
|
113 |
+
_symbol _ZN25elementwise_binary_sharedI8bfloat168sub_implIS0_E15shared_params_tIS0_EL5act_t0EE3runEPS0_S7_S7_R27elementwise_binary_params_tIS4_E 0x00003200
|
114 |
+
_symbol _Z17superkernel_sub1dRN3adf9io_bufferI8bfloat16NS_9direction2inENS_16io_buffer_configINS_7extentsIJEEENS_7locking4syncENS_10addressing6linearENS_6marginILj0EEEEEEERA16_KjRNS0_IS1_S3_NS4_IS6_NS7_5asyncESA_SC_EEEERNS0_IS1_NS2_3outESK_EE 0x00003210
|
115 |
+
_symbol _Z23resize_bilinear_scale_2I8bfloat16Qsr5mllib5utilsE11is_one_of_vIT_S0_EEvPS1_PfS2_jjjj 0x00003470
|
116 |
+
_symbol _ZN12mllib_graphs18resize_adf_wrapperI8bfloat16N3adf16io_buffer_configINS2_7extentsIJEEENS2_7locking4syncENS2_10addressing6linearENS2_6marginILj0EEEEESC_Li1ELi0ELi2EEEvRNS2_9io_bufferIT_NS2_9direction2inET0_EERNSD_ISE_NSF_3outET1_EERA16_Kj 0x00003aa0
|
117 |
+
_symbol _Z13_b853_wrapperPPv 0x00003c80
|
118 |
+
_symbol _Z13_b896_wrapperPPv 0x00003ca0
|
119 |
+
_symbol _Z14_b1638_wrapperPPv 0x00003cd0
|
120 |
+
_symbol _Z14_b1655_wrapperPPv 0x00003cf0
|
121 |
+
_symbol _Z13_b891_wrapperPPv 0x00003d20
|
122 |
+
_symbol _Z14_b1672_wrapperPPv 0x00003d50
|
123 |
+
_symbol _Z13_b886_wrapperPPv 0x00003d70
|
124 |
+
// Symbols in memory 'PMw':
|
125 |
+
// Symbols in memory 'TM4':
|
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_2_reloadable24/Release/0_2_reloadable24.srv
ADDED
The diff for this file is too large to render.
See raw diff
|
|
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_2_reloadable24/Release/0_2_reloadable24.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_2_reloadable24/scripts/0_2_reloadable24.bcf
ADDED
@@ -0,0 +1,16 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
_reserved DMb 0x0 0x40000
|
2 |
+
|
3 |
+
_reserved PM 0x0 0x930 //reserved for main elf
|
4 |
+
|
5 |
+
_entry_point _Z13kernelWrapperPPvjjjj
|
6 |
+
_symbol _Z13kernelWrapperPPvjjjj 0x930
|
7 |
+
|
8 |
+
_reserved DMb 0x7b280 0x800 //reserved for lcp ping-pong buffers
|
9 |
+
_reserved DMb 0x7ba80 0x40 //reserved for sync buffer
|
10 |
+
_stack DM_stack 0x7bac0 0x940 //stack for core
|
11 |
+
_reserved DMb 0x7c400 0x40 //reserved for main elf heap
|
12 |
+
//space for synopsys compiler at 0x7c440 0x880//heap
|
13 |
+
_reserved DMb 0x40000 0x3b280
|
14 |
+
|
15 |
+
_reserved DMb 0x7ccc0 0x3340
|
16 |
+
_reserved DMb 0x80000 0x80000 // And everything else the core can't see
|
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_2_reloadable24/scripts/0_2_reloadable24.prx
ADDED
@@ -0,0 +1,13 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
<project name="Project" processor="me">
|
2 |
+
<issinit/>
|
3 |
+
<option id="cpp.define" value="__AIENGINE__ __AIE_ARCH__=21" inherit = "1"/>
|
4 |
+
<option id="llvm.xargs" value="-fno-jump-tables -fno-discard-value-names" inherit = "1"/>
|
5 |
+
<option id="llvm.lang" value="Follow file extension"/>
|
6 |
+
<option id="bridge.cfg" value="0_2_reloadable24.bcf"/>
|
7 |
+
<option id="bridge.alibs" value=" ../Release/0_2_reloadable24.o" inherit="1" cfg="Release_LLVM"/>
|
8 |
+
<option id="cpp.include" value="<XILINX_VITIS_AIETOOLS>/include /app/vaiml_1.3_examples/camo/./segmentation_1_4_0_fp32_combined/vaiml_par_0/0/backend /usr/local/lib/python3.10/site-packages/include/aie_api /usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/common /usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/include/common /usr/local/lib/python3.10/dist-packages/vitis_mllib /usr/local/lib/python3.10/dist-packages/vitis_mllib/L1/include/misc /usr/local/lib/python3.10/dist-packages/vitis_mllib/L2/src/ml_adf /app/vaiml_1.3_examples/camo/segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/<AIE_SRC_DIR> " inherit="1"/>
|
9 |
+
<option id="project.dir" value="<CONFIG>/0_2_reloadable24"/>
|
10 |
+
<option id="project.name" value="0_2_reloadable24"/>
|
11 |
+
<option id="project.type" value="exe"/>
|
12 |
+
<option id="simrun.issca" value="<XILINX_VITIS_AIETOOLS>/bin/unwrapped/lnx64.o/aie2p/ca_udm_dbg" inherit="0"/>
|
13 |
+
</project>
|
segmentation_1_4_0_fp32_combined/vaiml_par_0/0/aiecompiler/Work/aie/0_2_reloadable24/src/0_2_reloadable24.cc
ADDED
@@ -0,0 +1,113 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
// Automatically generated processor driver using AIEngine tool-chain
|
2 |
+
|
3 |
+
#include <stdio.h>
|
4 |
+
#include <memory>
|
5 |
+
#include <adf.h>
|
6 |
+
|
7 |
+
|
8 |
+
// Declare Kernel functions and initializers
|
9 |
+
#include "resize_adf_wrapper.cpp"
|
10 |
+
void conv2d_maxpool(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict,adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict,const unsigned int (&)[16],adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict);
|
11 |
+
void superkernel_sigmoid1d(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict,const unsigned int (&)[16],adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict);
|
12 |
+
void superkernel_sub1d(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict,const unsigned int (&)[16],adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict,adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict);
|
13 |
+
void superkernel_mul1d(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict,const unsigned int (&)[16],adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict,adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict);
|
14 |
+
void superkernel_tanh1d(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict,const unsigned int (&)[16],adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict);
|
15 |
+
void superkernel_add1d(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict,const unsigned int (&)[16],adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict,adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict);
|
16 |
+
|
17 |
+
// Declare Kernel objects and external arrays
|
18 |
+
|
19 |
+
|
20 |
+
void _b853_wrapper(void* args[])
|
21 |
+
{
|
22 |
+
mllib_graphs::resize_adf_wrapper<bfloat16, adf::io_buffer_config<adf::extents<>>, adf::io_buffer_config<adf::extents<>>, 1, 0, 2>(
|
23 |
+
*reinterpret_cast<adf::input_buffer_conf<bfloat16, adf::bpc_sync_0d>*>(args[0]),
|
24 |
+
*reinterpret_cast<adf::output_buffer_conf<bfloat16, adf::bpc_sync_0d>*>(args[1]),
|
25 |
+
*reinterpret_cast<uint32 const(*)[16]>(args[2]));
|
26 |
+
}
|
27 |
+
|
28 |
+
void _b896_wrapper(void* args[])
|
29 |
+
{
|
30 |
+
conv2d_maxpool(
|
31 |
+
*reinterpret_cast<adf::input_buffer_conf<bfloat16, adf::bpc_sync_0d>*>(args[0]),
|
32 |
+
*reinterpret_cast<adf::input_buffer_conf<bfloat16, adf::bpc_sync_0d>*>(args[1]),
|
33 |
+
*reinterpret_cast<uint32 const(*)[16]>(args[3]),
|
34 |
+
*reinterpret_cast<adf::output_buffer_conf<bfloat16, adf::bpc_async_0d>*>(args[2]));
|
35 |
+
}
|
36 |
+
|
37 |
+
void _b1638_wrapper(void* args[])
|
38 |
+
{
|
39 |
+
superkernel_sigmoid1d(
|
40 |
+
*reinterpret_cast<adf::input_buffer_conf<bfloat16, adf::bpc_sync_0d>*>(args[0]),
|
41 |
+
*reinterpret_cast<uint32 const(*)[16]>(args[2]),
|
42 |
+
*reinterpret_cast<adf::output_buffer_conf<bfloat16, adf::bpc_async_0d>*>(args[1]));
|
43 |
+
}
|
44 |
+
|
45 |
+
void _b1655_wrapper(void* args[])
|
46 |
+
{
|
47 |
+
superkernel_sub1d(
|
48 |
+
*reinterpret_cast<adf::input_buffer_conf<bfloat16, adf::bpc_sync_0d>*>(args[0]),
|
49 |
+
*reinterpret_cast<uint32 const(*)[16]>(args[3]),
|
50 |
+
*reinterpret_cast<adf::input_buffer_conf<bfloat16, adf::bpc_async_0d>*>(args[1]),
|
51 |
+
*reinterpret_cast<adf::output_buffer_conf<bfloat16, adf::bpc_async_0d>*>(args[2]));
|
52 |
+
}
|
53 |
+
|
54 |
+
void _b891_wrapper(void* args[])
|
55 |
+
{
|
56 |
+
superkernel_mul1d(
|
57 |
+
*reinterpret_cast<adf::input_buffer_conf<bfloat16, adf::bpc_sync_0d>*>(args[0]),
|
58 |
+
*reinterpret_cast<uint32 const(*)[16]>(args[3]),
|
59 |
+
*reinterpret_cast<adf::input_buffer_conf<bfloat16, adf::bpc_async_0d>*>(args[1]),
|
60 |
+
*reinterpret_cast<adf::output_buffer_conf<bfloat16, adf::bpc_async_0d>*>(args[2]));
|
61 |
+
}
|
62 |
+
|
63 |
+
void _b1672_wrapper(void* args[])
|
64 |
+
{
|
65 |
+
superkernel_tanh1d(
|
66 |
+
*reinterpret_cast<adf::input_buffer_conf<bfloat16, adf::bpc_sync_0d>*>(args[0]),
|
67 |
+
*reinterpret_cast<uint32 const(*)[16]>(args[2]),
|
68 |
+
*reinterpret_cast<adf::output_buffer_conf<bfloat16, adf::bpc_async_0d>*>(args[1]));
|
69 |
+
}
|
70 |
+
|
71 |
+
void _b886_wrapper(void* args[])
|
72 |
+
{
|
73 |
+
superkernel_add1d(
|
74 |
+
*reinterpret_cast<adf::input_buffer_conf<bfloat16, adf::bpc_sync_0d>*>(args[0]),
|
75 |
+
*reinterpret_cast<uint32 const(*)[16]>(args[3]),
|
76 |
+
*reinterpret_cast<adf::input_buffer_conf<bfloat16, adf::bpc_async_0d>*>(args[1]),
|
77 |
+
*reinterpret_cast<adf::output_buffer_conf<bfloat16, adf::bpc_async_0d>*>(args[2]));
|
78 |
+
}
|
79 |
+
|
80 |
+
using UniformKernelFunc = void (*)(void **);
|
81 |
+
|
82 |
+
static UniformKernelFunc g_uniformKernelFuncs[7] = {
|
83 |
+
_b853_wrapper,
|
84 |
+
_b896_wrapper,
|
85 |
+
_b1638_wrapper,
|
86 |
+
_b1655_wrapper,
|
87 |
+
_b891_wrapper,
|
88 |
+
_b1672_wrapper,
|
89 |
+
_b886_wrapper
|
90 |
+
};
|
91 |
+
|
92 |
+
__attribute__((always_inline)) void kernelWrapper(void* args[], uint32 kernelId, uint32 numSyncIn, uint32 numAsyncIn, uint32 numSyncOut)
|
93 |
+
{
|
94 |
+
uint32 idx = 0;
|
95 |
+
reinterpret_cast<adf::_io_buffer_light_weight_generic*>(args[idx])->acquire<adf::direction::in>(numSyncIn > 0);
|
96 |
+
idx += (numSyncIn > 0) ? 1 : 0;
|
97 |
+
reinterpret_cast<adf::_io_buffer_light_weight_generic*>(args[idx])->acquire<adf::direction::in>(numSyncIn > 1);
|
98 |
+
idx += (numSyncIn > 1) ? 1 : 0;
|
99 |
+
idx += numAsyncIn;
|
100 |
+
reinterpret_cast<adf::_io_buffer_light_weight_generic*>(args[idx])->acquire<adf::direction::out>(numSyncOut > 0);
|
101 |
+
idx += (numSyncOut > 0) ? 1 : 0;
|
102 |
+
|
103 |
+
(*(g_uniformKernelFuncs[kernelId]))(args);
|
104 |
+
|
105 |
+
idx = 0;
|
106 |
+
reinterpret_cast<adf::_io_buffer_light_weight_generic*>(args[idx])->release<adf::direction::in>(numSyncIn > 0);
|
107 |
+
idx += (numSyncIn > 0) ? 1 : 0;
|
108 |
+
reinterpret_cast<adf::_io_buffer_light_weight_generic*>(args[idx])->release<adf::direction::in>(numSyncIn > 1);
|
109 |
+
idx += (numSyncIn > 1) ? 1 : 0;
|
110 |
+
idx += numAsyncIn;
|
111 |
+
reinterpret_cast<adf::_io_buffer_light_weight_generic*>(args[idx])->release<adf::direction::out>(numSyncOut > 0);
|
112 |
+
idx += (numSyncOut > 0) ? 1 : 0;
|
113 |
+
}
|