Add files using upload-large-folder tool
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- vaiml_par_0/0/aiecompiler/Work/aie/0_2/lcp/0_2_1481.bin +3 -0
- vaiml_par_0/0/aiecompiler/Work/aie/0_2/lcp/0_2_1482.bin +3 -0
- vaiml_par_0/0/aiecompiler/Work/aie/0_2/lcp/0_2_1483.bin +3 -0
- vaiml_par_0/0/aiecompiler/Work/aie/0_2/lcp/0_2_1484.bin +3 -0
- vaiml_par_0/0/aiecompiler/Work/aie/0_2/lcp/0_2_1487.bin +3 -0
- vaiml_par_0/0/aiecompiler/Work/aie/0_2/lcp/0_2_1488.bin +3 -0
- vaiml_par_0/0/aiecompiler/Work/aie/0_2/lcp/0_2_1489.bin +3 -0
- vaiml_par_0/0/aiecompiler/Work/aie/0_2/lcp/0_2_149.bin +3 -0
- vaiml_par_0/0/aiecompiler/Work/aie/0_2/lcp/0_2_1490.bin +3 -0
- vaiml_par_0/0/aiecompiler/Work/aie/0_2/lcp/0_2_1491.bin +3 -0
- vaiml_par_0/0/aiecompiler/Work/aie/0_2/lcp/0_2_1492.bin +3 -0
- vaiml_par_0/0/aiecompiler/Work/aie/0_2/lcp/0_2_1493.bin +3 -0
- vaiml_par_0/0/aiecompiler/Work/aie/0_2/lcp/0_2_1494.bin +3 -0
- vaiml_par_0/0/aiecompiler/Work/aie/0_2/lcp/0_2_1495.bin +3 -0
- vaiml_par_0/0/aiecompiler/Work/aie/0_2/lcp/0_2_1496.bin +3 -0
- vaiml_par_0/0/aiecompiler/Work/aie/0_2/lcp/0_2_1497.bin +3 -0
- vaiml_par_0/0/aiecompiler/Work/aie/0_2/lcp/0_2_1498.bin +3 -0
- vaiml_par_0/0/aiecompiler/Work/aie/0_2/lcp/0_2_1499.bin +3 -0
- vaiml_par_0/0/aiecompiler/Work/aie/0_2/lcp/0_2_1500.bin +3 -0
- vaiml_par_0/0/aiecompiler/Work/aie/0_2/lcp/0_2_1501.bin +3 -0
- vaiml_par_0/0/aiecompiler/Work/aie/0_2/lcp/0_2_1502.bin +3 -0
- vaiml_par_0/0/aiecompiler/Work/aie/0_2/lcp/0_2_1503.bin +3 -0
- vaiml_par_0/0/aiecompiler/Work/reports/report_pm.txt +0 -0
- vaiml_par_0/0/aiecompiler/Work/reports/report_stack.txt +0 -0
- vaiml_par_0/0/aiecompiler/Work/temp/kernel_stubs.h +32 -0
- vaiml_par_0/0/aiecompiler/Work/temp/top_partition.json +0 -0
- vaiml_par_0/0/backend/0.dag_before_general_L2L3_buffer_insertion.dot +0 -0
- vaiml_par_0/0/backend/1.dag_after_general_L2L3_buffer_insertion.dot +0 -0
- vaiml_par_0/0/backend/10.dag_after_TGOptimizeForO2.dot +0 -0
- vaiml_par_0/0/backend/11.dag_after_InactiveSpilling_pass_O2.dot +0 -0
- vaiml_par_0/0/backend/12.dag_after_TGNodeSpillingForO2_pass_O2.dot +0 -0
- vaiml_par_0/0/backend/13.dag_after_ReshapeHandlingPass.dot +0 -0
- vaiml_par_0/0/backend/14.dag_before_L2Placement.dot +0 -0
- vaiml_par_0/0/backend/15.dag_After_L2flushout.dot +0 -0
- vaiml_par_0/0/backend/16.dag_After_layerwisestamping.dot +0 -0
- vaiml_par_0/0/backend/17.dag_before_ADFgen.dot +0 -0
- vaiml_par_0/0/backend/2.dag_AfterL3concat_fanout.dot +0 -0
- vaiml_par_0/0/backend/3.dag_AfterTGtoConcatPass.dot +0 -0
- vaiml_par_0/0/backend/4.dag_AfterConcatoffsetComputePass.dot +0 -0
- vaiml_par_0/0/backend/5.dag_after_tg_pass.dot +0 -0
- vaiml_par_0/0/backend/6.dag_after_RemoveL2L3Buffer_pass_O2.dot +0 -0
- vaiml_par_0/0/backend/7.dag_after_AddControlEdge_pass_O2.dot +0 -0
- vaiml_par_0/0/backend/8.dag_after_ReplaceL3ByL2concat_pass_O2.dot +0 -0
- vaiml_par_0/0/backend/9.dag_after_L2_SpillFMOverflow_pass_O2.dot +0 -0
- vaiml_par_0/0/backend/BE_postcheck_log.txt +0 -0
- vaiml_par_0/0/backend/InactiveSpillingDebug_Dump_0.dot +0 -0
- vaiml_par_0/0/backend/TGNodeSpilling_Dump_0.dot +0 -0
- vaiml_par_0/0/backend/TGNodeSpilling_Dump_1.dot +0 -0
- vaiml_par_0/0/backend/TGNodeSpilling_Dump_10.dot +0 -0
- vaiml_par_0/0/backend/TGNodeSpilling_Dump_100.dot +0 -0
vaiml_par_0/0/aiecompiler/Work/aie/0_2/lcp/0_2_1481.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:02f23643b7fb3790cbaf3425e8080e698ee243d955f581ef3ef9cb42be0f75b2
|
3 |
+
size 384
|
vaiml_par_0/0/aiecompiler/Work/aie/0_2/lcp/0_2_1482.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e746703685b9d674309ebd90c4eaa7ebb247bcae5ba24689aeb97ff3db961098
|
3 |
+
size 376
|
vaiml_par_0/0/aiecompiler/Work/aie/0_2/lcp/0_2_1483.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:96f138c7be056a7fffdaefeca0d04b29e1f4504680888efeda4c615c73e0326d
|
3 |
+
size 264
|
vaiml_par_0/0/aiecompiler/Work/aie/0_2/lcp/0_2_1484.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:befe49b6eb216d0687a361dfdaf6dc9020d90aebb0e257e8935dd5f9192daf96
|
3 |
+
size 348
|
vaiml_par_0/0/aiecompiler/Work/aie/0_2/lcp/0_2_1487.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b9b497ffdfdd8fa3a5897c165c6f5e7eebb2245d9c262fefa27ed48309822fc4
|
3 |
+
size 260
|
vaiml_par_0/0/aiecompiler/Work/aie/0_2/lcp/0_2_1488.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8e341d4e142f7922e6134ac8979076a1c87f3aa00817fc135424bd21bee97c53
|
3 |
+
size 244
|
vaiml_par_0/0/aiecompiler/Work/aie/0_2/lcp/0_2_1489.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:503917d4e5a2f37d335b35f18211b1f9f407f7d4a169e2484e2534deb9fe2142
|
3 |
+
size 348
|
vaiml_par_0/0/aiecompiler/Work/aie/0_2/lcp/0_2_149.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:999ce13aca08dfc0364089a90d9f8d1d670878edab24f5e91e8d56a60e86a777
|
3 |
+
size 260
|
vaiml_par_0/0/aiecompiler/Work/aie/0_2/lcp/0_2_1490.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f2a1067a4e148fb4d772636ce1e2ff9fc58cfe42fa9b03d7d59b0fd70cd5d26e
|
3 |
+
size 296
|
vaiml_par_0/0/aiecompiler/Work/aie/0_2/lcp/0_2_1491.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:49d223ef3fce6fbed5560bd0c3d3023633b397d8614611b0d72f6ce69c90f1f2
|
3 |
+
size 376
|
vaiml_par_0/0/aiecompiler/Work/aie/0_2/lcp/0_2_1492.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:05804e71b0e897e153633f43bedc51408a1ed4d0cca5fa5eeaa056e3345ba822
|
3 |
+
size 244
|
vaiml_par_0/0/aiecompiler/Work/aie/0_2/lcp/0_2_1493.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:621daab1b36b5b2d0d9f9d4e59098028a936921e423bb78f7d3cc257f7bc2f52
|
3 |
+
size 296
|
vaiml_par_0/0/aiecompiler/Work/aie/0_2/lcp/0_2_1494.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:59c33b8be639d270c6953c7ab6e7e1d2b5b402aad29960a032b71e0dec5af0c2
|
3 |
+
size 260
|
vaiml_par_0/0/aiecompiler/Work/aie/0_2/lcp/0_2_1495.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9cd8ea6aa61e10c4fc8b26fd085f4706bd314d0e5b957f144868b3521aaa9374
|
3 |
+
size 260
|
vaiml_par_0/0/aiecompiler/Work/aie/0_2/lcp/0_2_1496.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7d35c512706b8587ee71c3994802890e9dff3ce30f6e4de6016642c136d2247a
|
3 |
+
size 384
|
vaiml_par_0/0/aiecompiler/Work/aie/0_2/lcp/0_2_1497.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:95738b9d6328e4f5fc532c7cd6092e18b401c5d51c4b5337bbbd0180c4a37252
|
3 |
+
size 260
|
vaiml_par_0/0/aiecompiler/Work/aie/0_2/lcp/0_2_1498.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:05804e71b0e897e153633f43bedc51408a1ed4d0cca5fa5eeaa056e3345ba822
|
3 |
+
size 244
|
vaiml_par_0/0/aiecompiler/Work/aie/0_2/lcp/0_2_1499.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:65e40c435419ee1ac0d52925c1b51504a4f0844adc6311893ab7338471acb9bb
|
3 |
+
size 296
|
vaiml_par_0/0/aiecompiler/Work/aie/0_2/lcp/0_2_1500.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0d86d29759f2785bc9e5425bb6e581efeace13ace63114b99ae21b78a526ad62
|
3 |
+
size 296
|
vaiml_par_0/0/aiecompiler/Work/aie/0_2/lcp/0_2_1501.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e98dde8600e0d949299a92243e5f91fea826235412df5f0e13a18f28cdf703e2
|
3 |
+
size 376
|
vaiml_par_0/0/aiecompiler/Work/aie/0_2/lcp/0_2_1502.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:72fa29e048525188268e47c416bdad632fc6255892cfb893f9e7655951f172b2
|
3 |
+
size 296
|
vaiml_par_0/0/aiecompiler/Work/aie/0_2/lcp/0_2_1503.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4999af9a4ada89c3c8ab3472cc09586b27611c63fd0eedf72f6a81937c66ed4a
|
3 |
+
size 260
|
vaiml_par_0/0/aiecompiler/Work/reports/report_pm.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
vaiml_par_0/0/aiecompiler/Work/reports/report_stack.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
vaiml_par_0/0/aiecompiler/Work/temp/kernel_stubs.h
ADDED
@@ -0,0 +1,32 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
template<typename dtype, typename config_ifm, typename config_ofm> void mllib_graphs::buffer_pad_adf_wrapper(adf::input_buffer_conf<dtype, config_ifm> &__restrict ifm, adf::output_buffer_conf<dtype, config_ofm> &__restrict ofm, const uint32_t (&layer_params)[3]) { /* Stub */ }
|
2 |
+
template<typename dtype, typename config_ifm, typename config_ofm> void mllib_graphs::buffer_unpad_adf_wrapper(adf::input_buffer_conf<dtype, config_ifm> &__restrict ifm, adf::output_buffer_conf<dtype, config_ofm> &__restrict ofm, const uint32_t (&layer_params)[3]) { /* Stub */ }
|
3 |
+
template<typename dtype, typename config_ifm, typename config_ofm> void mllib_graphs::slice_generic_innermost_adf_wrapper(adf::input_buffer_conf<dtype, config_ifm> &__restrict ifm, adf::output_buffer_conf<dtype, config_ofm> &__restrict ofm, const uint32_t (&lp)[16]) { /* Stub */ }
|
4 |
+
template<typename dtype, typename config_ifm, typename config_ofm> void mllib_graphs::softmax_adf_wrapper(adf::input_buffer_conf<dtype, config_ifm> &__restrict ifm, const uint32_t (&layer_params)[8], adf::output_buffer_conf<dtype, config_ofm> &__restrict ofm) { /* Stub */ }
|
5 |
+
template<typename dtype, typename config_ifm, typename config_ofm> void mllib_graphs::transpose4d_adf_wrapper(adf::input_buffer_conf<dtype, config_ifm> &__restrict ifm, adf::output_buffer_conf<dtype, config_ofm> &__restrict ofm, const uint32_t (&layer_params)[7]) { /* Stub */ }
|
6 |
+
template<typename dtype, typename config_ifm, typename config_wts, typename config_ofm> void mllib_graphs::rmsnorm_row_major_part1_4x4_wrapper(adf::input_buffer_conf<dtype, config_ifm> &__restrict ifm, adf::input_buffer_conf<dtype, config_wts> &__restrict wts, const uint32_t (&layer_params)[11], adf::output_buffer_conf<dtype, config_ofm> &__restrict ofm) { /* Stub */ }
|
7 |
+
template<typename dtype, typename config_ifm, typename config_wts, typename config_ofm> void mllib_graphs::rmsnorm_row_major_part2_4x4_wrapper(adf::input_buffer_conf<dtype, config_ifm> &__restrict ifm, adf::input_buffer_conf<dtype, config_wts> &__restrict wts, const uint32_t (&layer_params)[11], adf::output_buffer_conf<dtype, config_ofm> &__restrict ofm) { /* Stub */ }
|
8 |
+
template<typename dtype, typename config_ifm, typename config_wts, typename config_ofm> void mllib_graphs::rmsnorm_row_major_part3_4x4_wrapper(adf::input_buffer_conf<dtype, config_ifm> &__restrict ifm, adf::input_buffer_conf<dtype, config_wts> &__restrict wts, const uint32_t (&layer_params)[11], adf::output_buffer_conf<dtype, config_ofm> &__restrict ofm) { /* Stub */ }
|
9 |
+
template<typename dtype, typename config_ifm1, typename config_ifm2, typename config_ofm> void mllib_graphs::concat_adf_wrapper(adf::input_buffer_conf<dtype, config_ifm1> &__restrict ifm1, adf::input_buffer_conf<dtype, config_ifm2> &__restrict ifm2, adf::output_buffer_conf<dtype, config_ofm> &__restrict ofm, const uint32_t (&layer_params)[9]) { /* Stub */ }
|
10 |
+
template<typename dtype> void mllib_graphs::expand_wrapper(adf::input_buffer_conf<dtype, adf::bpc_sync_0d> &__restrict ifm, const uint32_t (&lp)[3], adf::output_buffer_conf<dtype, adf::bpc_sync_0d> &__restrict ofm) { /* Stub */ }
|
11 |
+
template<typename dtype_io, typename dtype_wts, typename config_ifm, typename config_wts, typename config_ofm> void gather_elements_adf_wrapper(adf::input_buffer_conf<dtype_io, config_ifm> &__restrict ifm, adf::input_buffer_conf<dtype_wts, config_wts> &__restrict wts, const uint32_t (&layer_params)[16], adf::output_buffer_conf<dtype_io, config_ofm> &__restrict ofm) { /* Stub */ }
|
12 |
+
void conv2d_maxpool(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict, adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict, const unsigned int (&)[16], adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict) { /* Stub */ }
|
13 |
+
void superkernel_GemmBfp16(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict, adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict, const unsigned int (&)[7], adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict) { /* Stub */ }
|
14 |
+
void superkernel_add1d(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict, const unsigned int (&)[16], adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict, adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict) { /* Stub */ }
|
15 |
+
void superkernel_add1d_attribute_broadcasting(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict, const unsigned int (&)[16], adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict) { /* Stub */ }
|
16 |
+
void superkernel_conv2d_dwc(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict, adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict, const unsigned int (&)[16], adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict) { /* Stub */ }
|
17 |
+
void superkernel_mul1d(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict, const unsigned int (&)[16], adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict, adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict) { /* Stub */ }
|
18 |
+
void superkernel_mul1d_attribute_broadcasting(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict, const unsigned int (&)[16], adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict) { /* Stub */ }
|
19 |
+
void superkernel_reducesum(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict, const unsigned int (&)[18], adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict) { /* Stub */ }
|
20 |
+
void superkernel_sigmoid1d(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict, const unsigned int (&)[16], adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict) { /* Stub */ }
|
21 |
+
void superkernel_sub1d(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict, const unsigned int (&)[16], adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict, adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict) { /* Stub */ }
|
22 |
+
template void gather_elements_adf_wrapper<bfloat16, int, adf::io_buffer_config<adf::extents<>>, adf::io_buffer_config<adf::extents<>>, adf::io_buffer_config<adf::extents<>>>(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict, adf::io_buffer<int, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict, const unsigned int (&)[16], adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>>> &__restrict); /* explicit template instantiation */
|
23 |
+
template void mllib_graphs::buffer_pad_adf_wrapper<bfloat16, adf::io_buffer_config<adf::extents<>>, adf::io_buffer_config<adf::extents<>>>(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict, adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>>> &__restrict, const unsigned int (&)[3]); /* explicit template instantiation */
|
24 |
+
template void mllib_graphs::buffer_unpad_adf_wrapper<bfloat16, adf::io_buffer_config<adf::extents<>>, adf::io_buffer_config<adf::extents<>>>(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict, adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>>> &__restrict, const unsigned int (&)[3]); /* explicit template instantiation */
|
25 |
+
template void mllib_graphs::concat_adf_wrapper<bfloat16, adf::io_buffer_config<adf::extents<>>, adf::io_buffer_config<adf::extents<>>, adf::io_buffer_config<adf::extents<>>>(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict, adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict, adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>>> &__restrict, const unsigned int (&)[9]); /* explicit template instantiation */
|
26 |
+
template void mllib_graphs::expand_wrapper<bfloat16>(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict, const unsigned int (&)[3], adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>>> &__restrict); /* explicit template instantiation */
|
27 |
+
template void mllib_graphs::rmsnorm_row_major_part1_4x4_wrapper<bfloat16, adf::io_buffer_config<adf::extents<>>, adf::io_buffer_config<adf::extents<>>, adf::io_buffer_config<adf::extents<>, adf::locking::async>>(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict, adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict, const unsigned int (&)[11], adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>, adf::locking::async>> &__restrict); /* explicit template instantiation */
|
28 |
+
template void mllib_graphs::rmsnorm_row_major_part2_4x4_wrapper<bfloat16, adf::io_buffer_config<adf::extents<>>, adf::io_buffer_config<adf::extents<>>, adf::io_buffer_config<adf::extents<>>>(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict, adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict, const unsigned int (&)[11], adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>>> &__restrict); /* explicit template instantiation */
|
29 |
+
template void mllib_graphs::rmsnorm_row_major_part3_4x4_wrapper<bfloat16, adf::io_buffer_config<adf::extents<>>, adf::io_buffer_config<adf::extents<>>, adf::io_buffer_config<adf::extents<>>>(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict, adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict, const unsigned int (&)[11], adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>>> &__restrict); /* explicit template instantiation */
|
30 |
+
template void mllib_graphs::slice_generic_innermost_adf_wrapper<bfloat16, adf::io_buffer_config<adf::extents<>>, adf::io_buffer_config<adf::extents<>>>(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict, adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>>> &__restrict, const unsigned int (&)[16]); /* explicit template instantiation */
|
31 |
+
template void mllib_graphs::softmax_adf_wrapper<bfloat16, adf::io_buffer_config<adf::extents<>>, adf::io_buffer_config<adf::extents<>>>(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict, const unsigned int (&)[8], adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>>> &__restrict); /* explicit template instantiation */
|
32 |
+
template void mllib_graphs::transpose4d_adf_wrapper<bfloat16, adf::io_buffer_config<adf::extents<>>, adf::io_buffer_config<adf::extents<>>>(adf::io_buffer<bfloat16, adf::direction::in, adf::io_buffer_config<adf::extents<>>> &__restrict, adf::io_buffer<bfloat16, adf::direction::out, adf::io_buffer_config<adf::extents<>>> &__restrict, const unsigned int (&)[7]); /* explicit template instantiation */
|
vaiml_par_0/0/aiecompiler/Work/temp/top_partition.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
vaiml_par_0/0/backend/0.dag_before_general_L2L3_buffer_insertion.dot
ADDED
The diff for this file is too large to render.
See raw diff
|
|
vaiml_par_0/0/backend/1.dag_after_general_L2L3_buffer_insertion.dot
ADDED
The diff for this file is too large to render.
See raw diff
|
|
vaiml_par_0/0/backend/10.dag_after_TGOptimizeForO2.dot
ADDED
The diff for this file is too large to render.
See raw diff
|
|
vaiml_par_0/0/backend/11.dag_after_InactiveSpilling_pass_O2.dot
ADDED
The diff for this file is too large to render.
See raw diff
|
|
vaiml_par_0/0/backend/12.dag_after_TGNodeSpillingForO2_pass_O2.dot
ADDED
The diff for this file is too large to render.
See raw diff
|
|
vaiml_par_0/0/backend/13.dag_after_ReshapeHandlingPass.dot
ADDED
The diff for this file is too large to render.
See raw diff
|
|
vaiml_par_0/0/backend/14.dag_before_L2Placement.dot
ADDED
The diff for this file is too large to render.
See raw diff
|
|
vaiml_par_0/0/backend/15.dag_After_L2flushout.dot
ADDED
The diff for this file is too large to render.
See raw diff
|
|
vaiml_par_0/0/backend/16.dag_After_layerwisestamping.dot
ADDED
The diff for this file is too large to render.
See raw diff
|
|
vaiml_par_0/0/backend/17.dag_before_ADFgen.dot
ADDED
The diff for this file is too large to render.
See raw diff
|
|
vaiml_par_0/0/backend/2.dag_AfterL3concat_fanout.dot
ADDED
The diff for this file is too large to render.
See raw diff
|
|
vaiml_par_0/0/backend/3.dag_AfterTGtoConcatPass.dot
ADDED
The diff for this file is too large to render.
See raw diff
|
|
vaiml_par_0/0/backend/4.dag_AfterConcatoffsetComputePass.dot
ADDED
The diff for this file is too large to render.
See raw diff
|
|
vaiml_par_0/0/backend/5.dag_after_tg_pass.dot
ADDED
The diff for this file is too large to render.
See raw diff
|
|
vaiml_par_0/0/backend/6.dag_after_RemoveL2L3Buffer_pass_O2.dot
ADDED
The diff for this file is too large to render.
See raw diff
|
|
vaiml_par_0/0/backend/7.dag_after_AddControlEdge_pass_O2.dot
ADDED
The diff for this file is too large to render.
See raw diff
|
|
vaiml_par_0/0/backend/8.dag_after_ReplaceL3ByL2concat_pass_O2.dot
ADDED
The diff for this file is too large to render.
See raw diff
|
|
vaiml_par_0/0/backend/9.dag_after_L2_SpillFMOverflow_pass_O2.dot
ADDED
The diff for this file is too large to render.
See raw diff
|
|
vaiml_par_0/0/backend/BE_postcheck_log.txt
ADDED
File without changes
|
vaiml_par_0/0/backend/InactiveSpillingDebug_Dump_0.dot
ADDED
The diff for this file is too large to render.
See raw diff
|
|
vaiml_par_0/0/backend/TGNodeSpilling_Dump_0.dot
ADDED
The diff for this file is too large to render.
See raw diff
|
|
vaiml_par_0/0/backend/TGNodeSpilling_Dump_1.dot
ADDED
The diff for this file is too large to render.
See raw diff
|
|
vaiml_par_0/0/backend/TGNodeSpilling_Dump_10.dot
ADDED
The diff for this file is too large to render.
See raw diff
|
|
vaiml_par_0/0/backend/TGNodeSpilling_Dump_100.dot
ADDED
The diff for this file is too large to render.
See raw diff
|
|