File size: 14,873 Bytes
b39425e |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 240 241 242 243 244 245 246 247 248 249 250 251 252 253 254 255 256 257 258 259 260 261 262 263 264 265 266 267 268 269 270 271 272 273 274 275 276 277 278 279 280 281 282 283 284 285 286 287 288 289 290 291 292 293 294 295 296 297 298 299 300 301 302 303 304 305 306 307 308 309 310 311 312 313 314 315 316 317 318 319 320 321 322 323 324 325 326 327 328 329 330 331 332 333 334 335 336 337 338 339 340 341 342 343 344 345 346 347 348 349 |
#loc = loc(unknown)
// Top-level module. Its attributes carry the LLVM data layout / target triple,
// an onnx-mlir symbol postfix, and a set of `vaimlconf.*` settings (device name,
// install directory, metadata search paths, single-core compiler).
// NOTE(review): the `vaimlconf.*` keys are presumably consumed by the
// downstream AIE toolchain; their exact semantics are not visible in this file.
// `vaimlconf.install_dir` is an absolute path, and the other `vaimlconf.*`
// paths are written relative to it via `${vaimlconf.install_dir}`.
module attributes {
llvm.data_layout = "e-m:e-p270:32:32-p271:32:32-p272:64:64-i64:64-i128:128-f80:128-n8:16:32:64-S128",
llvm.target_triple = "x86_64-unknown-linux-gnu",
"onnx-mlir.symbol-postfix" = "onnxmodel.onnx.mlir",
vaimlconf.device = "stx",
vaimlconf.device_models = "${vaimlconf.install_dir}/data/deviceModels",
vaimlconf.install_dir = "/usr/local/lib/python3.10/dist-packages/flexml/flexml_extras",
vaimlconf.library_metadata = ["${vaimlconf.install_dir}/data/libraryMetadata/L1", "${vaimlconf.install_dir}/data/libraryMetadata/L2", "${vaimlconf.install_dir}/../../vitis_mllib/L1/metadata", "${vaimlconf.install_dir}/../../vitis_mllib/L2/metadata", "${vaimlconf.install_dir}/share/microkernel-tiling/tiling-recipe-specs"],
vaimlconf.single_core_compiler = "chess"} {
// Body-less (external) declaration of the outlined kernel, tagged with
// `aie_partition = 0` and the unit attribute `kernel`.
// Operands: one 1x180x320x4 bf16 tensor plus four bf16 tensors whose second
// dimension is 16 / 20 / 40 / 64.
// Results: four tensors with the same types as operands 1..4, followed by a
// 1x3x180x320 and a 1x1x180x320 bf16 tensor.
// The implementation is not present in this file.
func.func private @forward_outlined_part_0(tensor<1x180x320x4xbf16>, tensor<1x16x90x160xbf16>, tensor<1x20x45x80xbf16>, tensor<1x40x23x40xbf16>, tensor<1x64x12x20xbf16>) -> (tensor<1x16x90x160xbf16>, tensor<1x20x45x80xbf16>, tensor<1x40x23x40xbf16>, tensor<1x64x12x20xbf16>, tensor<1x3x180x320xbf16>, tensor<1x1x180x320xbf16>) attributes {aie_partition = 0 : i32, kernel} loc(#loc319)
// Public entry point. Inputs are named (via `onnx.name`) src, r1i, r2i, r3i, r4i;
// outputs are named fgr, pha, r1o, r2o, r3o, r4o. This function only adapts
// element type / dimension order around the call to @forward_outlined_part_0.
func.func @forward(%arg0: tensor<1x180x320x4xui8> {onnx.name = "src"} loc(unknown), %arg1: tensor<1x90x160x16xbf16> {onnx.name = "r1i"} loc(unknown), %arg2: tensor<1x45x80x20xbf16> {onnx.name = "r2i"} loc(unknown), %arg3: tensor<1x23x40x40xbf16> {onnx.name = "r3i"} loc(unknown), %arg4: tensor<1x12x20x64xbf16> {onnx.name = "r4i"} loc(unknown)) -> (tensor<1x180x320x3xbf16> {onnx.name = "fgr"}, tensor<1x180x320x1xbf16> {onnx.name = "pha"}, tensor<1x90x160x16xbf16> {onnx.name = "r1o"}, tensor<1x45x80x20xbf16> {onnx.name = "r2o"}, tensor<1x23x40x40xbf16> {onnx.name = "r3o"}, tensor<1x12x20x64xbf16> {onnx.name = "r4o"}) {
// %0: permutation [0, 2, 3, 1] -- moves dimension 1 to the last position
// (used on the kernel results below).
%0 = "tosa.const"() <{value = dense<[0, 2, 3, 1]> : tensor<4xi32>}> : () -> tensor<4xi32> loc(#loc)
// %1: permutation [0, 3, 1, 2] -- moves the last dimension to position 1
// (used on the r1i..r4i inputs below); it is the inverse of %0.
%1 = "tosa.const"() <{value = dense<[0, 3, 1, 2]> : tensor<4xi32>}> : () -> tensor<4xi32> loc(#loc)
// Permute r1i, r2i, r3i into the dimension order the kernel declaration expects.
%2 = tosa.transpose %arg1, %1 : (tensor<1x90x160x16xbf16>, tensor<4xi32>) -> tensor<1x16x90x160xbf16> loc(#loc308)
%3 = tosa.transpose %arg2, %1 : (tensor<1x45x80x20xbf16>, tensor<4xi32>) -> tensor<1x20x45x80xbf16> loc(#loc309)
%4 = tosa.transpose %arg3, %1 : (tensor<1x23x40x40xbf16>, tensor<4xi32>) -> tensor<1x40x23x40xbf16> loc(#loc310)
// src is only converted ui8 -> bf16; unlike r1i..r4i it is NOT transposed and is
// passed to the kernel with its original 1x180x320x4 shape.
%5 = tosa.cast %arg0 {LayerName = "Cast_0", OutputName = "Cast_0"} : (tensor<1x180x320x4xui8>) -> tensor<1x180x320x4xbf16> loc(#loc311)
// Permute r4i the same way as r1i..r3i.
%6 = tosa.transpose %arg4, %1 : (tensor<1x12x20x64xbf16>, tensor<4xi32>) -> tensor<1x64x12x20xbf16> loc(#loc312)
// Invoke the outlined kernel. Result indices: #0..#3 have the types of the
// permuted r1..r4 operands, #4 is 1x3x180x320, #5 is 1x1x180x320.
%7:6 = call @forward_outlined_part_0(%5, %2, %3, %4, %6) : (tensor<1x180x320x4xbf16>, tensor<1x16x90x160xbf16>, tensor<1x20x45x80xbf16>, tensor<1x40x23x40xbf16>, tensor<1x64x12x20xbf16>) -> (tensor<1x16x90x160xbf16>, tensor<1x20x45x80xbf16>, tensor<1x40x23x40xbf16>, tensor<1x64x12x20xbf16>, tensor<1x3x180x320xbf16>, tensor<1x1x180x320xbf16>) loc(#loc319)
// Permute kernel results #4, #3, #2, #1, #0 back with %0 so that dimension 1
// becomes the last dimension again.
%8 = tosa.transpose %7#4, %0 : (tensor<1x3x180x320xbf16>, tensor<4xi32>) -> tensor<1x180x320x3xbf16> loc(#loc313)
%9 = tosa.transpose %7#3, %0 : (tensor<1x64x12x20xbf16>, tensor<4xi32>) -> tensor<1x12x20x64xbf16> loc(#loc314)
%10 = tosa.transpose %7#2, %0 : (tensor<1x40x23x40xbf16>, tensor<4xi32>) -> tensor<1x23x40x40xbf16> loc(#loc315)
%11 = tosa.transpose %7#1, %0 : (tensor<1x20x45x80xbf16>, tensor<4xi32>) -> tensor<1x45x80x20xbf16> loc(#loc316)
%12 = tosa.transpose %7#0, %0 : (tensor<1x16x90x160xbf16>, tensor<4xi32>) -> tensor<1x90x160x16xbf16> loc(#loc317)
// Result #5 uses a reshape rather than a transpose, although its location
// alias (#loc318) is named "Transpose_453". Because the dimension being moved
// has size 1, reshaping 1x1x180x320 -> 1x180x320x1 keeps the same element order
// as a [0, 2, 3, 1] transpose would produce.
%13 = tosa.reshape %7#5 {new_shape = array<i64: 1, 180, 320, 1>} : (tensor<1x1x180x320xbf16>) -> tensor<1x180x320x1xbf16> loc(#loc318)
// Return order follows the declared outputs: fgr (%8), pha (%13), r1o (%12),
// r2o (%11), r3o (%10), r4o (%9).
return %8, %13, %12, %11, %10, %9 : tensor<1x180x320x3xbf16>, tensor<1x180x320x1xbf16>, tensor<1x90x160x16xbf16>, tensor<1x45x80x20xbf16>, tensor<1x23x40x40xbf16>, tensor<1x12x20x64xbf16> loc(#loc)
} loc(#loc)
} loc(#loc)
// Named location aliases (#loc1 .. #loc318), one per line.
// NOTE(review): the names look like ONNX node names (op type + index) from the
// source model -- confirm against the original .onnx graph.
// In this file, #loc1 .. #loc307 are referenced only through the fused location
// #loc319, while #loc308 .. #loc318 are attached directly to ops in @forward.
#loc1 = loc("Div_2")
#loc2 = loc("Sub_431")
#loc3 = loc("Sub_411")
#loc4 = loc("Sub_385")
#loc5 = loc("Sub_359")
#loc6 = loc("Div_16")
#loc7 = loc("Sub_14")
#loc8 = loc("Initializer_398")
#loc9 = loc("Slice_7")
#loc10 = loc("CompilerGeneratedLoc")
#loc11 = loc("Add_445")
#loc12 = loc("AveragePool_346")
#loc13 = loc("AveragePool_347")
#loc14 = loc("AveragePool_348")
#loc15 = loc("Conv_17")
#loc16 = loc("Add_19")
#loc17 = loc("Clip_22")
#loc18 = loc("Div_24")
#loc19 = loc("Mul_25")
#loc20 = loc("Conv_26")
#loc21 = loc("Relu_27")
#loc22 = loc("Conv_28")
#loc23 = loc("Add_29")
#loc24 = loc("Conv_30")
#loc25 = loc("Relu_31")
#loc26 = loc("Conv_32")
#loc27 = loc("Relu_33")
#loc28 = loc("Conv_34")
#loc29 = loc("Conv_35")
#loc30 = loc("Relu_36")
#loc31 = loc("Conv_37")
#loc32 = loc("Relu_38")
#loc33 = loc("Conv_39")
#loc34 = loc("Add_40")
#loc35 = loc("Conv_41")
#loc36 = loc("Relu_42")
#loc37 = loc("Conv_43")
#loc38 = loc("Relu_44")
#loc39 = loc("GlobalAveragePool_45")
#loc40 = loc("Conv_46")
#loc41 = loc("Relu_47")
#loc42 = loc("Conv_48")
#loc43 = loc("Add_50")
#loc44 = loc("Clip_53")
#loc45 = loc("Div_55")
#loc46 = loc("Mul_56")
#loc47 = loc("Conv_57")
#loc48 = loc("Conv_58")
#loc49 = loc("Relu_59")
#loc50 = loc("Conv_60")
#loc51 = loc("Relu_61")
#loc52 = loc("GlobalAveragePool_62")
#loc53 = loc("Conv_63")
#loc54 = loc("Relu_64")
#loc55 = loc("Conv_65")
#loc56 = loc("Add_67")
#loc57 = loc("Clip_70")
#loc58 = loc("Div_72")
#loc59 = loc("Mul_73")
#loc60 = loc("Conv_74")
#loc61 = loc("Add_75")
#loc62 = loc("Conv_76")
#loc63 = loc("Relu_77")
#loc64 = loc("Conv_78")
#loc65 = loc("Relu_79")
#loc66 = loc("GlobalAveragePool_80")
#loc67 = loc("Conv_81")
#loc68 = loc("Relu_82")
#loc69 = loc("Conv_83")
#loc70 = loc("Add_85")
#loc71 = loc("Clip_88")
#loc72 = loc("Div_90")
#loc73 = loc("Mul_91")
#loc74 = loc("Conv_92")
#loc75 = loc("Add_93")
#loc76 = loc("Conv_94")
#loc77 = loc("Add_96")
#loc78 = loc("Clip_99")
#loc79 = loc("Div_101")
#loc80 = loc("Mul_102")
#loc81 = loc("Conv_103")
#loc82 = loc("Add_105")
#loc83 = loc("Clip_108")
#loc84 = loc("Div_110")
#loc85 = loc("Mul_111")
#loc86 = loc("Conv_112")
#loc87 = loc("Conv_113")
#loc88 = loc("Add_115")
#loc89 = loc("Clip_118")
#loc90 = loc("Div_120")
#loc91 = loc("Mul_121")
#loc92 = loc("Conv_122")
#loc93 = loc("Add_124")
#loc94 = loc("Clip_127")
#loc95 = loc("Div_129")
#loc96 = loc("Mul_130")
#loc97 = loc("Conv_131")
#loc98 = loc("Add_132")
#loc99 = loc("Conv_133")
#loc100 = loc("Add_135")
#loc101 = loc("Clip_138")
#loc102 = loc("Div_140")
#loc103 = loc("Mul_141")
#loc104 = loc("Conv_142")
#loc105 = loc("Add_144")
#loc106 = loc("Clip_147")
#loc107 = loc("Div_149")
#loc108 = loc("Mul_150")
#loc109 = loc("Conv_151")
#loc110 = loc("Add_152")
#loc111 = loc("Conv_153")
#loc112 = loc("Add_155")
#loc113 = loc("Clip_158")
#loc114 = loc("Div_160")
#loc115 = loc("Mul_161")
#loc116 = loc("Conv_162")
#loc117 = loc("Add_164")
#loc118 = loc("Clip_167")
#loc119 = loc("Div_169")
#loc120 = loc("Mul_170")
#loc121 = loc("Conv_171")
#loc122 = loc("Add_172")
#loc123 = loc("Conv_173")
#loc124 = loc("Add_175")
#loc125 = loc("Clip_178")
#loc126 = loc("Div_180")
#loc127 = loc("Mul_181")
#loc128 = loc("Conv_182")
#loc129 = loc("Add_184")
#loc130 = loc("Clip_187")
#loc131 = loc("Div_189")
#loc132 = loc("Mul_190")
#loc133 = loc("GlobalAveragePool_191")
#loc134 = loc("Conv_192")
#loc135 = loc("Relu_193")
#loc136 = loc("Conv_194")
#loc137 = loc("Add_196")
#loc138 = loc("Clip_199")
#loc139 = loc("Div_201")
#loc140 = loc("Mul_202")
#loc141 = loc("Conv_203")
#loc142 = loc("Conv_204")
#loc143 = loc("Add_206")
#loc144 = loc("Clip_209")
#loc145 = loc("Div_211")
#loc146 = loc("Mul_212")
#loc147 = loc("Conv_213")
#loc148 = loc("Add_215")
#loc149 = loc("Clip_218")
#loc150 = loc("Div_220")
#loc151 = loc("Mul_221")
#loc152 = loc("GlobalAveragePool_222")
#loc153 = loc("Conv_223")
#loc154 = loc("Relu_224")
#loc155 = loc("Conv_225")
#loc156 = loc("Add_227")
#loc157 = loc("Clip_230")
#loc158 = loc("Div_232")
#loc159 = loc("Mul_233")
#loc160 = loc("Conv_234")
#loc161 = loc("Add_235")
#loc162 = loc("Conv_236")
#loc163 = loc("Add_238")
#loc164 = loc("Clip_241")
#loc165 = loc("Div_243")
#loc166 = loc("Mul_244")
#loc167 = loc("Conv_245")
#loc168 = loc("Add_247")
#loc169 = loc("Clip_250")
#loc170 = loc("Div_252")
#loc171 = loc("Mul_253")
#loc172 = loc("GlobalAveragePool_254")
#loc173 = loc("Conv_255")
#loc174 = loc("Relu_256")
#loc175 = loc("Conv_257")
#loc176 = loc("Add_259")
#loc177 = loc("Clip_262")
#loc178 = loc("Div_264")
#loc179 = loc("Mul_265")
#loc180 = loc("Conv_266")
#loc181 = loc("Conv_267")
#loc182 = loc("Add_269")
#loc183 = loc("Clip_272")
#loc184 = loc("Div_274")
#loc185 = loc("Mul_275")
#loc186 = loc("Conv_276")
#loc187 = loc("Add_278")
#loc188 = loc("Clip_281")
#loc189 = loc("Div_283")
#loc190 = loc("Mul_284")
#loc191 = loc("GlobalAveragePool_285")
#loc192 = loc("Conv_286")
#loc193 = loc("Relu_287")
#loc194 = loc("Conv_288")
#loc195 = loc("Add_290")
#loc196 = loc("Clip_293")
#loc197 = loc("Div_295")
#loc198 = loc("Mul_296")
#loc199 = loc("Conv_297")
#loc200 = loc("Add_298")
#loc201 = loc("Conv_299")
#loc202 = loc("Add_301")
#loc203 = loc("Clip_304")
#loc204 = loc("Div_306")
#loc205 = loc("Mul_307")
#loc206 = loc("Conv_308")
#loc207 = loc("Add_310")
#loc208 = loc("Clip_313")
#loc209 = loc("Div_315")
#loc210 = loc("Mul_316")
#loc211 = loc("GlobalAveragePool_317")
#loc212 = loc("Conv_318")
#loc213 = loc("Relu_319")
#loc214 = loc("Conv_320")
#loc215 = loc("Add_322")
#loc216 = loc("Clip_325")
#loc217 = loc("Div_327")
#loc218 = loc("Mul_328")
#loc219 = loc("Conv_329")
#loc220 = loc("Add_330")
#loc221 = loc("Conv_331")
#loc222 = loc("Add_333")
#loc223 = loc("Clip_336")
#loc224 = loc("Div_338")
#loc225 = loc("Mul_339")
#loc226 = loc("GlobalAveragePool_342")
#loc227 = loc("Conv_343")
#loc228 = loc("Sigmoid_344")
#loc229 = loc("Mul_345")
#loc230 = loc("Conv_340")
#loc231 = loc("Relu_341")
#loc232 = loc("Split_349")
#loc233 = loc("Concat_350")
#loc234 = loc("Conv_351")
#loc235 = loc("Sigmoid_352")
#loc236 = loc("Split_353")
#loc237 = loc("Mul_360")
#loc238 = loc("Mul_354")
#loc239 = loc("Concat_355")
#loc240 = loc("Conv_356")
#loc241 = loc("Tanh_357")
#loc242 = loc("Mul_361")
#loc243 = loc("Add_362")
#loc244 = loc("Concat_363")
#loc245 = loc("Resize_365")
#loc246 = loc("Slice_371")
#loc247 = loc("Concat_372")
#loc248 = loc("Conv_373")
#loc249 = loc("Relu_374")
#loc250 = loc("Split_375")
#loc251 = loc("Concat_376")
#loc252 = loc("Conv_377")
#loc253 = loc("Sigmoid_378")
#loc254 = loc("Split_379")
#loc255 = loc("Mul_386")
#loc256 = loc("Mul_380")
#loc257 = loc("Concat_381")
#loc258 = loc("Conv_382")
#loc259 = loc("Tanh_383")
#loc260 = loc("Mul_387")
#loc261 = loc("Add_388")
#loc262 = loc("Concat_389")
#loc263 = loc("Resize_391")
#loc264 = loc("Slice_397")
#loc265 = loc("Concat_398")
#loc266 = loc("Conv_399")
#loc267 = loc("Relu_400")
#loc268 = loc("Split_401")
#loc269 = loc("Concat_402")
#loc270 = loc("Conv_403")
#loc271 = loc("Sigmoid_404")
#loc272 = loc("Split_405")
#loc273 = loc("Mul_412")
#loc274 = loc("Mul_406")
#loc275 = loc("Concat_407")
#loc276 = loc("Conv_408")
#loc277 = loc("Tanh_409")
#loc278 = loc("Mul_413")
#loc279 = loc("Add_414")
#loc280 = loc("Concat_415")
#loc281 = loc("Resize_417")
#loc282 = loc("Concat_418")
#loc283 = loc("Conv_419")
#loc284 = loc("Relu_420")
#loc285 = loc("Split_421")
#loc286 = loc("Concat_422")
#loc287 = loc("Conv_423")
#loc288 = loc("Sigmoid_424")
#loc289 = loc("Split_425")
#loc290 = loc("Mul_432")
#loc291 = loc("Mul_426")
#loc292 = loc("Concat_427")
#loc293 = loc("Conv_428")
#loc294 = loc("Tanh_429")
#loc295 = loc("Mul_433")
#loc296 = loc("Add_434")
#loc297 = loc("Concat_435")
#loc298 = loc("Resize_437")
#loc299 = loc("Concat_438")
#loc300 = loc("Conv_439")
#loc301 = loc("Relu_440")
#loc302 = loc("Conv_441")
#loc303 = loc("Relu_442")
#loc304 = loc("Conv_443")
#loc305 = loc("Split_444")
#loc306 = loc("Clip_446")
#loc307 = loc("Clip_447")
#loc308 = loc("Transpose_9")
#loc309 = loc("Transpose_10")
#loc310 = loc("Transpose_11")
#loc311 = loc("Cast_0")
#loc312 = loc("Transpose_12")
#loc313 = loc("Transpose_452")
#loc314 = loc("Transpose_451")
#loc315 = loc("Transpose_450")
#loc316 = loc("Transpose_449")
#loc317 = loc("Transpose_448")
#loc318 = loc("Transpose_453")
// Fused location combining #loc1 through #loc307. It is attached to both the
// declaration of @forward_outlined_part_0 and the call to it in @forward.
// NOTE(review): presumably these are the source nodes that were outlined into
// that kernel -- confirm with the tool that produced this file.
#loc319 = loc(fused[#loc1, #loc2, #loc3, #loc4, #loc5, #loc6, #loc7, #loc8, #loc9, #loc10, #loc11, #loc12, #loc13, #loc14, #loc15, #loc16, #loc17, #loc18, #loc19, #loc20, #loc21, #loc22, #loc23, #loc24, #loc25, #loc26, #loc27, #loc28, #loc29, #loc30, #loc31, #loc32, #loc33, #loc34, #loc35, #loc36, #loc37, #loc38, #loc39, #loc40, #loc41, #loc42, #loc43, #loc44, #loc45, #loc46, #loc47, #loc48, #loc49, #loc50, #loc51, #loc52, #loc53, #loc54, #loc55, #loc56, #loc57, #loc58, #loc59, #loc60, #loc61, #loc62, #loc63, #loc64, #loc65, #loc66, #loc67, #loc68, #loc69, #loc70, #loc71, #loc72, #loc73, #loc74, #loc75, #loc76, #loc77, #loc78, #loc79, #loc80, #loc81, #loc82, #loc83, #loc84, #loc85, #loc86, #loc87, #loc88, #loc89, #loc90, #loc91, #loc92, #loc93, #loc94, #loc95, #loc96, #loc97, #loc98, #loc99, #loc100, #loc101, #loc102, #loc103, #loc104, #loc105, #loc106, #loc107, #loc108, #loc109, #loc110, #loc111, #loc112, #loc113, #loc114, #loc115, #loc116, #loc117, #loc118, #loc119, #loc120, #loc121, #loc122, #loc123, #loc124, #loc125, #loc126, #loc127, #loc128, #loc129, #loc130, #loc131, #loc132, #loc133, #loc134, #loc135, #loc136, #loc137, #loc138, #loc139, #loc140, #loc141, #loc142, #loc143, #loc144, #loc145, #loc146, #loc147, #loc148, #loc149, #loc150, #loc151, #loc152, #loc153, #loc154, #loc155, #loc156, #loc157, #loc158, #loc159, #loc160, #loc161, #loc162, #loc163, #loc164, #loc165, #loc166, #loc167, #loc168, #loc169, #loc170, #loc171, #loc172, #loc173, #loc174, #loc175, #loc176, #loc177, #loc178, #loc179, #loc180, #loc181, #loc182, #loc183, #loc184, #loc185, #loc186, #loc187, #loc188, #loc189, #loc190, #loc191, #loc192, #loc193, #loc194, #loc195, #loc196, #loc197, #loc198, #loc199, #loc200, #loc201, #loc202, #loc203, #loc204, #loc205, #loc206, #loc207, #loc208, #loc209, #loc210, #loc211, #loc212, #loc213, #loc214, #loc215, #loc216, #loc217, #loc218, #loc219, #loc220, #loc221, #loc222, #loc223, #loc224, #loc225, #loc226, #loc227, #loc228, #loc229, #loc230, #loc231, #loc232, 
#loc233, #loc234, #loc235, #loc236, #loc237, #loc238, #loc239, #loc240, #loc241, #loc242, #loc243, #loc244, #loc245, #loc246, #loc247, #loc248, #loc249, #loc250, #loc251, #loc252, #loc253, #loc254, #loc255, #loc256, #loc257, #loc258, #loc259, #loc260, #loc261, #loc262, #loc263, #loc264, #loc265, #loc266, #loc267, #loc268, #loc269, #loc270, #loc271, #loc272, #loc273, #loc274, #loc275, #loc276, #loc277, #loc278, #loc279, #loc280, #loc281, #loc282, #loc283, #loc284, #loc285, #loc286, #loc287, #loc288, #loc289, #loc290, #loc291, #loc292, #loc293, #loc294, #loc295, #loc296, #loc297, #loc298, #loc299, #loc300, #loc301, #loc302, #loc303, #loc304, #loc305, #loc306, #loc307])
|