Skip to content

Instantly share code, notes, and snippets.

@BeMg
Last active August 21, 2019 06:55
Show Gist options
  • Save BeMg/342c3a3b4cdd561492a199295cb68080 to your computer and use it in GitHub Desktop.
Save BeMg/342c3a3b4cdd561492a199295cb68080 to your computer and use it in GitHub Desktop.
.text
.file "fuse_reshape"
# -----------------------------------------------------------------------
# fuse_reshape -- argument-validating entry point that forwards to
# fuse_reshape_compute_.
#
# In:    a0 = array of 8-byte entries; entries 0 and 1 are read as pointers
#             to argument records
#        a1 = array of 32-bit codes, one per argument
#        a2 = argument count (only the low 32 bits are used; must equal 2)
# Out:   a0 = 0 on success; 0x00000000FFFFFFFF after any failed check
# Frame: 16 bytes; saves ra and s0.
#
# Every failed check calls the function pointer stored at
# __TVMAPISetLastError with the address of a .L.str.N message in a0.
#
# Record fields read (byte offsets): 0 = buffer pointer handed to the
# compute routine, 8 / 12 / 16 = 32-bit words, 20 / 21 = bytes,
# 22 = halfword, 24 = pointer to an array of 8-byte entries, 32 = optional
# pointer to a second such array, 40 = 64-bit value that must be zero.
# NOTE(review): this layout looks like DLPack's DLTensor (data, ctx, ndim,
# dtype, shape, strides, byte_offset) -- confirm against the TVM headers.
# NOTE(review): the failure value equals -1 only when read as a 32-bit int;
# it is not sign-extended to 64 bits -- confirm callers only test the low
# 32 bits.
# -----------------------------------------------------------------------
.globl fuse_reshape # -- Begin function fuse_reshape
.p2align 2
.type fuse_reshape,@function
fuse_reshape: # @fuse_reshape
.cfi_startproc
# %bb.0: # %entry
addi sp, sp, -16
.cfi_def_cfa_offset 16
sd ra, 8(sp)
sd s0, 0(sp)
.cfi_offset ra, -8
.cfi_offset s0, -16
# Zero-extend the low 32 bits of a2 and require the count to be exactly 2.
slli a2, a2, 32
srli a2, a2, 32
addi a3, zero, 2
bne a2, a3, .LBB0_38
# %bb.1: # %assert_end
# t3 / t2 = codes of argument 0 / 1; a5 / a2 = record pointers 0 / 1.
# From record 0: a7 = array at +24, a1 = buffer at +0, a0 = optional array
# at +32.
lwu t2, 4(a1)
ld a2, 8(a0)
lwu t3, 0(a1)
ld a5, 0(a0)
ld a7, 24(a5)
ld a1, 0(a5)
ld a0, 32(a5)
beqz a0, .LBB0_4
# %bb.2: # %if_then
# Record 0's optional array is present: its entries must be 784, 1.
# Entry 0 is compared as a 32-bit load; entry 1 is loaded as 64 bits and
# truncated to its low 32 bits before the compare.
lw a3, 0(a0)
addi s0, zero, 784
bne a3, s0, .LBB0_39
# %bb.3: # %if_then
ld a0, 8(a0)
slli a0, a0, 32
srli a0, a0, 32
addi a3, zero, 1
bne a0, a3, .LBB0_39
.LBB0_4: # %if_end
# From record 1: t0 = array at +24, a0 = buffer at +0 (first argument of the
# compute call). a6 / t1 = 32-bit words at +12 / +8 of record 0.
ld t0, 24(a2)
ld a0, 0(a2)
lwu a6, 12(a5)
lwu t1, 8(a5)
ld a3, 32(a2)
beqz a3, .LBB0_9
# %bb.5: # %if_then3
# Record 1's optional array is present: its entries must be 784, 784, 28, 1.
lw a4, 0(a3)
addi s0, zero, 784
bne a4, s0, .LBB0_40
# %bb.6: # %if_then3
ld a4, 8(a3)
slli a4, a4, 32
srli a4, a4, 32
bne a4, s0, .LBB0_40
# %bb.7: # %if_then3
ld a4, 16(a3)
slli a4, a4, 32
srli a4, a4, 32
addi s0, zero, 28
bne a4, s0, .LBB0_40
# %bb.8: # %if_then3
ld a3, 24(a3)
slli a3, a3, 32
srli a3, a3, 32
addi a4, zero, 1
bne a3, a4, .LBB0_40
.LBB0_9: # %if_end4
# Code of argument 0 must be <= 13 and have its bit set in the mask
# 0x2098 (lui 2 + 152), i.e. be one of 3, 4, 7 or 13.
# NOTE(review): presumably TVM type codes for handle-like arguments -- confirm.
addi a3, zero, 13
bltu a3, t3, .LBB0_33
# %bb.10: # %if_end4
addi a3, zero, 1
sll a3, a3, t3
lui a4, 2
addiw a4, a4, 152
and a3, a3, a4
beqz a3, .LBB0_33
# %bb.11: # %assert_end8
# Same membership test for the code of argument 1.
addi a3, zero, 13
bltu a3, t2, .LBB0_34
# %bb.12: # %assert_end8
addi a3, zero, 1
sll a4, a3, t2
lui s0, 2
addiw s0, s0, 152
and a4, a4, s0
beqz a4, .LBB0_34
# %bb.13: # %assert_end10
# Record 0 checks. a3 still holds 1 here: word at +8 must be 1.
bne t1, a3, .LBB0_41
# %bb.14: # %assert_end12
# Word at +16 must be 2.
lw a3, 16(a5)
addi a4, zero, 2
bne a3, a4, .LBB0_42
# %bb.15: # %assert_end14
# Halfword +22 must be 1, byte +21 must be 32, byte +20 must be 2.
# s0 = 1 is kept live because the .LBB0_55 failure tail reads it after the call.
lhu a3, 22(a5)
addi s0, zero, 1
bne a3, s0, .LBB0_43
# %bb.16: # %assert_end14
lbu a3, 21(a5)
addi a4, zero, 32
bne a3, a4, .LBB0_43
# %bb.17: # %assert_end14
lbu a3, 20(a5)
addi a4, zero, 2
bne a3, a4, .LBB0_43
# %bb.18: # %assert_end16
# Array at +24 of record 0 (read as 32-bit words at 8-byte stride): 1, 784.
lw a3, 0(a7)
addi s0, zero, 1
bne a3, s0, .LBB0_44
# %bb.19: # %assert_end18
lw a3, 8(a7)
addi a4, zero, 784
bne a3, a4, .LBB0_45
# %bb.20: # %assert_end20
# 64-bit value at +40 of record 0 must be zero.
ld a3, 40(a5)
bnez a3, .LBB0_46
# %bb.21: # %assert_end22
# Record 1 checks. Word at +16 must be 4.
lw a3, 16(a2)
addi a4, zero, 4
bne a3, a4, .LBB0_47
# %bb.22: # %assert_end24
# Halfword +22 must be 1, byte +21 must be 32, byte +20 must be 2.
lhu a3, 22(a2)
addi s0, zero, 1
bne a3, s0, .LBB0_48
# %bb.23: # %assert_end24
lbu a3, 21(a2)
addi a4, zero, 32
bne a3, a4, .LBB0_48
# %bb.24: # %assert_end24
lbu a3, 20(a2)
addi a4, zero, 2
bne a3, a4, .LBB0_48
# %bb.25: # %assert_end26
# Array at +24 of record 1: 1, 1, 28, 28.
lw a3, 0(t0)
addi s0, zero, 1
bne a3, s0, .LBB0_49
# %bb.26: # %assert_end28
lw a3, 8(t0)
bne a3, s0, .LBB0_50
# %bb.27: # %assert_end30
lw a4, 16(t0)
addi a3, zero, 28
bne a4, a3, .LBB0_51
# %bb.28: # %assert_end32
lw a4, 24(t0)
bne a4, a3, .LBB0_52
# %bb.29: # %assert_end34
# 64-bit value at +40 of record 1 must be zero.
ld a3, 40(a2)
bnez a3, .LBB0_53
# %bb.30: # %assert_end36
# Word at +8 of record 1 must be 1.
lw a3, 8(a2)
addi s0, zero, 1
bne a3, s0, .LBB0_54
# %bb.31: # %assert_end38
# Word at +12 of record 1 must equal the word at +12 of record 0.
lw a2, 12(a2)
sext.w a3, a6
bne a3, a2, .LBB0_56
# %bb.32: # %assert_end40
# All checks passed: a0 = record 1 buffer, a1 = record 0 buffer.
call fuse_reshape_compute_
mv a0, zero
j .LBB0_37
# Failure stubs: each loads the function pointer stored at
# __TVMAPISetLastError into a1 and its message address into a0, then jumps
# to a shared tail that performs the call and builds the failure value.
.LBB0_33: # %assert_fail7
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.3)
addi a0, a0, %lo(.L.str.3)
j .LBB0_35
.LBB0_34: # %assert_fail9
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.4)
addi a0, a0, %lo(.L.str.4)
.LBB0_35: # %assert_fail
# Shared tail: report the error, then a0 = (1 << 32) - 1 = 0xFFFFFFFF.
jalr a1
addi a0, zero, 1
slli a0, a0, 32
.LBB0_36: # %assert_fail15
addi a0, a0, -1
.LBB0_37: # %assert_fail15
# Common epilogue (also reached on success with a0 = 0).
ld s0, 0(sp)
ld ra, 8(sp)
.cfi_restore ra
.cfi_restore s0
addi sp, sp, 16
.cfi_def_cfa_offset 0
ret
.LBB0_38: # %assert_fail
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str)
addi a0, a0, %lo(.L.str)
j .LBB0_35
.LBB0_39: # %assert_fail1
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.1)
addi a0, a0, %lo(.L.str.1)
j .LBB0_35
.LBB0_40: # %assert_fail5
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.2)
addi a0, a0, %lo(.L.str.2)
j .LBB0_35
.LBB0_41: # %assert_fail11
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.5)
addi a0, a0, %lo(.L.str.5)
j .LBB0_35
.LBB0_42: # %assert_fail13
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.6)
addi a0, a0, %lo(.L.str.6)
j .LBB0_35
.LBB0_43: # %assert_fail15
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.7)
addi a0, a0, %lo(.L.str.7)
j .LBB0_55
.LBB0_44: # %assert_fail17
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.8)
addi a0, a0, %lo(.L.str.8)
j .LBB0_55
.LBB0_45: # %assert_fail19
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.9)
addi a0, a0, %lo(.L.str.9)
j .LBB0_35
.LBB0_46: # %assert_fail21
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.10)
addi a0, a0, %lo(.L.str.10)
j .LBB0_35
.LBB0_47: # %assert_fail23
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.11)
addi a0, a0, %lo(.L.str.11)
j .LBB0_35
.LBB0_48: # %assert_fail25
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.12)
addi a0, a0, %lo(.L.str.12)
j .LBB0_55
.LBB0_49: # %assert_fail27
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.13)
addi a0, a0, %lo(.L.str.13)
j .LBB0_55
.LBB0_50: # %assert_fail29
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.14)
addi a0, a0, %lo(.L.str.14)
j .LBB0_35
.LBB0_51: # %assert_fail31
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.15)
addi a0, a0, %lo(.L.str.15)
j .LBB0_35
.LBB0_52: # %assert_fail33
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.16)
addi a0, a0, %lo(.L.str.16)
j .LBB0_35
.LBB0_53: # %assert_fail35
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.17)
addi a0, a0, %lo(.L.str.17)
j .LBB0_35
.LBB0_54: # %assert_fail37
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.18)
addi a0, a0, %lo(.L.str.18)
.LBB0_55: # %assert_fail15
# Alternate tail: every branch that reaches here set s0 = 1 beforehand, and
# s0 is callee-saved, so s0 << 32 yields the same 1 << 32 as .LBB0_35.
jalr a1
slli a0, s0, 32
j .LBB0_36
.LBB0_56: # %assert_fail39
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.19)
addi a0, a0, %lo(.L.str.19)
j .LBB0_35
.Lfunc_end0:
.size fuse_reshape, .Lfunc_end0-fuse_reshape
.cfi_endproc
# -- End function
# -----------------------------------------------------------------------
# fuse_reshape_compute_ -- copy 3136 bytes from the source buffer to the
# destination buffer as 28 consecutive memcpy calls of 112 bytes each.
#
# In:    a0 = destination buffer
#        a1 = source buffer
# Out:   a0 = whatever the final memcpy call leaves in a0
# Frame: 32 bytes; saves ra, s0, s1, s2.
# Live across calls: s1 = destination cursor, s0 = source cursor,
#                    s2 = source end (source + 3136).
# -----------------------------------------------------------------------
.globl fuse_reshape_compute_ # -- Begin function fuse_reshape_compute_
.p2align 2
.type fuse_reshape_compute_,@function
fuse_reshape_compute_: # @fuse_reshape_compute_
# %bb.0: # %entry
    addi sp, sp, -32
    sd ra, 24(sp)
    sd s0, 16(sp)
    sd s1, 8(sp)
    sd s2, 0(sp)
    mv s1, a0                   # s1 = destination cursor
    mv s0, a1                   # s0 = source cursor
    lui s2, 1
    addiw s2, s2, -960          # s2 = 4096 - 960 = 3136 = 28 * 112
    add s2, s0, s2              # s2 = one past the last source byte
.LBB1_1: # %copy_chunk
    # Copy one 112-byte chunk, then advance both cursors in lockstep.
    mv a0, s1
    mv a1, s0
    addi a2, zero, 112
    call memcpy
    addi s1, s1, 112
    addi s0, s0, 112
    bne s0, s2, .LBB1_1         # exactly 28 iterations
# %bb.2: # %exit
    ld s2, 0(sp)
    ld s1, 8(sp)
    ld s0, 16(sp)
    ld ra, 24(sp)
    addi sp, sp, 32
    ret
.Lfunc_end1:
.size fuse_reshape_compute_, .Lfunc_end1-fuse_reshape_compute_
# -- End function
# -----------------------------------------------------------------------
# fuse_conv2d -- argument-validating entry point that forwards to
# fuse_conv2d_compute_.
#
# In:    a0 = array of 8-byte entries; entries 0..3 are read as pointers to
#             argument records
#        a1 = array of 32-bit codes, one per argument
#        a2 = argument count (only the low 32 bits are used; must equal 4)
# Out:   a0 = 0 on success; 0x00000000FFFFFFFF after any failed check
# Frame: 64 bytes; saves ra and s0-s5.
#
# Every failed check calls the function pointer stored at
# __TVMAPISetLastError with the address of a .L.str.N message in a0.
#
# Record fields read (byte offsets): 0 = buffer pointer handed to the
# compute routine, 8 / 12 / 16 = 32-bit words, 20 / 21 = bytes,
# 22 = halfword, 24 = pointer to an array of 8-byte entries, 32 = optional
# pointer to a second such array, 40 = 64-bit value that must be zero.
# NOTE(review): this layout looks like DLPack's DLTensor (data, ctx, ndim,
# dtype, shape, strides, byte_offset) -- confirm against the TVM headers.
# NOTE(review): the failure value equals -1 only when read as a 32-bit int;
# it is not sign-extended to 64 bits -- confirm callers only test the low
# 32 bits.
# -----------------------------------------------------------------------
.globl fuse_conv2d # -- Begin function fuse_conv2d
.p2align 2
.type fuse_conv2d,@function
fuse_conv2d: # @fuse_conv2d
.cfi_startproc
# %bb.0: # %entry
addi sp, sp, -64
.cfi_def_cfa_offset 64
sd ra, 56(sp)
sd s0, 48(sp)
sd s1, 40(sp)
sd s2, 32(sp)
sd s3, 24(sp)
sd s4, 16(sp)
sd s5, 8(sp)
.cfi_offset ra, -8
.cfi_offset s0, -16
.cfi_offset s1, -24
.cfi_offset s2, -32
.cfi_offset s3, -40
.cfi_offset s4, -48
.cfi_offset s5, -56
# Zero-extend the low 32 bits of a2 and require the count to be exactly 4.
slli a2, a2, 32
srli a2, a2, 32
addi a3, zero, 4
bne a2, a3, .LBB2_74
# %bb.1: # %assert_end
# s4 / s3 / t6 / t5 = codes of arguments 0 / 1 / 2 / 3.
# s5 / t3 / a7 / a6 = record pointers 0 / 1 / 2 / 3.
# From record 0: t4 = array at +24, a0 = buffer at +0, a1 = optional array
# at +32.
lwu t5, 12(a1)
ld a6, 24(a0)
lwu t6, 8(a1)
ld a7, 16(a0)
lwu s3, 4(a1)
ld t3, 8(a0)
lwu s4, 0(a1)
ld s5, 0(a0)
ld t4, 24(s5)
ld a0, 0(s5)
ld a1, 32(s5)
beqz a1, .LBB2_6
# %bb.2: # %if_then
# Record 0's optional array is present: its entries must be 784, 784, 28, 1.
# Entry 0 is compared as a 32-bit load; later entries are loaded as 64 bits
# and truncated to their low 32 bits before the compare.
lw a3, 0(a1)
addi a2, zero, 784
bne a3, a2, .LBB2_75
# %bb.3: # %if_then
ld a3, 8(a1)
slli a3, a3, 32
srli a3, a3, 32
bne a3, a2, .LBB2_75
# %bb.4: # %if_then
ld a2, 16(a1)
slli a2, a2, 32
srli a2, a2, 32
addi a3, zero, 28
bne a2, a3, .LBB2_75
# %bb.5: # %if_then
ld a1, 24(a1)
slli a1, a1, 32
srli a1, a1, 32
addi a2, zero, 1
bne a1, a2, .LBB2_75
.LBB2_6: # %if_end
# From record 1: t2 = array at +24, a1 = buffer at +0.
# a4 / s2 = 32-bit words at +12 / +8 of record 0.
ld t2, 24(t3)
ld a1, 0(t3)
lwu a4, 12(s5)
lwu s2, 8(s5)
ld a2, 32(t3)
beqz a2, .LBB2_11
# %bb.7: # %if_then3
# Record 1's optional array is present: its entries must be 25, 25, 5, 1.
lw s0, 0(a2)
addi a3, zero, 25
bne s0, a3, .LBB2_76
# %bb.8: # %if_then3
ld s0, 8(a2)
slli s0, s0, 32
srli s0, s0, 32
bne s0, a3, .LBB2_76
# %bb.9: # %if_then3
ld a3, 16(a2)
slli a3, a3, 32
srli a3, a3, 32
addi s0, zero, 5
bne a3, s0, .LBB2_76
# %bb.10: # %if_then3
ld a2, 24(a2)
slli a2, a2, 32
srli a2, a2, 32
addi a3, zero, 1
bne a2, a3, .LBB2_76
.LBB2_11: # %if_end4
# From record 2: t1 = array at +24, a3 = buffer at +0.
ld t1, 24(a7)
ld a3, 0(a7)
ld a2, 32(a7)
beqz a2, .LBB2_13
# %bb.12: # %if_then7
# Record 2's optional array is present: its single checked entry must be 1.
# s0 = 1 is also what the .LBB2_110 failure tail reads after the call.
lw a2, 0(a2)
addi s0, zero, 1
bne a2, s0, .LBB2_77
.LBB2_13: # %if_end8
# From record 3: t0 = array at +24, a2 = buffer at +0.
ld t0, 24(a6)
ld a2, 0(a6)
ld s0, 32(a6)
beqz s0, .LBB2_18
# %bb.14: # %if_then11
# Record 3's optional array is present: its entries must be
# 25088 (lui 6 + 512), 784, 28, 1.
lui s1, 6
addiw s1, s1, 512
lw a5, 0(s0)
bne a5, s1, .LBB2_78
# %bb.15: # %if_then11
ld a5, 8(s0)
slli a5, a5, 32
srli a5, a5, 32
addi s1, zero, 784
bne a5, s1, .LBB2_78
# %bb.16: # %if_then11
ld a5, 16(s0)
slli a5, a5, 32
srli a5, a5, 32
addi s1, zero, 28
bne a5, s1, .LBB2_78
# %bb.17: # %if_then11
ld a5, 24(s0)
slli a5, a5, 32
srli a5, a5, 32
addi s0, zero, 1
bne a5, s0, .LBB2_78
.LBB2_18: # %if_end12
# Each argument code must be <= 13 and have its bit set in the mask
# 0x2098 (lui 2 + 152), i.e. be one of 3, 4, 7 or 13.
# NOTE(review): presumably TVM type codes for handle-like arguments -- confirm.
# Code of argument 0:
addi a5, zero, 13
bltu a5, s4, .LBB2_67
# %bb.19: # %if_end12
addi a5, zero, 1
sll a5, a5, s4
lui s0, 2
addiw s0, s0, 152
and a5, a5, s0
beqz a5, .LBB2_67
# %bb.20: # %assert_end16
# Code of argument 1:
addi a5, zero, 13
bltu a5, s3, .LBB2_68
# %bb.21: # %assert_end16
addi a5, zero, 1
sll a5, a5, s3
lui s0, 2
addiw s0, s0, 152
and a5, a5, s0
beqz a5, .LBB2_68
# %bb.22: # %assert_end18
# Code of argument 2:
addi a5, zero, 13
bltu a5, t6, .LBB2_69
# %bb.23: # %assert_end18
addi a5, zero, 1
sll a5, a5, t6
lui s1, 2
addiw s1, s1, 152
and a5, a5, s1
beqz a5, .LBB2_69
# %bb.24: # %assert_end20
# Code of argument 3:
addi a5, zero, 13
bltu a5, t5, .LBB2_70
# %bb.25: # %assert_end20
addi s1, zero, 1
sll a5, s1, t5
lui s0, 2
addiw s0, s0, 152
and a5, a5, s0
beqz a5, .LBB2_70
# %bb.26: # %assert_end22
# Record 0 checks. s1 still holds 1 here: word at +8 must be 1.
bne s2, s1, .LBB2_79
# %bb.27: # %assert_end24
# Word at +16 must be 4.
lw a5, 16(s5)
addi s1, zero, 4
bne a5, s1, .LBB2_80
# %bb.28: # %assert_end26
# Halfword +22 must be 1, byte +21 must be 32, byte +20 must be 2.
lhu a5, 22(s5)
addi s0, zero, 1
bne a5, s0, .LBB2_81
# %bb.29: # %assert_end26
lbu a5, 21(s5)
addi s1, zero, 32
bne a5, s1, .LBB2_81
# %bb.30: # %assert_end26
lbu a5, 20(s5)
addi s1, zero, 2
bne a5, s1, .LBB2_81
# %bb.31: # %assert_end28
# Array at +24 of record 0 (32-bit words at 8-byte stride): 1, 1, 28, 28.
lw a5, 0(t4)
addi s0, zero, 1
bne a5, s0, .LBB2_82
# %bb.32: # %assert_end30
lw a5, 8(t4)
bne a5, s0, .LBB2_83
# %bb.33: # %assert_end32
lw a5, 16(t4)
addi s1, zero, 28
bne a5, s1, .LBB2_84
# %bb.34: # %assert_end34
lw a5, 24(t4)
bne a5, s1, .LBB2_85
# %bb.35: # %assert_end36
# 64-bit value at +40 of record 0 must be zero.
ld a5, 40(s5)
bnez a5, .LBB2_86
# %bb.36: # %assert_end38
# Record 1 checks. Word at +16 must be 4.
lw a5, 16(t3)
addi s1, zero, 4
bne a5, s1, .LBB2_87
# %bb.37: # %assert_end40
# Halfword +22 must be 1, byte +21 must be 32, byte +20 must be 2.
lhu a5, 22(t3)
addi s0, zero, 1
bne a5, s0, .LBB2_88
# %bb.38: # %assert_end40
lbu a5, 21(t3)
addi s1, zero, 32
bne a5, s1, .LBB2_88
# %bb.39: # %assert_end40
lbu a5, 20(t3)
addi s1, zero, 2
bne a5, s1, .LBB2_88
# %bb.40: # %assert_end42
# Array at +24 of record 1: 32, 1, 5, 5.
lw a5, 0(t2)
addi s1, zero, 32
bne a5, s1, .LBB2_89
# %bb.41: # %assert_end44
lw a5, 8(t2)
addi s0, zero, 1
bne a5, s0, .LBB2_90
# %bb.42: # %assert_end46
lw s1, 16(t2)
addi a5, zero, 5
bne s1, a5, .LBB2_91
# %bb.43: # %assert_end48
lw s1, 24(t2)
bne s1, a5, .LBB2_92
# %bb.44: # %assert_end50
# 64-bit value at +40 of record 1 must be zero.
ld a5, 40(t3)
bnez a5, .LBB2_93
# %bb.45: # %assert_end52
# Word at +8 of record 1 must be 1.
lw a5, 8(t3)
addi s0, zero, 1
bne a5, s0, .LBB2_94
# %bb.46: # %assert_end54
# Word at +12 of record 1 must equal the word at +12 of record 0.
# a5 keeps record 0's sign-extended +12 word for the later record 2 and
# record 3 comparisons.
lw s1, 12(t3)
sext.w a5, a4
bne a5, s1, .LBB2_95
# %bb.47: # %assert_end56
# Record 2 checks. Word at +16 must be 1.
lw s1, 16(a7)
addi s0, zero, 1
bne s1, s0, .LBB2_96
# %bb.48: # %assert_end58
# Halfword +22 must be 1, byte +21 must be 32, byte +20 must be 2.
lhu s1, 22(a7)
bne s1, s0, .LBB2_97
# %bb.49: # %assert_end58
lbu s1, 21(a7)
addi s0, zero, 32
bne s1, s0, .LBB2_97
# %bb.50: # %assert_end58
lbu s1, 20(a7)
addi s0, zero, 2
bne s1, s0, .LBB2_97
# %bb.51: # %assert_end60
# Array at +24 of record 2: single entry 32.
lw s1, 0(t1)
addi s0, zero, 32
bne s1, s0, .LBB2_98
# %bb.52: # %assert_end62
# 64-bit value at +40 of record 2 must be zero.
ld s1, 40(a7)
bnez s1, .LBB2_99
# %bb.53: # %assert_end64
# Word at +8 of record 2 must be 1.
lw s1, 8(a7)
addi s0, zero, 1
bne s1, s0, .LBB2_100
# %bb.54: # %assert_end66
# Word at +12 of record 2 must equal the word at +12 of record 0.
lw s1, 12(a7)
bne a5, s1, .LBB2_101
# %bb.55: # %assert_end68
# Record 3 checks. Word at +16 must be 4.
lw s1, 16(a6)
addi s0, zero, 4
bne s1, s0, .LBB2_102
# %bb.56: # %assert_end70
# Halfword +22 must be 1, byte +21 must be 32, byte +20 must be 2.
# s2 = 1 is kept live because the .LBB2_103 failure stub reads it after
# the call.
lhu s1, 22(a6)
addi s2, zero, 1
bne s1, s2, .LBB2_103
# %bb.57: # %assert_end70
lbu s1, 21(a6)
addi s0, zero, 32
bne s1, s0, .LBB2_103
# %bb.58: # %assert_end70
lbu s1, 20(a6)
addi s0, zero, 2
bne s1, s0, .LBB2_103
# %bb.59: # %assert_end72
# Array at +24 of record 3: 1, 32, 28, 28.
lw s1, 0(t0)
addi s0, zero, 1
bne s1, s0, .LBB2_104
# %bb.60: # %assert_end74
lw s1, 8(t0)
addi s0, zero, 32
bne s1, s0, .LBB2_105
# %bb.61: # %assert_end76
lw s0, 16(t0)
addi s1, zero, 28
bne s0, s1, .LBB2_106
# %bb.62: # %assert_end78
lw s0, 24(t0)
bne s0, s1, .LBB2_107
# %bb.63: # %assert_end80
# 64-bit value at +40 of record 3 must be zero.
ld s1, 40(a6)
bnez s1, .LBB2_108
# %bb.64: # %assert_end82
# Word at +8 of record 3 must be 1.
lw s1, 8(a6)
addi s0, zero, 1
bne s1, s0, .LBB2_109
# %bb.65: # %assert_end84
# Word at +12 of record 3 must equal the word at +12 of record 0.
lw s1, 12(a6)
bne a5, s1, .LBB2_111
# %bb.66: # %assert_end86
# All checks passed: a0 = record 0 buffer, a1 = record 1 buffer,
# a2 = record 3 buffer, a3 = record 2 buffer.
call fuse_conv2d_compute_
mv a0, zero
j .LBB2_73
# Failure stubs: each loads the function pointer stored at
# __TVMAPISetLastError into a1 and its message address into a0, then jumps
# to a shared tail that performs the call and builds the failure value.
.LBB2_67: # %assert_fail15
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.25)
addi a0, a0, %lo(.L.str.25)
j .LBB2_71
.LBB2_68: # %assert_fail17
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.26)
addi a0, a0, %lo(.L.str.26)
j .LBB2_71
.LBB2_69: # %assert_fail19
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.27)
addi a0, a0, %lo(.L.str.27)
j .LBB2_71
.LBB2_70: # %assert_fail21
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.28)
addi a0, a0, %lo(.L.str.28)
.LBB2_71: # %assert_fail
# Shared tail: report the error, then a0 = (1 << 32) - 1 = 0xFFFFFFFF.
jalr a1
addi a0, zero, 1
slli a0, a0, 32
.LBB2_72: # %assert_fail9
addi a0, a0, -1
.LBB2_73: # %assert_fail9
# Common epilogue (also reached on success with a0 = 0).
ld s5, 8(sp)
ld s4, 16(sp)
ld s3, 24(sp)
ld s2, 32(sp)
ld s1, 40(sp)
ld s0, 48(sp)
ld ra, 56(sp)
.cfi_restore ra
.cfi_restore s0
.cfi_restore s1
.cfi_restore s2
.cfi_restore s3
.cfi_restore s4
.cfi_restore s5
addi sp, sp, 64
.cfi_def_cfa_offset 0
ret
.LBB2_74: # %assert_fail
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.20)
addi a0, a0, %lo(.L.str.20)
j .LBB2_71
.LBB2_75: # %assert_fail1
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.21)
addi a0, a0, %lo(.L.str.21)
j .LBB2_71
.LBB2_76: # %assert_fail5
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.22)
addi a0, a0, %lo(.L.str.22)
j .LBB2_71
.LBB2_77: # %assert_fail9
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.23)
addi a0, a0, %lo(.L.str.23)
j .LBB2_110
.LBB2_78: # %assert_fail13
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.24)
addi a0, a0, %lo(.L.str.24)
j .LBB2_71
.LBB2_79: # %assert_fail23
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.5)
addi a0, a0, %lo(.L.str.5)
j .LBB2_71
.LBB2_80: # %assert_fail25
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.29)
addi a0, a0, %lo(.L.str.29)
j .LBB2_71
.LBB2_81: # %assert_fail27
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.7)
addi a0, a0, %lo(.L.str.7)
j .LBB2_110
.LBB2_82: # %assert_fail29
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.8)
addi a0, a0, %lo(.L.str.8)
j .LBB2_110
.LBB2_83: # %assert_fail31
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.30)
addi a0, a0, %lo(.L.str.30)
j .LBB2_71
.LBB2_84: # %assert_fail33
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.31)
addi a0, a0, %lo(.L.str.31)
j .LBB2_71
.LBB2_85: # %assert_fail35
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.32)
addi a0, a0, %lo(.L.str.32)
j .LBB2_71
.LBB2_86: # %assert_fail37
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.10)
addi a0, a0, %lo(.L.str.10)
j .LBB2_71
.LBB2_87: # %assert_fail39
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.11)
addi a0, a0, %lo(.L.str.11)
j .LBB2_71
.LBB2_88: # %assert_fail41
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.12)
addi a0, a0, %lo(.L.str.12)
j .LBB2_110
.LBB2_89: # %assert_fail43
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.33)
addi a0, a0, %lo(.L.str.33)
j .LBB2_71
.LBB2_90: # %assert_fail45
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.14)
addi a0, a0, %lo(.L.str.14)
j .LBB2_110
.LBB2_91: # %assert_fail47
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.34)
addi a0, a0, %lo(.L.str.34)
j .LBB2_71
.LBB2_92: # %assert_fail49
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.35)
addi a0, a0, %lo(.L.str.35)
j .LBB2_71
.LBB2_93: # %assert_fail51
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.17)
addi a0, a0, %lo(.L.str.17)
j .LBB2_71
.LBB2_94: # %assert_fail53
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.18)
addi a0, a0, %lo(.L.str.18)
j .LBB2_110
.LBB2_95: # %assert_fail55
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.19)
addi a0, a0, %lo(.L.str.19)
j .LBB2_71
.LBB2_96: # %assert_fail57
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.36)
addi a0, a0, %lo(.L.str.36)
j .LBB2_110
.LBB2_97: # %assert_fail59
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.37)
addi a0, a0, %lo(.L.str.37)
j .LBB2_71
.LBB2_98: # %assert_fail61
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.38)
addi a0, a0, %lo(.L.str.38)
j .LBB2_71
.LBB2_99: # %assert_fail63
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.39)
addi a0, a0, %lo(.L.str.39)
j .LBB2_71
.LBB2_100: # %assert_fail65
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.40)
addi a0, a0, %lo(.L.str.40)
j .LBB2_110
.LBB2_101: # %assert_fail67
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.41)
addi a0, a0, %lo(.L.str.41)
j .LBB2_71
.LBB2_102: # %assert_fail69
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.42)
addi a0, a0, %lo(.L.str.42)
j .LBB2_71
.LBB2_103: # %assert_fail71
# This stub makes the call itself and uses s2 (set to 1 before every branch
# here) instead of s0, which may hold 32 or 2 on these paths.
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.43)
addi a0, a0, %lo(.L.str.43)
jalr a1
slli a0, s2, 32
j .LBB2_72
.LBB2_104: # %assert_fail73
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.44)
addi a0, a0, %lo(.L.str.44)
j .LBB2_110
.LBB2_105: # %assert_fail75
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.45)
addi a0, a0, %lo(.L.str.45)
j .LBB2_71
.LBB2_106: # %assert_fail77
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.46)
addi a0, a0, %lo(.L.str.46)
j .LBB2_71
.LBB2_107: # %assert_fail79
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.47)
addi a0, a0, %lo(.L.str.47)
j .LBB2_71
.LBB2_108: # %assert_fail81
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.48)
addi a0, a0, %lo(.L.str.48)
j .LBB2_71
.LBB2_109: # %assert_fail83
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.49)
addi a0, a0, %lo(.L.str.49)
.LBB2_110: # %assert_fail9
# Alternate tail: every branch that reaches here set s0 = 1 beforehand, and
# s0 is callee-saved, so s0 << 32 yields the same 1 << 32 as .LBB2_71.
jalr a1
slli a0, s0, 32
j .LBB2_72
.LBB2_111: # %assert_fail85
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.50)
addi a0, a0, %lo(.L.str.50)
j .LBB2_71
.Lfunc_end2:
.size fuse_conv2d, .Lfunc_end2-fuse_conv2d
.cfi_endproc
# -- End function
.section .sdata,"aw",@progbits
.p2align 2 # -- Begin function fuse_conv2d_compute_
.LCPI3_0:
.word 0 # float 0
.text
.globl fuse_conv2d_compute_
.p2align 2
.type fuse_conv2d_compute_,@function
fuse_conv2d_compute_: # @fuse_conv2d_compute_
.cfi_startproc
# %bb.0: # %entry
addi sp, sp, -416
.cfi_def_cfa_offset 416
sd ra, 408(sp)
sd s0, 400(sp)
sd s1, 392(sp)
sd s2, 384(sp)
sd s3, 376(sp)
sd s4, 368(sp)
sd s5, 360(sp)
sd s6, 352(sp)
sd s7, 344(sp)
sd s8, 336(sp)
sd s9, 328(sp)
sd s10, 320(sp)
sd s11, 312(sp)
.cfi_offset ra, -8
.cfi_offset s0, -16
.cfi_offset s1, -24
.cfi_offset s2, -32
.cfi_offset s3, -40
.cfi_offset s4, -48
.cfi_offset s5, -56
.cfi_offset s6, -64
.cfi_offset s7, -72
.cfi_offset s8, -80
.cfi_offset s9, -88
.cfi_offset s10, -96
.cfi_offset s11, -104
sd a3, 24(sp)
sd a2, 16(sp)
mv s6, a1
mv s7, a0
lui s0, 1
lui a0, 1
call _Znam
mv s8, a0
addiw a0, s0, -896
call _Znam
sd a0, 40(sp)
lui a0, 25
addiw s5, a0, -2048
mv a0, s5
call _Znam
mv s3, a0
mv a0, s5
call _Znam
sd a0, 8(sp)
addi s2, s7, -232
addi s1, zero, 27
lui a0, %hi(.LCPI3_0)
addi a0, a0, %lo(.LCPI3_0)
flw ft1, 0(a0)
addi s0, zero, 32
mv s4, s8
mv s5, zero
fsw ft1, 304(sp)
addiw a0, s5, -2
bgeu s1, a0, .LBB3_4
.LBB3_1: # %for_body8.preheader
slli a0, s5, 7
add a0, s8, a0
mv a1, zero
addi a2, zero, 128
call memset
flw ft1, 304(sp)
.LBB3_2: # %for_end9
addi s4, s4, 128
addi s2, s2, 112
addi s5, s5, 1
beq s5, s0, .LBB3_8
# %bb.3: # %for_begin7.preheader
addiw a0, s5, -2
bltu s1, a0, .LBB3_1
.LBB3_4: # %for_body8.us.preheader
mv a0, s4
mv a1, s2
mv a2, zero
j .LBB3_6
.LBB3_5: # %if_end11.us
# in Loop: Header=BB3_6 Depth=1
fsw ft0, 0(a0)
addi a0, a0, 4
addi a1, a1, 4
addi a2, a2, 1
beq a2, s0, .LBB3_2
.LBB3_6: # %for_body8.us
# =>This Inner Loop Header: Depth=1
addiw a3, a2, -2
fmv.s ft0, ft1
bltu s1, a3, .LBB3_5
# %bb.7: # %if_then10.us
# in Loop: Header=BB3_6 Depth=1
flw ft0, 0(a1)
j .LBB3_5
.LBB3_8: # %for_begin12.preheader
addi a0, s6, 400
ld a1, 40(sp)
addi a1, a1, 80
addi a2, zero, 4
mv a3, zero
.LBB3_9: # %for_begin15.preheader
# =>This Loop Header: Depth=1
# Child Loop BB3_10 Depth 2
addi a4, zero, -100
mv a5, a1
.LBB3_10: # %for_begin18.preheader
# Parent Loop BB3_9 Depth=1
# => This Inner Loop Header: Depth=2
add s0, a0, a4
flw ft0, -300(s0)
fsw ft0, -80(a5)
flw ft0, -200(s0)
fsw ft0, -76(a5)
flw ft0, -100(s0)
fsw ft0, -72(a5)
flw ft0, 0(s0)
fsw ft0, -68(a5)
flw ft0, 100(s0)
fsw ft0, -64(a5)
flw ft0, 200(s0)
fsw ft0, -60(a5)
flw ft0, 300(s0)
fsw ft0, -56(a5)
flw ft0, 400(s0)
fsw ft0, -52(a5)
flw ft0, -296(s0)
fsw ft0, -48(a5)
flw ft0, -196(s0)
fsw ft0, -44(a5)
flw ft0, -96(s0)
fsw ft0, -40(a5)
flw ft0, 4(s0)
fsw ft0, -36(a5)
flw ft0, 104(s0)
fsw ft0, -32(a5)
flw ft0, 204(s0)
fsw ft0, -28(a5)
flw ft0, 304(s0)
fsw ft0, -24(a5)
flw ft0, 404(s0)
fsw ft0, -20(a5)
flw ft0, -292(s0)
fsw ft0, -16(a5)
flw ft0, -192(s0)
fsw ft0, -12(a5)
flw ft0, -92(s0)
fsw ft0, -8(a5)
flw ft0, 8(s0)
fsw ft0, -4(a5)
flw ft0, 108(s0)
fsw ft0, 0(a5)
flw ft0, 208(s0)
fsw ft0, 4(a5)
flw ft0, 308(s0)
fsw ft0, 8(a5)
flw ft0, 408(s0)
fsw ft0, 12(a5)
flw ft0, -288(s0)
fsw ft0, 16(a5)
flw ft0, -188(s0)
fsw ft0, 20(a5)
flw ft0, -88(s0)
fsw ft0, 24(a5)
flw ft0, 12(s0)
fsw ft0, 28(a5)
flw ft0, 112(s0)
fsw ft0, 32(a5)
flw ft0, 212(s0)
fsw ft0, 36(a5)
flw ft0, 312(s0)
fsw ft0, 40(a5)
flw ft0, 412(s0)
fsw ft0, 44(a5)
flw ft0, -284(s0)
fsw ft0, 48(a5)
flw ft0, -184(s0)
fsw ft0, 52(a5)
flw ft0, -84(s0)
fsw ft0, 56(a5)
flw ft0, 16(s0)
fsw ft0, 60(a5)
flw ft0, 116(s0)
fsw ft0, 64(a5)
flw ft0, 216(s0)
fsw ft0, 68(a5)
flw ft0, 316(s0)
fsw ft0, 72(a5)
flw ft0, 416(s0)
fsw ft0, 76(a5)
addi a5, a5, 160
addi a4, a4, 20
bnez a4, .LBB3_10
# %bb.11: # %for_end17
# in Loop: Header=BB3_9 Depth=1
addi a0, a0, 800
addi a1, a1, 800
addi a3, a3, 1
bne a3, a2, .LBB3_9
# %bb.12: # %for_begin24.preheader
sd s8, 288(sp)
lui a0, 131072
addiw a0, a0, -1
sd a0, 32(sp)
addi a6, zero, 28
addi a4, zero, 8
addi a5, zero, 4
addi a3, zero, 1
addi a0, zero, 2
addi a2, zero, 3
mv s0, zero
.LBB3_13: # %for_begin27.preheader
# =>This Loop Header: Depth=1
# Child Loop BB3_14 Depth 2
# Child Loop BB3_16 Depth 2
# Child Loop BB3_17 Depth 3
srli a1, s0, 3
ld s1, 32(sp)
and a1, a1, s1
sd s0, 48(sp)
andi s1, s0, 7
sd s1, 304(sp)
sd a1, 248(sp)
mul a1, a1, a6
sd a1, 160(sp)
mv t3, zero
.LBB3_14: # %for_begin30.preheader
# Parent Loop BB3_13 Depth=1
# => This Inner Loop Header: Depth=2
ld a1, 160(sp)
add a1, t3, a1
addi s1, zero, 224
mul a1, a1, s1
ld s1, 304(sp)
or a1, a1, s1
sext.w s0, a1
slli s0, s0, 2
add s0, s3, s0
sw zero, 0(s0)
ori s0, a1, 8
sext.w s0, s0
slli s0, s0, 2
add s0, s3, s0
sw zero, 0(s0)
ori s0, a1, 16
sext.w s0, s0
slli s0, s0, 2
add s0, s3, s0
sw zero, 0(s0)
ori s0, a1, 24
sext.w s0, s0
slli s0, s0, 2
add s0, s3, s0
sw zero, 0(s0)
addiw s0, a1, 32
slli s0, s0, 2
add s0, s3, s0
sw zero, 0(s0)
addiw s0, a1, 40
slli s0, s0, 2
add s0, s3, s0
sw zero, 0(s0)
addiw s0, a1, 160
slli s1, s0, 2
sd s1, 280(sp)
addiw s0, a1, 168
slli t1, s0, 2
addiw s0, a1, 176
slli t2, s0, 2
addiw s0, a1, 184
slli a7, s0, 2
addiw s0, a1, 192
slli t4, s0, 2
addiw s0, a1, 200
slli t5, s0, 2
addiw s0, a1, 208
slli t6, s0, 2
addiw s0, a1, 216
slli s2, s0, 2
addiw s0, a1, 104
slli s1, s0, 2
sd s1, 256(sp)
addiw s0, a1, 112
slli s4, s0, 2
addiw s0, a1, 120
slli s5, s0, 2
addiw s0, a1, 128
slli s6, s0, 2
addiw s0, a1, 136
slli s7, s0, 2
addiw s0, a1, 144
slli s8, s0, 2
addiw s0, a1, 152
slli s9, s0, 2
addiw s0, a1, 64
slli s10, s0, 2
addiw s0, a1, 72
slli s11, s0, 2
addiw s0, a1, 80
slli s0, s0, 2
addiw a6, a1, 88
slli a6, a6, 2
addiw t0, a1, 96
slli t0, t0, 2
add s1, s3, s2
sd s1, 296(sp)
add s1, s3, t6
sd s1, 272(sp)
add s1, s3, t5
sd s1, 264(sp)
add t6, s3, t4
add t5, s3, a7
add t4, s3, t2
add t2, s3, t1
ld s1, 280(sp)
add t1, s3, s1
add s9, s3, s9
add s8, s3, s8
add s7, s3, s7
add s6, s3, s6
add s5, s3, s5
add s4, s3, s4
ld s1, 256(sp)
add s1, s3, s1
add t0, s3, t0
add a6, s3, a6
add a7, s3, s0
add s11, s3, s11
add s10, s3, s10
addiw s2, a1, 56
slli s0, s2, 2
add s0, s3, s0
addiw a1, a1, 48
slli a1, a1, 2
add a1, s3, a1
sw zero, 0(a1)
sw zero, 0(s0)
sw zero, 0(s10)
sw zero, 0(s11)
sw zero, 0(a7)
sw zero, 0(a6)
sw zero, 0(t0)
sw zero, 0(s1)
sw zero, 0(s4)
sw zero, 0(s5)
sw zero, 0(s6)
sw zero, 0(s7)
sw zero, 0(s8)
sw zero, 0(s9)
sw zero, 0(t1)
sw zero, 0(t2)
sw zero, 0(t4)
sw zero, 0(t5)
sw zero, 0(t6)
ld a1, 264(sp)
sw zero, 0(a1)
ld a1, 272(sp)
sw zero, 0(a1)
ld a1, 296(sp)
sw zero, 0(a1)
addi a1, t3, 1
addiw s0, t3, 1
mv t3, a1
addi a1, zero, 28
bltu s0, a1, .LBB3_14
# %bb.15: # %for_begin33.preheader
# in Loop: Header=BB3_13 Depth=1
ld a1, 160(sp)
addi a1, zero, 200
ld s1, 248(sp)
mul a1, s1, a1
ld s1, 304(sp)
or a1, a1, s1
addi s0, a1, 184
slli a6, s0, 32
addi s0, a1, 192
slli s0, s0, 32
srli a7, s0, 32
srli a6, a6, 32
addi s0, a1, 8
slli t0, s0, 32
addi s0, a1, 16
slli t1, s0, 32
addi s0, a1, 24
slli t2, s0, 32
addi s0, a1, 32
slli t3, s0, 32
addi s0, a1, 40
slli t4, s0, 32
addi s0, a1, 96
slli t5, s0, 32
addi s0, a1, 152
slli s1, s0, 32
sd s1, 280(sp)
addi s0, a1, 48
slli s2, s0, 32
addi s0, a1, 56
slli s1, s0, 32
addi s0, a1, 64
slli s4, s0, 32
addi s0, a1, 72
slli s5, s0, 32
addi s0, a1, 80
slli s6, s0, 32
addi s0, a1, 88
slli s7, s0, 32
slli s0, a1, 32
srli s8, s0, 32
srli s0, t4, 32
sd s0, 296(sp)
srli s0, t3, 32
sd s0, 256(sp)
srli s0, t2, 32
sd s0, 248(sp)
srli s0, t1, 32
sd s0, 240(sp)
srli s0, t0, 32
sd s0, 232(sp)
slli s0, a6, 2
sd s0, 264(sp)
slli t0, a7, 2
addi s0, a1, 168
slli s9, s0, 32
addi s0, a1, 104
slli s10, s0, 32
addi s0, a1, 112
slli s11, s0, 32
addi s0, a1, 120
slli a6, s0, 32
addi t4, a1, 128
slli t4, t4, 32
addi t6, a1, 136
slli t6, t6, 32
addi t3, a1, 144
slli t3, t3, 32
slli s8, s8, 2
addi t2, a1, 160
slli t2, t2, 32
srli t5, t5, 32
srli s7, s7, 32
srli s6, s6, 32
srli s5, s5, 32
srli s4, s4, 32
srli s1, s1, 32
srli s2, s2, 32
ld s0, 280(sp)
srli t1, s0, 32
srli t3, t3, 32
srli t6, t6, 32
srli t4, t4, 32
srli a7, a6, 32
srli s11, s11, 32
srli s10, s10, 32
srli s9, s9, 32
srli t2, t2, 32
ld a6, 40(sp)
add s0, a6, s8
sd s0, 280(sp)
add s0, a6, t0
sd s0, 272(sp)
ld s0, 264(sp)
add s0, a6, s0
sd s0, 264(sp)
ld s0, 232(sp)
slli s0, s0, 2
sd s0, 152(sp)
ld s0, 240(sp)
slli s0, s0, 2
sd s0, 144(sp)
ld s0, 248(sp)
slli s0, s0, 2
sd s0, 136(sp)
ld s0, 256(sp)
slli s0, s0, 2
sd s0, 80(sp)
ld s0, 296(sp)
slli s0, s0, 2
sd s0, 296(sp)
slli s0, s2, 2
sd s0, 96(sp)
slli s8, s1, 2
slli s2, s4, 2
slli s5, s5, 2
slli s4, s6, 2
slli t0, s7, 2
slli t5, t5, 2
slli s10, s10, 2
slli s6, s11, 2
slli s7, a7, 2
slli t4, t4, 2
slli t6, t6, 2
slli t3, t3, 2
slli s1, t1, 2
slli t2, t2, 2
slli s0, s9, 2
addi a1, a1, 176
slli a1, a1, 32
srli a1, a1, 32
slli a1, a1, 2
add a1, a6, a1
sd a1, 256(sp)
add a1, a6, s0
sd a1, 248(sp)
add a1, a6, t2
sd a1, 240(sp)
add a1, a6, s1
sd a1, 232(sp)
add a1, a6, t3
sd a1, 224(sp)
add a1, a6, t6
sd a1, 216(sp)
add a1, a6, t4
sd a1, 208(sp)
add a1, a6, s7
sd a1, 200(sp)
add a1, a6, s6
sd a1, 192(sp)
add a1, a6, s10
sd a1, 184(sp)
add a1, a6, t5
sd a1, 176(sp)
add a1, a6, t0
sd a1, 168(sp)
add a1, a6, s4
sd a1, 128(sp)
add a1, a6, s5
sd a1, 120(sp)
add a1, a6, s2
sd a1, 112(sp)
add a1, a6, s8
sd a1, 104(sp)
ld a1, 96(sp)
add a1, a6, a1
sd a1, 88(sp)
ld a1, 296(sp)
add a1, a6, a1
sd a1, 96(sp)
ld a1, 80(sp)
add a1, a6, a1
sd a1, 80(sp)
ld a1, 136(sp)
add a1, a6, a1
sd a1, 72(sp)
ld a1, 144(sp)
add a1, a6, a1
sd a1, 64(sp)
ld a1, 152(sp)
add a1, a6, a1
sd a1, 56(sp)
mv s4, zero
mv s1, zero
mv s0, zero
.LBB3_16: # %for_begin36.preheader
# Parent Loop BB3_13 Depth=1
# => This Loop Header: Depth=2
# Child Loop BB3_17 Depth 3
sd s1, 144(sp)
ld a1, 160(sp)
sd s0, 136(sp)
add a1, s0, a1
addi s10, zero, 7
mul a1, a1, s10
sd a1, 296(sp)
sd s4, 152(sp)
mv t0, zero
ld s8, 128(sp)
ld s9, 120(sp)
ld s11, 112(sp)
ld s5, 104(sp)
ld t3, 96(sp)
ld t5, 88(sp)
ld s6, 80(sp)
ld t4, 72(sp)
ld t6, 64(sp)
ld s7, 56(sp)
.LBB3_17: # %for_body37
# Parent Loop BB3_13 Depth=1
# Parent Loop BB3_16 Depth=2
# => This Inner Loop Header: Depth=3
ld a1, 296(sp)
add s1, t0, a1
slli s1, s1, 5
ld a1, 304(sp)
or s1, s1, a1
vsetvl a1, a5, a4
ld a1, 288(sp)
add a7, a1, s4
vle.v v0, ( a7 )
ld a1, 280(sp)
flw ft0, 0(a1)
fmv.x.w a1, ft0
vmv.v.x v1, a1
vslide1up.vx v2, v1, a1
vslide1up.vx v1, v2, a1
vslide1up.vx v2, v1, a1
vslide1up.vx v1, v2, a1
ori a1, s1, 24
sext.w a1, a1
slli a1, a1, 2
add a6, s3, a1
flw ft0, 0(a6)
fmv.x.w a1, ft0
sext.w s0, s1
slli s0, s0, 2
add t1, s3, s0
flw ft0, 0(t1)
fmv.x.w s0, ft0
vmv.v.x v2, s0
vslide1up.vx v3, v2, a1
vfmul.vv v0, v0, v1
ori a1, s1, 16
sext.w a1, a1
slli a1, a1, 2
add s2, s3, a1
flw ft0, 0(s2)
fmv.x.w a1, ft0
vslide1up.vx v1, v3, a1
ori a1, s1, 8
sext.w a1, a1
slli a1, a1, 2
add t2, s3, a1
flw ft0, 0(t2)
fmv.x.w a1, ft0
vslide1up.vx v2, v1, a1
vslide1up.vx v1, v2, s0
vfadd.vv v0, v0, v1
vslideup.vx v1, v0, zero
vfmv.f.s ft0, v1
fsw ft0, 0(t1)
vslideup.vx v1, v0, a3
vfmv.f.s ft0, v1
fsw ft0, 0(t2)
vslideup.vx v1, v0, a0
vfmv.f.s ft0, v1
fsw ft0, 0(s2)
vslideup.vx v1, v0, a2
vfmv.f.s ft0, v1
fsw ft0, 0(a6)
vsetvl a1, a5, a4
addi a1, a7, 4
vle.v v0, ( a1 )
flw ft0, 0(a6)
fmv.x.w a1, ft0
flw ft0, 0(t1)
fmv.x.w s0, ft0
vmv.v.x v1, s0
vslide1up.vx v2, v1, a1
flw ft0, 0(s2)
fmv.x.w a1, ft0
vslide1up.vx v1, v2, a1
flw ft0, 0(t2)
fmv.x.w a1, ft0
vslide1up.vx v2, v1, a1
vslide1up.vx v1, v2, s0
flw ft0, 0(s7)
fmv.x.w a1, ft0
vmv.v.x v2, a1
vslide1up.vx v3, v2, a1
vslide1up.vx v2, v3, a1
vslide1up.vx v3, v2, a1
vslide1up.vx v2, v3, a1
vfmul.vv v0, v0, v2
vfadd.vv v0, v0, v1
vslideup.vx v1, v0, zero
vfmv.f.s ft0, v1
fsw ft0, 0(t1)
vslideup.vx v1, v0, a3
vfmv.f.s ft0, v1
fsw ft0, 0(t2)
vslideup.vx v1, v0, a0
vfmv.f.s ft0, v1
fsw ft0, 0(s2)
vslideup.vx v1, v0, a2
vfmv.f.s ft0, v1
fsw ft0, 0(a6)
vsetvl a1, a5, a4
addi a1, a7, 8
vle.v v0, ( a1 )
flw ft0, 0(a6)
fmv.x.w a1, ft0
flw ft0, 0(t1)
fmv.x.w s0, ft0
vmv.v.x v1, s0
vslide1up.vx v2, v1, a1
flw ft0, 0(s2)
fmv.x.w a1, ft0
vslide1up.vx v1, v2, a1
flw ft0, 0(t2)
fmv.x.w a1, ft0
vslide1up.vx v2, v1, a1
vslide1up.vx v1, v2, s0
flw ft0, 0(t6)
fmv.x.w a1, ft0
vmv.v.x v2, a1
vslide1up.vx v3, v2, a1
vslide1up.vx v2, v3, a1
vslide1up.vx v3, v2, a1
vslide1up.vx v2, v3, a1
vfmul.vv v0, v0, v2
vfadd.vv v0, v0, v1
vslideup.vx v1, v0, zero
vfmv.f.s ft0, v1
fsw ft0, 0(t1)
vslideup.vx v1, v0, a3
vfmv.f.s ft0, v1
fsw ft0, 0(t2)
vslideup.vx v1, v0, a0
vfmv.f.s ft0, v1
fsw ft0, 0(s2)
vslideup.vx v1, v0, a2
vfmv.f.s ft0, v1
fsw ft0, 0(a6)
vsetvl a1, a5, a4
addi a1, a7, 12
vle.v v0, ( a1 )
flw ft0, 0(a6)
fmv.x.w a1, ft0
flw ft0, 0(t1)
fmv.x.w s0, ft0
vmv.v.x v1, s0
vslide1up.vx v2, v1, a1
flw ft0, 0(s2)
fmv.x.w a1, ft0
vslide1up.vx v1, v2, a1
flw ft0, 0(t2)
fmv.x.w a1, ft0
vslide1up.vx v2, v1, a1
vslide1up.vx v1, v2, s0
flw ft0, 0(t4)
fmv.x.w a1, ft0
vmv.v.x v2, a1
vslide1up.vx v3, v2, a1
vslide1up.vx v2, v3, a1
vslide1up.vx v3, v2, a1
vslide1up.vx v2, v3, a1
vfmul.vv v0, v0, v2
vfadd.vv v0, v0, v1
vslideup.vx v1, v0, zero
vfmv.f.s ft0, v1
fsw ft0, 0(t1)
vslideup.vx v1, v0, a3
vfmv.f.s ft0, v1
fsw ft0, 0(t2)
vslideup.vx v1, v0, a0
vfmv.f.s ft0, v1
fsw ft0, 0(s2)
vslideup.vx v1, v0, a2
vfmv.f.s ft0, v1
fsw ft0, 0(a6)
vsetvl a1, a5, a4
addi a1, a7, 16
vle.v v0, ( a1 )
flw ft0, 0(a6)
fmv.x.w a1, ft0
flw ft0, 0(t1)
fmv.x.w s0, ft0
vmv.v.x v1, s0
vslide1up.vx v2, v1, a1
flw ft0, 0(s2)
fmv.x.w a1, ft0
vslide1up.vx v1, v2, a1
flw ft0, 0(t2)
fmv.x.w a1, ft0
vslide1up.vx v2, v1, a1
vslide1up.vx v1, v2, s0
flw ft0, 0(s6)
fmv.x.w a1, ft0
vmv.v.x v2, a1
vslide1up.vx v3, v2, a1
vslide1up.vx v2, v3, a1
vslide1up.vx v3, v2, a1
vslide1up.vx v2, v3, a1
vfmul.vv v0, v0, v2
vfadd.vv v0, v0, v1
vslideup.vx v1, v0, zero
vfmv.f.s ft0, v1
fsw ft0, 0(t1)
vslideup.vx v1, v0, a3
vfmv.f.s ft0, v1
fsw ft0, 0(t2)
vslideup.vx v1, v0, a0
vfmv.f.s ft0, v1
fsw ft0, 0(s2)
vslideup.vx v1, v0, a2
vfmv.f.s ft0, v1
fsw ft0, 0(a6)
vsetvl a1, a5, a4
addi a1, a7, 128
vle.v v0, ( a1 )
flw ft0, 0(a6)
fmv.x.w a1, ft0
flw ft0, 0(t1)
fmv.x.w s0, ft0
vmv.v.x v1, s0
vslide1up.vx v2, v1, a1
flw ft0, 0(s2)
fmv.x.w a1, ft0
vslide1up.vx v1, v2, a1
flw ft0, 0(t2)
fmv.x.w a1, ft0
vslide1up.vx v2, v1, a1
vslide1up.vx v1, v2, s0
flw ft0, 0(t3)
fmv.x.w a1, ft0
vmv.v.x v2, a1
vslide1up.vx v3, v2, a1
vslide1up.vx v2, v3, a1
vslide1up.vx v3, v2, a1
vslide1up.vx v2, v3, a1
vfmul.vv v0, v0, v2
vfadd.vv v0, v0, v1
vslideup.vx v1, v0, zero
vfmv.f.s ft0, v1
fsw ft0, 0(t1)
vslideup.vx v1, v0, a3
vfmv.f.s ft0, v1
fsw ft0, 0(t2)
vslideup.vx v1, v0, a0
vfmv.f.s ft0, v1
fsw ft0, 0(s2)
vslideup.vx v1, v0, a2
vfmv.f.s ft0, v1
fsw ft0, 0(a6)
vsetvl a1, a5, a4
addi a1, a7, 132
vle.v v0, ( a1 )
flw ft0, 0(a6)
fmv.x.w a1, ft0
flw ft0, 0(t1)
fmv.x.w s0, ft0
vmv.v.x v1, s0
vslide1up.vx v2, v1, a1
flw ft0, 0(s2)
fmv.x.w a1, ft0
vslide1up.vx v1, v2, a1
flw ft0, 0(t2)
fmv.x.w a1, ft0
vslide1up.vx v2, v1, a1
vslide1up.vx v1, v2, s0
flw ft0, 0(t5)
fmv.x.w a1, ft0
vmv.v.x v2, a1
vslide1up.vx v3, v2, a1
vslide1up.vx v2, v3, a1
vslide1up.vx v3, v2, a1
vslide1up.vx v2, v3, a1
vfmul.vv v0, v0, v2
vfadd.vv v0, v0, v1
vslideup.vx v1, v0, zero
vfmv.f.s ft0, v1
fsw ft0, 0(t1)
vslideup.vx v1, v0, a3
vfmv.f.s ft0, v1
fsw ft0, 0(t2)
vslideup.vx v1, v0, a0
vfmv.f.s ft0, v1
fsw ft0, 0(s2)
vslideup.vx v1, v0, a2
vfmv.f.s ft0, v1
fsw ft0, 0(a6)
vsetvl a1, a5, a4
addi a1, a7, 136
vle.v v0, ( a1 )
flw ft0, 0(a6)
fmv.x.w a1, ft0
flw ft0, 0(t1)
fmv.x.w s0, ft0
vmv.v.x v1, s0
vslide1up.vx v2, v1, a1
flw ft0, 0(s2)
fmv.x.w a1, ft0
vslide1up.vx v1, v2, a1
flw ft0, 0(t2)
fmv.x.w a1, ft0
vslide1up.vx v2, v1, a1
vslide1up.vx v1, v2, s0
flw ft0, 0(s5)
fmv.x.w a1, ft0
vmv.v.x v2, a1
vslide1up.vx v3, v2, a1
vslide1up.vx v2, v3, a1
vslide1up.vx v3, v2, a1
vslide1up.vx v2, v3, a1
vfmul.vv v0, v0, v2
vfadd.vv v0, v0, v1
vslideup.vx v1, v0, zero
vfmv.f.s ft0, v1
fsw ft0, 0(t1)
vslideup.vx v1, v0, a3
vfmv.f.s ft0, v1
fsw ft0, 0(t2)
vslideup.vx v1, v0, a0
vfmv.f.s ft0, v1
fsw ft0, 0(s2)
vslideup.vx v1, v0, a2
vfmv.f.s ft0, v1
fsw ft0, 0(a6)
vsetvl a1, a5, a4
addi a1, a7, 140
vle.v v0, ( a1 )
flw ft0, 0(a6)
fmv.x.w a1, ft0
flw ft0, 0(t1)
fmv.x.w s0, ft0
vmv.v.x v1, s0
vslide1up.vx v2, v1, a1
flw ft0, 0(s2)
fmv.x.w a1, ft0
vslide1up.vx v1, v2, a1
flw ft0, 0(t2)
fmv.x.w a1, ft0
vslide1up.vx v2, v1, a1
vslide1up.vx v1, v2, s0
flw ft0, 0(s11)
fmv.x.w a1, ft0
vmv.v.x v2, a1
vslide1up.vx v3, v2, a1
vslide1up.vx v2, v3, a1
vslide1up.vx v3, v2, a1
vslide1up.vx v2, v3, a1
vfmul.vv v0, v0, v2
vfadd.vv v0, v0, v1
vslideup.vx v1, v0, zero
vfmv.f.s ft0, v1
fsw ft0, 0(t1)
vslideup.vx v1, v0, a3
vfmv.f.s ft0, v1
fsw ft0, 0(t2)
vslideup.vx v1, v0, a0
vfmv.f.s ft0, v1
fsw ft0, 0(s2)
vslideup.vx v1, v0, a2
vfmv.f.s ft0, v1
fsw ft0, 0(a6)
vsetvl a1, a5, a4
addi a1, a7, 144
vle.v v0, ( a1 )
flw ft0, 0(a6)
fmv.x.w a1, ft0
flw ft0, 0(t1)
fmv.x.w s0, ft0
vmv.v.x v1, s0
vslide1up.vx v2, v1, a1
flw ft0, 0(s2)
fmv.x.w a1, ft0
vslide1up.vx v1, v2, a1
flw ft0, 0(t2)
fmv.x.w a1, ft0
vslide1up.vx v2, v1, a1
vslide1up.vx v1, v2, s0
flw ft0, 0(s9)
fmv.x.w a1, ft0
vmv.v.x v2, a1
vslide1up.vx v3, v2, a1
vslide1up.vx v2, v3, a1
vslide1up.vx v3, v2, a1
vslide1up.vx v2, v3, a1
vfmul.vv v0, v0, v2
vfadd.vv v0, v0, v1
vslideup.vx v1, v0, zero
vfmv.f.s ft0, v1
fsw ft0, 0(t1)
vslideup.vx v1, v0, a3
vfmv.f.s ft0, v1
fsw ft0, 0(t2)
vslideup.vx v1, v0, a0
vfmv.f.s ft0, v1
fsw ft0, 0(s2)
vslideup.vx v1, v0, a2
vfmv.f.s ft0, v1
fsw ft0, 0(a6)
vsetvl a1, a5, a4
addi a1, a7, 256
vle.v v0, ( a1 )
flw ft0, 0(a6)
fmv.x.w a1, ft0
flw ft0, 0(t1)
fmv.x.w s0, ft0
vmv.v.x v1, s0
vslide1up.vx v2, v1, a1
flw ft0, 0(s2)
fmv.x.w a1, ft0
vslide1up.vx v1, v2, a1
flw ft0, 0(t2)
fmv.x.w a1, ft0
vslide1up.vx v2, v1, a1
vslide1up.vx v1, v2, s0
flw ft0, 0(s8)
fmv.x.w a1, ft0
vmv.v.x v2, a1
vslide1up.vx v3, v2, a1
vslide1up.vx v2, v3, a1
vslide1up.vx v3, v2, a1
vslide1up.vx v2, v3, a1
vfmul.vv v0, v0, v2
vfadd.vv v0, v0, v1
vslideup.vx v1, v0, zero
vfmv.f.s ft0, v1
fsw ft0, 0(t1)
vslideup.vx v1, v0, a3
vfmv.f.s ft0, v1
fsw ft0, 0(t2)
vslideup.vx v1, v0, a0
vfmv.f.s ft0, v1
fsw ft0, 0(s2)
vslideup.vx v1, v0, a2
vfmv.f.s ft0, v1
fsw ft0, 0(a6)
vsetvl a1, a5, a4
addi a1, a7, 260
vle.v v0, ( a1 )
flw ft0, 0(a6)
fmv.x.w a1, ft0
flw ft0, 0(t1)
fmv.x.w s0, ft0
vmv.v.x v1, s0
vslide1up.vx v2, v1, a1
flw ft0, 0(s2)
fmv.x.w a1, ft0
vslide1up.vx v1, v2, a1
flw ft0, 0(t2)
fmv.x.w a1, ft0
vslide1up.vx v2, v1, a1
vslide1up.vx v1, v2, s0
ld a1, 168(sp)
flw ft0, 0(a1)
fmv.x.w a1, ft0
vmv.v.x v2, a1
vslide1up.vx v3, v2, a1
vslide1up.vx v2, v3, a1
vslide1up.vx v3, v2, a1
vslide1up.vx v2, v3, a1
vfmul.vv v0, v0, v2
vfadd.vv v0, v0, v1
vslideup.vx v1, v0, zero
vfmv.f.s ft0, v1
fsw ft0, 0(t1)
vslideup.vx v1, v0, a3
vfmv.f.s ft0, v1
fsw ft0, 0(t2)
vslideup.vx v1, v0, a0
vfmv.f.s ft0, v1
fsw ft0, 0(s2)
vslideup.vx v1, v0, a2
vfmv.f.s ft0, v1
fsw ft0, 0(a6)
vsetvl a1, a5, a4
addi a1, a7, 264
vle.v v0, ( a1 )
flw ft0, 0(a6)
fmv.x.w a1, ft0
flw ft0, 0(t1)
fmv.x.w s0, ft0
vmv.v.x v1, s0
vslide1up.vx v2, v1, a1
flw ft0, 0(s2)
fmv.x.w a1, ft0
vslide1up.vx v1, v2, a1
flw ft0, 0(t2)
fmv.x.w a1, ft0
vslide1up.vx v2, v1, a1
vslide1up.vx v1, v2, s0
ld a1, 176(sp)
flw ft0, 0(a1)
fmv.x.w a1, ft0
vmv.v.x v2, a1
vslide1up.vx v3, v2, a1
vslide1up.vx v2, v3, a1
vslide1up.vx v3, v2, a1
vslide1up.vx v2, v3, a1
vfmul.vv v0, v0, v2
vfadd.vv v0, v0, v1
vslideup.vx v1, v0, zero
vfmv.f.s ft0, v1
fsw ft0, 0(t1)
vslideup.vx v1, v0, a3
vfmv.f.s ft0, v1
fsw ft0, 0(t2)
vslideup.vx v1, v0, a0
vfmv.f.s ft0, v1
fsw ft0, 0(s2)
vslideup.vx v1, v0, a2
vfmv.f.s ft0, v1
fsw ft0, 0(a6)
vsetvl a1, a5, a4
addi a1, a7, 268
vle.v v0, ( a1 )
flw ft0, 0(a6)
fmv.x.w a1, ft0
flw ft0, 0(t1)
fmv.x.w s0, ft0
vmv.v.x v1, s0
vslide1up.vx v2, v1, a1
flw ft0, 0(s2)
fmv.x.w a1, ft0
vslide1up.vx v1, v2, a1
flw ft0, 0(t2)
fmv.x.w a1, ft0
vslide1up.vx v2, v1, a1
vslide1up.vx v1, v2, s0
ld a1, 184(sp)
flw ft0, 0(a1)
fmv.x.w a1, ft0
vmv.v.x v2, a1
vslide1up.vx v3, v2, a1
vslide1up.vx v2, v3, a1
vslide1up.vx v3, v2, a1
vslide1up.vx v2, v3, a1
vfmul.vv v0, v0, v2
vfadd.vv v0, v0, v1
vslideup.vx v1, v0, zero
vfmv.f.s ft0, v1
fsw ft0, 0(t1)
vslideup.vx v1, v0, a3
vfmv.f.s ft0, v1
fsw ft0, 0(t2)
vslideup.vx v1, v0, a0
vfmv.f.s ft0, v1
fsw ft0, 0(s2)
vslideup.vx v1, v0, a2
vfmv.f.s ft0, v1
fsw ft0, 0(a6)
vsetvl a1, a5, a4
addi a1, a7, 272
vle.v v0, ( a1 )
flw ft0, 0(a6)
fmv.x.w a1, ft0
flw ft0, 0(t1)
fmv.x.w s0, ft0
vmv.v.x v1, s0
vslide1up.vx v2, v1, a1
flw ft0, 0(s2)
fmv.x.w a1, ft0
vslide1up.vx v1, v2, a1
flw ft0, 0(t2)
fmv.x.w a1, ft0
vslide1up.vx v2, v1, a1
vslide1up.vx v1, v2, s0
ld a1, 192(sp)
flw ft0, 0(a1)
fmv.x.w a1, ft0
vmv.v.x v2, a1
vslide1up.vx v3, v2, a1
vslide1up.vx v2, v3, a1
vslide1up.vx v3, v2, a1
vslide1up.vx v2, v3, a1
vfmul.vv v0, v0, v2
vfadd.vv v0, v0, v1
vslideup.vx v1, v0, zero
vfmv.f.s ft0, v1
fsw ft0, 0(t1)
vslideup.vx v1, v0, a3
vfmv.f.s ft0, v1
fsw ft0, 0(t2)
vslideup.vx v1, v0, a0
vfmv.f.s ft0, v1
fsw ft0, 0(s2)
vslideup.vx v1, v0, a2
vfmv.f.s ft0, v1
fsw ft0, 0(a6)
vsetvl a1, a5, a4
addi a1, a7, 384
vle.v v0, ( a1 )
flw ft0, 0(a6)
fmv.x.w a1, ft0
flw ft0, 0(t1)
fmv.x.w s0, ft0
vmv.v.x v1, s0
vslide1up.vx v2, v1, a1
flw ft0, 0(s2)
fmv.x.w a1, ft0
vslide1up.vx v1, v2, a1
flw ft0, 0(t2)
fmv.x.w a1, ft0
vslide1up.vx v2, v1, a1
vslide1up.vx v1, v2, s0
ld a1, 200(sp)
flw ft0, 0(a1)
fmv.x.w a1, ft0
vmv.v.x v2, a1
vslide1up.vx v3, v2, a1
vslide1up.vx v2, v3, a1
vslide1up.vx v3, v2, a1
vslide1up.vx v2, v3, a1
vfmul.vv v0, v0, v2
vfadd.vv v0, v0, v1
vslideup.vx v1, v0, zero
vfmv.f.s ft0, v1
fsw ft0, 0(t1)
vslideup.vx v1, v0, a3
vfmv.f.s ft0, v1
fsw ft0, 0(t2)
vslideup.vx v1, v0, a0
vfmv.f.s ft0, v1
fsw ft0, 0(s2)
vslideup.vx v1, v0, a2
vfmv.f.s ft0, v1
fsw ft0, 0(a6)
vsetvl a1, a5, a4
addi a1, a7, 388
vle.v v0, ( a1 )
flw ft0, 0(a6)
fmv.x.w a1, ft0
flw ft0, 0(t1)
fmv.x.w s0, ft0
vmv.v.x v1, s0
vslide1up.vx v2, v1, a1
flw ft0, 0(s2)
fmv.x.w a1, ft0
vslide1up.vx v1, v2, a1
flw ft0, 0(t2)
fmv.x.w a1, ft0
vslide1up.vx v2, v1, a1
vslide1up.vx v1, v2, s0
ld a1, 208(sp)
flw ft0, 0(a1)
fmv.x.w a1, ft0
vmv.v.x v2, a1
vslide1up.vx v3, v2, a1
vslide1up.vx v2, v3, a1
vslide1up.vx v3, v2, a1
vslide1up.vx v2, v3, a1
vfmul.vv v0, v0, v2
vfadd.vv v0, v0, v1
vslideup.vx v1, v0, zero
vfmv.f.s ft0, v1
fsw ft0, 0(t1)
vslideup.vx v1, v0, a3
vfmv.f.s ft0, v1
fsw ft0, 0(t2)
vslideup.vx v1, v0, a0
vfmv.f.s ft0, v1
fsw ft0, 0(s2)
vslideup.vx v1, v0, a2
vfmv.f.s ft0, v1
fsw ft0, 0(a6)
vsetvl a1, a5, a4
addi a1, a7, 392
vle.v v0, ( a1 )
flw ft0, 0(a6)
fmv.x.w a1, ft0
flw ft0, 0(t1)
fmv.x.w s0, ft0
vmv.v.x v1, s0
vslide1up.vx v2, v1, a1
flw ft0, 0(s2)
fmv.x.w a1, ft0
vslide1up.vx v1, v2, a1
flw ft0, 0(t2)
fmv.x.w a1, ft0
vslide1up.vx v2, v1, a1
vslide1up.vx v1, v2, s0
ld a1, 216(sp)
flw ft0, 0(a1)
fmv.x.w a1, ft0
vmv.v.x v2, a1
vslide1up.vx v3, v2, a1
vslide1up.vx v2, v3, a1
vslide1up.vx v3, v2, a1
vslide1up.vx v2, v3, a1
vfmul.vv v0, v0, v2
vfadd.vv v0, v0, v1
vslideup.vx v1, v0, zero
vfmv.f.s ft0, v1
fsw ft0, 0(t1)
vslideup.vx v1, v0, a3
vfmv.f.s ft0, v1
fsw ft0, 0(t2)
vslideup.vx v1, v0, a0
vfmv.f.s ft0, v1
fsw ft0, 0(s2)
vslideup.vx v1, v0, a2
vfmv.f.s ft0, v1
fsw ft0, 0(a6)
vsetvl a1, a5, a4
addi a1, a7, 396
vle.v v0, ( a1 )
flw ft0, 0(a6)
fmv.x.w a1, ft0
flw ft0, 0(t1)
fmv.x.w s0, ft0
vmv.v.x v1, s0
vslide1up.vx v2, v1, a1
flw ft0, 0(s2)
fmv.x.w a1, ft0
vslide1up.vx v1, v2, a1
flw ft0, 0(t2)
fmv.x.w a1, ft0
vslide1up.vx v2, v1, a1
vslide1up.vx v1, v2, s0
ld a1, 224(sp)
flw ft0, 0(a1)
fmv.x.w a1, ft0
vmv.v.x v2, a1
vslide1up.vx v3, v2, a1
vslide1up.vx v2, v3, a1
vslide1up.vx v3, v2, a1
vslide1up.vx v2, v3, a1
vfmul.vv v0, v0, v2
vfadd.vv v0, v0, v1
vslideup.vx v1, v0, zero
vfmv.f.s ft0, v1
fsw ft0, 0(t1)
vslideup.vx v1, v0, a3
vfmv.f.s ft0, v1
fsw ft0, 0(t2)
vslideup.vx v1, v0, a0
vfmv.f.s ft0, v1
fsw ft0, 0(s2)
vslideup.vx v1, v0, a2
vfmv.f.s ft0, v1
fsw ft0, 0(a6)
vsetvl a1, a5, a4
addi a1, a7, 400
vle.v v0, ( a1 )
flw ft0, 0(a6)
fmv.x.w a1, ft0
flw ft0, 0(t1)
fmv.x.w s0, ft0
vmv.v.x v1, s0
vslide1up.vx v2, v1, a1
flw ft0, 0(s2)
fmv.x.w a1, ft0
vslide1up.vx v1, v2, a1
flw ft0, 0(t2)
fmv.x.w a1, ft0
vslide1up.vx v2, v1, a1
vslide1up.vx v1, v2, s0
ld a1, 232(sp)
flw ft0, 0(a1)
fmv.x.w a1, ft0
vmv.v.x v2, a1
vslide1up.vx v3, v2, a1
vslide1up.vx v2, v3, a1
vslide1up.vx v3, v2, a1
vslide1up.vx v2, v3, a1
vfmul.vv v0, v0, v2
vfadd.vv v0, v0, v1
vslideup.vx v1, v0, zero
vfmv.f.s ft0, v1
fsw ft0, 0(t1)
vslideup.vx v1, v0, a3
vfmv.f.s ft0, v1
fsw ft0, 0(t2)
vslideup.vx v1, v0, a0
vfmv.f.s ft0, v1
fsw ft0, 0(s2)
vslideup.vx v1, v0, a2
vfmv.f.s ft0, v1
fsw ft0, 0(a6)
vsetvl a1, a5, a4
addi a1, a7, 512
vle.v v0, ( a1 )
flw ft0, 0(a6)
fmv.x.w a1, ft0
flw ft0, 0(t1)
fmv.x.w s0, ft0
vmv.v.x v1, s0
vslide1up.vx v2, v1, a1
flw ft0, 0(s2)
fmv.x.w a1, ft0
vslide1up.vx v1, v2, a1
flw ft0, 0(t2)
fmv.x.w a1, ft0
vslide1up.vx v2, v1, a1
vslide1up.vx v1, v2, s0
ld a1, 240(sp)
flw ft0, 0(a1)
fmv.x.w a1, ft0
vmv.v.x v2, a1
vslide1up.vx v3, v2, a1
vslide1up.vx v2, v3, a1
vslide1up.vx v3, v2, a1
vslide1up.vx v2, v3, a1
vfmul.vv v0, v0, v2
vfadd.vv v0, v0, v1
vslideup.vx v1, v0, zero
vfmv.f.s ft0, v1
fsw ft0, 0(t1)
vslideup.vx v1, v0, a3
vfmv.f.s ft0, v1
fsw ft0, 0(t2)
vslideup.vx v1, v0, a0
vfmv.f.s ft0, v1
fsw ft0, 0(s2)
vslideup.vx v1, v0, a2
vfmv.f.s ft0, v1
fsw ft0, 0(a6)
vsetvl a1, a5, a4
addi a1, a7, 516
vle.v v0, ( a1 )
flw ft0, 0(a6)
fmv.x.w a1, ft0
flw ft0, 0(t1)
fmv.x.w s0, ft0
vmv.v.x v1, s0
vslide1up.vx v2, v1, a1
flw ft0, 0(s2)
fmv.x.w a1, ft0
vslide1up.vx v1, v2, a1
flw ft0, 0(t2)
fmv.x.w a1, ft0
vslide1up.vx v2, v1, a1
vslide1up.vx v1, v2, s0
ld a1, 248(sp)
flw ft0, 0(a1)
fmv.x.w a1, ft0
vmv.v.x v2, a1
vslide1up.vx v3, v2, a1
vslide1up.vx v2, v3, a1
vslide1up.vx v3, v2, a1
vslide1up.vx v2, v3, a1
vfmul.vv v0, v0, v2
vfadd.vv v0, v0, v1
vslideup.vx v1, v0, zero
vfmv.f.s ft0, v1
fsw ft0, 0(t1)
vslideup.vx v1, v0, a3
vfmv.f.s ft0, v1
fsw ft0, 0(t2)
vslideup.vx v1, v0, a0
vfmv.f.s ft0, v1
fsw ft0, 0(s2)
vslideup.vx v1, v0, a2
vfmv.f.s ft0, v1
fsw ft0, 0(a6)
vsetvl a1, a5, a4
addi a1, a7, 520
vle.v v0, ( a1 )
flw ft0, 0(a6)
fmv.x.w a1, ft0
flw ft0, 0(t1)
fmv.x.w s0, ft0
vmv.v.x v1, s0
vslide1up.vx v2, v1, a1
flw ft0, 0(s2)
fmv.x.w a1, ft0
vslide1up.vx v1, v2, a1
flw ft0, 0(t2)
fmv.x.w a1, ft0
vslide1up.vx v2, v1, a1
vslide1up.vx v1, v2, s0
ld a1, 256(sp)
flw ft0, 0(a1)
fmv.x.w a1, ft0
vmv.v.x v2, a1
vslide1up.vx v3, v2, a1
vslide1up.vx v2, v3, a1
vslide1up.vx v3, v2, a1
vslide1up.vx v2, v3, a1
vfmul.vv v0, v0, v2
vfadd.vv v0, v0, v1
vslideup.vx v1, v0, zero
vfmv.f.s ft0, v1
fsw ft0, 0(t1)
vslideup.vx v1, v0, a3
vfmv.f.s ft0, v1
fsw ft0, 0(t2)
vslideup.vx v1, v0, a0
vfmv.f.s ft0, v1
fsw ft0, 0(s2)
vslideup.vx v1, v0, a2
vfmv.f.s ft0, v1
fsw ft0, 0(a6)
vsetvl a1, a5, a4
addi a1, a7, 524
vle.v v0, ( a1 )
flw ft0, 0(a6)
fmv.x.w a1, ft0
flw ft0, 0(t1)
fmv.x.w s0, ft0
vmv.v.x v1, s0
vslide1up.vx v2, v1, a1
flw ft0, 0(s2)
fmv.x.w a1, ft0
vslide1up.vx v1, v2, a1
flw ft0, 0(t2)
fmv.x.w a1, ft0
vslide1up.vx v2, v1, a1
vslide1up.vx v1, v2, s0
ld a1, 264(sp)
flw ft0, 0(a1)
fmv.x.w a1, ft0
vmv.v.x v2, a1
vslide1up.vx v3, v2, a1
vslide1up.vx v2, v3, a1
vslide1up.vx v3, v2, a1
vslide1up.vx v2, v3, a1
vfmul.vv v0, v0, v2
vfadd.vv v0, v0, v1
vslideup.vx v1, v0, zero
vfmv.f.s ft0, v1
fsw ft0, 0(t1)
vslideup.vx v1, v0, a3
vfmv.f.s ft0, v1
fsw ft0, 0(t2)
vslideup.vx v1, v0, a0
vfmv.f.s ft0, v1
fsw ft0, 0(s2)
vslideup.vx v1, v0, a2
vfmv.f.s ft0, v1
fsw ft0, 0(a6)
vsetvl a1, a5, a4
addi a1, a7, 528
vle.v v0, ( a1 )
flw ft0, 0(a6)
fmv.x.w a1, ft0
flw ft0, 0(t1)
fmv.x.w s1, ft0
vmv.v.x v1, s1
vslide1up.vx v2, v1, a1
flw ft0, 0(s2)
fmv.x.w a1, ft0
vslide1up.vx v1, v2, a1
flw ft0, 0(t2)
fmv.x.w a1, ft0
vslide1up.vx v2, v1, a1
vslide1up.vx v1, v2, s1
ld a1, 272(sp)
flw ft0, 0(a1)
fmv.x.w a1, ft0
vmv.v.x v2, a1
vslide1up.vx v3, v2, a1
vslide1up.vx v2, v3, a1
vslide1up.vx v3, v2, a1
vslide1up.vx v2, v3, a1
vfmul.vv v0, v0, v2
vfadd.vv v0, v0, v1
vslideup.vx v1, v0, zero
vfmv.f.s ft0, v1
fsw ft0, 0(t1)
vslideup.vx v1, v0, a3
vfmv.f.s ft0, v1
fsw ft0, 0(t2)
vslideup.vx v1, v0, a0
vfmv.f.s ft0, v1
fsw ft0, 0(s2)
vslideup.vx v1, v0, a2
vfmv.f.s ft0, v1
fsw ft0, 0(a6)
addi s4, s4, 16
addi t0, t0, 1
addi s10, s10, -1
bnez s10, .LBB3_17
# %bb.18: # %for_end38
# in Loop: Header=BB3_16 Depth=2
ld s4, 152(sp)
addi s4, s4, 128
ld s0, 136(sp)
addi s0, s0, 1
ld s1, 144(sp)
addi s1, s1, 1
addi a1, zero, 28
bne s1, a1, .LBB3_16
# %bb.19: # %for_end35
# in Loop: Header=BB3_13 Depth=1
ld s1, 48(sp)
addi a1, s1, 1
addiw s1, s1, 1
mv s0, a1
addi a6, zero, 28
addi a1, zero, 32
bgeu s1, a1, .LBB3_20
j .LBB3_13
.LBB3_20: # %for_begin39.preheader
addi t2, zero, 28
addi t6, zero, 112
lui a0, 1
addiw a7, a0, -960
addi a6, zero, 32
ld a0, 8(sp)
mv t0, a0
mv t1, zero
ld s2, 288(sp)
.LBB3_21: # %for_begin42.preheader
# =>This Loop Header: Depth=1
# Child Loop BB3_22 Depth 2
# Child Loop BB3_23 Depth 3
srliw a1, t1, 3
mul t3, a1, t2
andi a3, t1, 7
mv a4, t0
mv t4, zero
mv t5, zero
.LBB3_22: # %for_begin45.preheader
# Parent Loop BB3_21 Depth=1
# => This Loop Header: Depth=2
# Child Loop BB3_23 Depth 3
add a1, t5, t3
mul a1, a1, t2
mv s0, zero
mv a2, zero
.LBB3_23: # %for_body46
# Parent Loop BB3_21 Depth=1
# Parent Loop BB3_22 Depth=2
# => This Inner Loop Header: Depth=3
add s1, a2, a1
slli s1, s1, 3
or s1, s1, a3
sext.w s1, s1
slli s1, s1, 2
add s1, s3, s1
add a5, a4, s0
flw ft0, 0(s1)
fsw ft0, 0(a5)
addi a2, a2, 1
addi s0, s0, 4
bne s0, t6, .LBB3_23
# %bb.24: # %for_end47
# in Loop: Header=BB3_22 Depth=2
addi a4, a4, 112
addi t5, t5, 1
addi t4, t4, 1
bne t4, t2, .LBB3_22
# %bb.25: # %for_end44
# in Loop: Header=BB3_21 Depth=1
add t0, t0, a7
addi t1, t1, 1
bne t1, a6, .LBB3_21
# %bb.26: # %for_begin48.preheader
addi s1, zero, 56
lui a1, 1
addiw a7, a1, -960
addi a6, zero, 32
mv a3, zero
ld t0, 24(sp)
ld a1, 16(sp)
.LBB3_27: # %for_begin51.preheader
# =>This Loop Header: Depth=1
# Child Loop BB3_28 Depth 2
slli a2, a3, 2
add a2, t0, a2
addi a4, zero, 28
flw ft0, 0(a2)
mv a5, s1
.LBB3_28: # %for_begin54.preheader
# Parent Loop BB3_27 Depth=1
# => This Inner Loop Header: Depth=2
add s0, a1, a5
add a2, a0, a5
flw ft1, -56(a2)
fadd.s ft1, ft0, ft1
fsw ft1, -56(s0)
flw ft1, -52(a2)
fadd.s ft1, ft0, ft1
fsw ft1, -52(s0)
flw ft1, -48(a2)
fadd.s ft1, ft0, ft1
fsw ft1, -48(s0)
flw ft1, -44(a2)
fadd.s ft1, ft0, ft1
fsw ft1, -44(s0)
flw ft1, -40(a2)
fadd.s ft1, ft0, ft1
fsw ft1, -40(s0)
flw ft1, -36(a2)
fadd.s ft1, ft0, ft1
fsw ft1, -36(s0)
flw ft1, -32(a2)
fadd.s ft1, ft0, ft1
fsw ft1, -32(s0)
flw ft1, -28(a2)
fadd.s ft1, ft0, ft1
fsw ft1, -28(s0)
flw ft1, -24(a2)
fadd.s ft1, ft0, ft1
fsw ft1, -24(s0)
flw ft1, -20(a2)
fadd.s ft1, ft0, ft1
fsw ft1, -20(s0)
flw ft1, -16(a2)
fadd.s ft1, ft0, ft1
fsw ft1, -16(s0)
flw ft1, -12(a2)
fadd.s ft1, ft0, ft1
fsw ft1, -12(s0)
flw ft1, -8(a2)
fadd.s ft1, ft0, ft1
fsw ft1, -8(s0)
flw ft1, -4(a2)
fadd.s ft1, ft0, ft1
fsw ft1, -4(s0)
flw ft1, 0(a2)
fadd.s ft1, ft0, ft1
fsw ft1, 0(s0)
flw ft1, 4(a2)
fadd.s ft1, ft0, ft1
fsw ft1, 4(s0)
flw ft1, 8(a2)
fadd.s ft1, ft0, ft1
fsw ft1, 8(s0)
flw ft1, 12(a2)
fadd.s ft1, ft0, ft1
fsw ft1, 12(s0)
flw ft1, 16(a2)
fadd.s ft1, ft0, ft1
fsw ft1, 16(s0)
flw ft1, 20(a2)
fadd.s ft1, ft0, ft1
fsw ft1, 20(s0)
flw ft1, 24(a2)
fadd.s ft1, ft0, ft1
fsw ft1, 24(s0)
flw ft1, 28(a2)
fadd.s ft1, ft0, ft1
fsw ft1, 28(s0)
flw ft1, 32(a2)
fadd.s ft1, ft0, ft1
fsw ft1, 32(s0)
flw ft1, 36(a2)
fadd.s ft1, ft0, ft1
fsw ft1, 36(s0)
flw ft1, 40(a2)
fadd.s ft1, ft0, ft1
fsw ft1, 40(s0)
flw ft1, 44(a2)
fadd.s ft1, ft0, ft1
fsw ft1, 44(s0)
flw ft1, 48(a2)
fadd.s ft1, ft0, ft1
fsw ft1, 48(s0)
flw ft1, 52(a2)
fadd.s ft1, ft0, ft1
fsw ft1, 52(s0)
addi a5, a5, 112
addi a4, a4, -1
bnez a4, .LBB3_28
# %bb.29: # %for_end53
# in Loop: Header=BB3_27 Depth=1
add s1, s1, a7
addi a3, a3, 1
bne a3, a6, .LBB3_27
# %bb.30: # %for_end50
call _ZdaPv
mv a0, s3
call _ZdaPv
ld a0, 40(sp)
call _ZdaPv
mv a0, s2
call _ZdaPv
ld s11, 312(sp)
ld s10, 320(sp)
ld s9, 328(sp)
ld s8, 336(sp)
ld s7, 344(sp)
ld s6, 352(sp)
ld s5, 360(sp)
ld s4, 368(sp)
ld s3, 376(sp)
ld s2, 384(sp)
ld s1, 392(sp)
ld s0, 400(sp)
ld ra, 408(sp)
.cfi_restore ra
.cfi_restore s0
.cfi_restore s1
.cfi_restore s2
.cfi_restore s3
.cfi_restore s4
.cfi_restore s5
.cfi_restore s6
.cfi_restore s7
.cfi_restore s8
.cfi_restore s9
.cfi_restore s10
.cfi_restore s11
addi sp, sp, 416
.cfi_def_cfa_offset 0
ret
.Lfunc_end3:
.size fuse_conv2d_compute_, .Lfunc_end3-fuse_conv2d_compute_
.cfi_endproc
# -- End function
# ----------------------------------------------------------------------
# fuse_relu -- argument-checking wrapper around fuse_relu_compute_.
#
# In:   a0 = pointer to an array of 8-byte argument slots; slots zero
#            and one are each loaded and used as a descriptor pointer
#       a1 = pointer to an array of 32-bit codes, one per argument
#            (entries zero and one are read; presumably TVM type codes)
#       a2 = argument count; only the low 32 bits are examined
# Out:  a0 = zero when every check passes and the compute kernel has
#            run; the 64-bit value 0x00000000FFFFFFFF when a check fails
#            (after calling the function pointer stored in
#            __TVMAPISetLastError with the address of a .L.str.* message)
# Stack: a 32-byte frame holding ra, s0 and s1.
#
# The descriptor offsets read below (0, 8, 12, 16, 20-22, 24, 32, 40)
# look like the DLPack DLTensor layout (data, ctx.device_type,
# ctx.device_id, ndim, dtype.code/bits/lanes, shape, strides,
# byte_offset) -- TODO confirm; the field names used in the comments
# below rely on that assumption.
#
# NOTE(review): the failure value has its upper 32 bits clear.  If the
# C-level return type is a 32-bit int, the RV64 calling convention
# expects it sign-extended; confirm callers only test for non-zero.
# ----------------------------------------------------------------------
.globl fuse_relu # -- Begin function fuse_relu
.p2align 2
.type fuse_relu,@function
fuse_relu: # @fuse_relu
.cfi_startproc
# %bb.0: # %entry
# Prologue: open the 32-byte frame and spill ra, s0 and s1.
addi sp, sp, -32
.cfi_def_cfa_offset 32
sd ra, 24(sp)
sd s0, 16(sp)
sd s1, 8(sp)
.cfi_offset ra, -8
.cfi_offset s0, -16
.cfi_offset s1, -24
# Zero-extend the low 32 bits of the argument count; it must be exactly 2.
slli a2, a2, 32
srli a2, a2, 32
addi a3, zero, 2
bne a2, a3, .LBB4_30
# %bb.1: # %assert_end
lwu a4, 4(a1) # a4 = code of argument one
ld a2, 8(a0) # a2 = descriptor pointer from slot one
lwu a3, 0(a1) # a3 = code of argument zero
ld a5, 0(a0) # a5 = descriptor pointer from slot zero
ld t0, 24(a5) # t0 = pointer at offset 24 of arg0 (assumed shape)
ld a1, 0(a5) # a1 = pointer at offset 0 of arg0; passed on as the kernel's source
ld a0, 32(a5) # a0 = pointer at offset 32 of arg0 (assumed strides); may be null
beqz a0, .LBB4_3
# %bb.2: # %if_then
# The optional pointer is non-null: the 32-bit word it points at must be 1.
lw a0, 0(a0)
addi s0, zero, 1
bne a0, s0, .LBB4_31
.LBB4_3: # %if_end
ld a7, 24(a2) # a7 = pointer at offset 24 of arg1 (assumed shape)
ld a0, 0(a2) # a0 = pointer at offset 0 of arg1; passed on as the kernel's destination
lwu a6, 12(a5) # a6 = word at offset 12 of arg0 (assumed device_id), compared with arg1 later
lwu t1, 8(a5) # t1 = word at offset 8 of arg0 (assumed device_type)
ld s0, 32(a2) # s0 = pointer at offset 32 of arg1 (assumed strides); may be null
beqz s0, .LBB4_5
# %bb.4: # %if_then3
# Same optional check for arg1; s1 keeps the constant 1 for the failure path.
lw s0, 0(s0)
addi s1, zero, 1
bne s0, s1, .LBB4_32
.LBB4_5: # %if_end4
# Code of argument zero must be at most 13 and have its bit set in the
# mask 0x2098, i.e. it must be one of 3, 4, 7 or 13.
addi s1, zero, 13
bltu s1, a3, .LBB4_25
# %bb.6: # %if_end4
addi s1, zero, 1
sll a3, s1, a3
lui s1, 2
addiw s1, s1, 152 # s1 = 0x2098
and a3, a3, s1
beqz a3, .LBB4_25
# %bb.7: # %assert_end8
# Same range-and-mask test for the code of argument one.
addi a3, zero, 13
bltu a3, a4, .LBB4_26
# %bb.8: # %assert_end8
addi a3, zero, 1
sll a4, a3, a4
lui s1, 2
addiw s1, s1, 152 # s1 = 0x2098
and a4, a4, s1
beqz a4, .LBB4_26
# %bb.9: # %assert_end10
# Word at offset 8 of arg0 must equal 1 (a3 still holds the constant 1).
bne t1, a3, .LBB4_33
# %bb.10: # %assert_end12
# Word at offset 16 of arg0 (assumed ndim) must be 1.
lw a3, 16(a5)
addi s0, zero, 1
bne a3, s0, .LBB4_34
# %bb.11: # %assert_end14
# Bytes 20..23 of arg0 (assumed dtype): halfword at 22 must be 1, byte at
# offset 21 must be 32 and byte at offset 20 must be 2.
lhu a3, 22(a5)
bne a3, s0, .LBB4_35
# %bb.12: # %assert_end14
lbu a3, 21(a5)
addi a4, zero, 32
bne a3, a4, .LBB4_35
# %bb.13: # %assert_end14
lbu a3, 20(a5)
addi a4, zero, 2
bne a3, a4, .LBB4_35
# %bb.14: # %assert_end16
# First word behind t0 must equal 25088, the same count the kernel loops over.
lui a3, 6
addiw a3, a3, 512 # a3 = 25088
lw a4, 0(t0)
bne a4, a3, .LBB4_36
# %bb.15: # %assert_end18
# Doubleword at offset 40 of arg0 (assumed byte_offset) must be zero.
ld a3, 40(a5)
bnez a3, .LBB4_37
# %bb.16: # %assert_end20
# The same sequence of checks is now applied to the arg1 descriptor in a2.
lw a3, 16(a2)
addi s0, zero, 1
bne a3, s0, .LBB4_38
# %bb.17: # %assert_end22
lhu a3, 22(a2)
bne a3, s0, .LBB4_39
# %bb.18: # %assert_end22
lbu a3, 21(a2)
addi a4, zero, 32
bne a3, a4, .LBB4_39
# %bb.19: # %assert_end22
lbu a3, 20(a2)
addi a4, zero, 2
bne a3, a4, .LBB4_39
# %bb.20: # %assert_end24
lui a3, 6
addiw a3, a3, 512 # a3 = 25088
lw a4, 0(a7)
bne a4, a3, .LBB4_40
# %bb.21: # %assert_end26
ld a3, 40(a2)
bnez a3, .LBB4_41
# %bb.22: # %assert_end28
# Word at offset 8 of arg1 must be 1, matching the arg0 check above.
lw a3, 8(a2)
addi s0, zero, 1
bne a3, s0, .LBB4_42
# %bb.23: # %assert_end30
# Word at offset 12 of arg1 must equal the one saved from arg0 in a6.
lw a2, 12(a2)
sext.w a3, a6
bne a3, a2, .LBB4_44
# %bb.24: # %assert_end32
# All checks passed: a0 = arg1 pointer (written), a1 = arg0 pointer (read).
call fuse_relu_compute_
mv a0, zero # success result
j .LBB4_29
# Failure stubs.  Each one loads the function pointer stored at
# __TVMAPISetLastError into a1 and the address of its message string into
# a0, then joins one of the shared tails that performs the call.
.LBB4_25: # %assert_fail7
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.54)
addi a0, a0, %lo(.L.str.54)
j .LBB4_27
.LBB4_26: # %assert_fail9
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.55)
addi a0, a0, %lo(.L.str.55)
.LBB4_27: # %assert_fail
# Shared tail: report the message, then build 1 << 32 in a0.
jalr a1
addi a0, zero, 1
slli a0, a0, 32
.LBB4_28: # %assert_fail1
# Every failure path arrives with a0 = 1 << 32; the result is 0xFFFFFFFF.
addi a0, a0, -1
.LBB4_29: # %assert_fail1
# Common epilogue for success and failure: reload s1, s0, ra and pop the frame.
ld s1, 8(sp)
ld s0, 16(sp)
ld ra, 24(sp)
.cfi_restore ra
.cfi_restore s0
.cfi_restore s1
addi sp, sp, 32
.cfi_def_cfa_offset 0
ret
.LBB4_30: # %assert_fail
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.51)
addi a0, a0, %lo(.L.str.51)
j .LBB4_27
.LBB4_31: # %assert_fail1
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.52)
addi a0, a0, %lo(.L.str.52)
j .LBB4_43
.LBB4_32: # %assert_fail5
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.53)
addi a0, a0, %lo(.L.str.53)
jalr a1
# On this path s1 holds the constant 1 set just before the branch here;
# s1 is callee-saved, so it is expected to survive the call above.
slli a0, s1, 32
j .LBB4_28
.LBB4_33: # %assert_fail11
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.5)
addi a0, a0, %lo(.L.str.5)
j .LBB4_27
.LBB4_34: # %assert_fail13
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.56)
addi a0, a0, %lo(.L.str.56)
j .LBB4_43
.LBB4_35: # %assert_fail15
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.7)
addi a0, a0, %lo(.L.str.7)
j .LBB4_27
.LBB4_36: # %assert_fail17
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.57)
addi a0, a0, %lo(.L.str.57)
j .LBB4_27
.LBB4_37: # %assert_fail19
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.10)
addi a0, a0, %lo(.L.str.10)
j .LBB4_27
.LBB4_38: # %assert_fail21
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.58)
addi a0, a0, %lo(.L.str.58)
j .LBB4_43
.LBB4_39: # %assert_fail23
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.12)
addi a0, a0, %lo(.L.str.12)
j .LBB4_27
.LBB4_40: # %assert_fail25
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.59)
addi a0, a0, %lo(.L.str.59)
j .LBB4_27
.LBB4_41: # %assert_fail27
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.17)
addi a0, a0, %lo(.L.str.17)
j .LBB4_27
.LBB4_42: # %assert_fail29
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.18)
addi a0, a0, %lo(.L.str.18)
.LBB4_43: # %assert_fail1
# Shared tail for the paths on which s0 holds the constant 1 (every branch
# that leads here is preceded by "addi s0, zero, 1").
jalr a1
slli a0, s0, 32
j .LBB4_28
.LBB4_44: # %assert_fail31
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.19)
addi a0, a0, %lo(.L.str.19)
j .LBB4_27
.Lfunc_end4:
.size fuse_relu, .Lfunc_end4-fuse_relu
.cfi_endproc
# -- End function
# ----------------------------------------------------------------------
# fuse_relu_compute_ -- element-wise max(x, 0.0f) over a fixed-length
# run of 32-bit floats.
#
#   In:    a0 = destination pointer (written with fsw)
#          a1 = source pointer (read with flw)
#   Out:   no result is produced; a0 and a1 each end one element past
#          the last access
#   Clobb: a0, a1, a2, a3, ft0, ft1
#
# The trip count is the assemble-time constant 25088; there is no length
# argument and the loop body always runs at least once.
# ----------------------------------------------------------------------
        .section .sdata,"aw",@progbits
        .p2align 2                      # -- Begin function fuse_relu_compute_
.LCPI5_0:
        .word 0                         # float 0
        .text
        .globl fuse_relu_compute_
        .p2align 2
        .type fuse_relu_compute_,@function
fuse_relu_compute_:                     # @fuse_relu_compute_
        # Fetch the clamp floor (0.0f) from the constant pool.
        lui a3, %hi(.LCPI5_0)
        addi a3, a3, %lo(.LCPI5_0)
        flw ft0, 0(a3)
        li a2, 25088                    # a2 = elements still to process
.Lfuse_relu_compute_loop:               # one float per iteration
        flw ft1, 0(a1)                  # ft1 = *src
        addi a1, a1, 4                  # src++
        fmax.s ft1, ft1, ft0            # ft1 = max(ft1, 0.0f)
        fsw ft1, 0(a0)                  # *dst = ft1
        addi a0, a0, 4                  # dst++
        addi a2, a2, -1
        bne a2, zero, .Lfuse_relu_compute_loop
        ret
.Lfunc_end5:
        .size fuse_relu_compute_, .Lfunc_end5-fuse_relu_compute_
                                        # -- End function
.globl fuse_max_pool2d # -- Begin function fuse_max_pool2d
.p2align 2
.type fuse_max_pool2d,@function
fuse_max_pool2d: # @fuse_max_pool2d
.cfi_startproc
# %bb.0: # %entry
addi sp, sp, -16
.cfi_def_cfa_offset 16
sd ra, 8(sp)
sd s0, 0(sp)
.cfi_offset ra, -8
.cfi_offset s0, -16
slli a2, a2, 32
srli a2, a2, 32
addi a3, zero, 2
bne a2, a3, .LBB6_42
# %bb.1: # %assert_end
lwu t0, 4(a1)
ld a2, 8(a0)
lwu t3, 0(a1)
ld a5, 0(a0)
ld t2, 24(a5)
ld a1, 0(a5)
ld a0, 32(a5)
beqz a0, .LBB6_6
# %bb.2: # %if_then
lui a3, 6
addiw a3, a3, 512
lw s0, 0(a0)
bne s0, a3, .LBB6_43
# %bb.3: # %if_then
ld a3, 8(a0)
slli a3, a3, 32
srli a3, a3, 32
addi s0, zero, 784
bne a3, s0, .LBB6_43
# %bb.4: # %if_then
ld a3, 16(a0)
slli a3, a3, 32
srli a3, a3, 32
addi s0, zero, 28
bne a3, s0, .LBB6_43
# %bb.5: # %if_then
ld a0, 24(a0)
slli a0, a0, 32
srli a0, a0, 32
addi a3, zero, 1
bne a0, a3, .LBB6_43
.LBB6_6: # %if_end
ld a7, 24(a2)
ld a0, 0(a2)
lwu a6, 12(a5)
lwu t1, 8(a5)
ld a3, 32(a2)
beqz a3, .LBB6_11
# %bb.7: # %if_then3
lui s0, 2
addiw s0, s0, -1920
lw a4, 0(a3)
bne a4, s0, .LBB6_44
# %bb.8: # %if_then3
ld a4, 8(a3)
slli a4, a4, 32
srli a4, a4, 32
addi s0, zero, 196
bne a4, s0, .LBB6_44
# %bb.9: # %if_then3
ld a4, 16(a3)
slli a4, a4, 32
srli a4, a4, 32
addi s0, zero, 14
bne a4, s0, .LBB6_44
# %bb.10: # %if_then3
ld a3, 24(a3)
slli a3, a3, 32
srli a3, a3, 32
addi a4, zero, 1
bne a3, a4, .LBB6_44
.LBB6_11: # %if_end4
addi a3, zero, 13
bltu a3, t3, .LBB6_37
# %bb.12: # %if_end4
addi a3, zero, 1
sll a3, a3, t3
lui a4, 2
addiw a4, a4, 152
and a3, a3, a4
beqz a3, .LBB6_37
# %bb.13: # %assert_end8
addi a3, zero, 13
bltu a3, t0, .LBB6_38
# %bb.14: # %assert_end8
addi a3, zero, 1
sll a4, a3, t0
lui s0, 2
addiw s0, s0, 152
and a4, a4, s0
beqz a4, .LBB6_38
# %bb.15: # %assert_end10
bne t1, a3, .LBB6_45
# %bb.16: # %assert_end12
lw a3, 16(a5)
addi a4, zero, 4
bne a3, a4, .LBB6_46
# %bb.17: # %assert_end14
lhu a3, 22(a5)
addi s0, zero, 1
bne a3, s0, .LBB6_47
# %bb.18: # %assert_end14
lbu a3, 21(a5)
addi a4, zero, 32
bne a3, a4, .LBB6_47
# %bb.19: # %assert_end14
lbu a3, 20(a5)
addi a4, zero, 2
bne a3, a4, .LBB6_47
# %bb.20: # %assert_end16
lw a3, 0(t2)
addi s0, zero, 1
bne a3, s0, .LBB6_48
# %bb.21: # %assert_end18
lw a3, 8(t2)
addi a4, zero, 32
bne a3, a4, .LBB6_49
# %bb.22: # %assert_end20
lw a4, 16(t2)
addi a3, zero, 28
bne a4, a3, .LBB6_50
# %bb.23: # %assert_end22
lw a4, 24(t2)
bne a4, a3, .LBB6_51
# %bb.24: # %assert_end24
ld a3, 40(a5)
bnez a3, .LBB6_52
# %bb.25: # %assert_end26
lw a3, 16(a2)
addi a4, zero, 4
bne a3, a4, .LBB6_53
# %bb.26: # %assert_end28
lhu a3, 22(a2)
addi s0, zero, 1
bne a3, s0, .LBB6_54
# %bb.27: # %assert_end28
lbu a3, 21(a2)
addi a4, zero, 32
bne a3, a4, .LBB6_54
# %bb.28: # %assert_end28
lbu a3, 20(a2)
addi a4, zero, 2
bne a3, a4, .LBB6_54
# %bb.29: # %assert_end30
lw a3, 0(a7)
addi s0, zero, 1
bne a3, s0, .LBB6_55
# %bb.30: # %assert_end32
lw a3, 8(a7)
addi a4, zero, 32
bne a3, a4, .LBB6_56
# %bb.31: # %assert_end34
lw a4, 16(a7)
addi a3, zero, 14
bne a4, a3, .LBB6_57
# %bb.32: # %assert_end36
lw a4, 24(a7)
bne a4, a3, .LBB6_58
# %bb.33: # %assert_end38
ld a3, 40(a2)
bnez a3, .LBB6_59
# %bb.34: # %assert_end40
lw a3, 8(a2)
addi s0, zero, 1
bne a3, s0, .LBB6_60
# %bb.35: # %assert_end42
lw a2, 12(a2)
sext.w a3, a6
bne a3, a2, .LBB6_62
# %bb.36: # %assert_end44
call fuse_max_pool2d_compute_
mv a0, zero
j .LBB6_41
.LBB6_37: # %assert_fail7
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.63)
addi a0, a0, %lo(.L.str.63)
j .LBB6_39
.LBB6_38: # %assert_fail9
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.64)
addi a0, a0, %lo(.L.str.64)
.LBB6_39: # %assert_fail
jalr a1
addi a0, zero, 1
slli a0, a0, 32
.LBB6_40: # %assert_fail15
addi a0, a0, -1
.LBB6_41: # %assert_fail15
ld s0, 0(sp)
ld ra, 8(sp)
.cfi_restore ra
.cfi_restore s0
addi sp, sp, 16
.cfi_def_cfa_offset 0
ret
.LBB6_42: # %assert_fail
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.60)
addi a0, a0, %lo(.L.str.60)
j .LBB6_39
.LBB6_43: # %assert_fail1
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.61)
addi a0, a0, %lo(.L.str.61)
j .LBB6_39
.LBB6_44: # %assert_fail5
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.62)
addi a0, a0, %lo(.L.str.62)
j .LBB6_39
.LBB6_45: # %assert_fail11
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.5)
addi a0, a0, %lo(.L.str.5)
j .LBB6_39
.LBB6_46: # %assert_fail13
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.29)
addi a0, a0, %lo(.L.str.29)
j .LBB6_39
.LBB6_47: # %assert_fail15
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.7)
addi a0, a0, %lo(.L.str.7)
j .LBB6_61
.LBB6_48: # %assert_fail17
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.8)
addi a0, a0, %lo(.L.str.8)
j .LBB6_61
.LBB6_49: # %assert_fail19
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.65)
addi a0, a0, %lo(.L.str.65)
j .LBB6_39
.LBB6_50: # %assert_fail21
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.31)
addi a0, a0, %lo(.L.str.31)
j .LBB6_39
.LBB6_51: # %assert_fail23
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.32)
addi a0, a0, %lo(.L.str.32)
j .LBB6_39
.LBB6_52: # %assert_fail25
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.10)
addi a0, a0, %lo(.L.str.10)
j .LBB6_39
.LBB6_53: # %assert_fail27
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.11)
addi a0, a0, %lo(.L.str.11)
j .LBB6_39
.LBB6_54: # %assert_fail29
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.12)
addi a0, a0, %lo(.L.str.12)
j .LBB6_61
.LBB6_55: # %assert_fail31
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.13)
addi a0, a0, %lo(.L.str.13)
j .LBB6_61
.LBB6_56: # %assert_fail33
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.66)
addi a0, a0, %lo(.L.str.66)
j .LBB6_39
.LBB6_57: # %assert_fail35
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.67)
addi a0, a0, %lo(.L.str.67)
j .LBB6_39
.LBB6_58: # %assert_fail37
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.68)
addi a0, a0, %lo(.L.str.68)
j .LBB6_39
.LBB6_59: # %assert_fail39
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.17)
addi a0, a0, %lo(.L.str.17)
j .LBB6_39
.LBB6_60: # %assert_fail41
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.18)
addi a0, a0, %lo(.L.str.18)
.LBB6_61: # %assert_fail15
jalr a1
slli a0, s0, 32
j .LBB6_40
.LBB6_62: # %assert_fail43
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.19)
addi a0, a0, %lo(.L.str.19)
j .LBB6_39
.Lfunc_end6:
.size fuse_max_pool2d, .Lfunc_end6-fuse_max_pool2d
.cfi_endproc
# -- End function
# -----------------------------------------------------------------------
# fuse_max_pool2d_compute_ -- 2x2 / stride-2 maximum over 32 planes
#
# In:    a0 = destination, 32 planes of 14x14 floats written contiguously
#        a1 = source, 32 planes of 28x28 floats read contiguously
# Out:   nothing is returned; a0 and a1 are advanced past their buffers
# Clobb: t0-t4, ft0-ft2 (leaf function, no stack use)
#
# Each output element starts from the floor value -3.40282347E+38 and is
# replaced by a window element unless that element compares strictly less
# than the running value, so a NaN operand always replaces the running value.
# -----------------------------------------------------------------------
	.section	.sdata,"aw",@progbits
	.p2align	2                       # -- Begin function fuse_max_pool2d_compute_
.LCPI7_0:
	.word	4286578687              # float -3.40282347E+38
	.text
	.globl	fuse_max_pool2d_compute_
	.p2align	2
	.type	fuse_max_pool2d_compute_,@function
fuse_max_pool2d_compute_:               # @fuse_max_pool2d_compute_
	lui	t0, %hi(.LCPI7_0)
	flw	ft0, %lo(.LCPI7_0)(t0)  # ft0 = floor value for every window
	li	t1, 32                  # planes left
.Lmaxpool_plane:
	li	t2, 14                  # output rows left in this plane
.Lmaxpool_row:
	addi	t3, a0, 56              # t3 = one past the 14 floats of this output row
.Lmaxpool_pixel:
	# Window element (0,0) against the floor value.
	flw	ft1, 0(a1)
	flt.s	t4, ft1, ft0
	beqz	t4, 1f                  # not below the floor: keep the element
	fmv.s	ft1, ft0
1:
	# Window element (0,1).
	flw	ft2, 4(a1)
	flt.s	t4, ft2, ft1
	bnez	t4, 2f
	fmv.s	ft1, ft2
2:
	# Window element (1,0): one 28-float source row (112 bytes) further on.
	flw	ft2, 112(a1)
	flt.s	t4, ft2, ft1
	bnez	t4, 3f
	fmv.s	ft1, ft2
3:
	# Window element (1,1).
	flw	ft2, 116(a1)
	flt.s	t4, ft2, ft1
	bnez	t4, 4f
	fmv.s	ft1, ft2
4:
	fsw	ft1, 0(a0)
	addi	a0, a0, 4               # next output float
	addi	a1, a1, 8               # next window: two source columns on
	bne	a0, t3, .Lmaxpool_pixel

	# 14 windows consumed exactly one source row; skip the second row of
	# the pair so a1 lands on the next row pair (224 bytes per output row).
	addi	a1, a1, 112
	addi	t2, t2, -1
	bnez	t2, .Lmaxpool_row

	# 14 row pairs cover a whole 28x28 plane (3136 bytes) and 14 output rows
	# cover a whole 14x14 plane (784 bytes), so both pointers are already
	# positioned on the next plane.
	addi	t1, t1, -1
	bnez	t1, .Lmaxpool_plane
	ret
.Lfunc_end7:
	.size	fuse_max_pool2d_compute_, .Lfunc_end7-fuse_max_pool2d_compute_
                                        # -- End function
# ---------------------------------------------------------------------------
# fuse_conv2d_1 -- argument-checking entry point for fuse_conv2d_1_compute_
#
# ABI:  RISC-V RV64 integer calling convention.
# In:   a0 = array of four 8-byte values, each used as a pointer to a
#            tensor descriptor (arg0..arg3)
#       a1 = array of four 32-bit type codes, one per argument
#       a2 = argument count; only the low 32 bits are examined, must be 4
# Out:  a0 = 0  after all checks pass and fuse_conv2d_1_compute_ returns
#       a0 = -1 after a failed check; the function pointer stored in
#               __TVMAPISetLastError has then been called with a0 = address
#               of a message string (.L.str.N, defined elsewhere in the file)
#
# The failure value is a properly sign-extended -1. Earlier revisions of this
# code returned 0x00000000FFFFFFFF, which has the same low 32 bits but is not
# a valid register image of a 32-bit -1 under the RV64 calling convention.
#
# Descriptor fields read here, by byte offset. The layout looks like DLPack's
# DLTensor -- NOTE(review): field names are presumed, confirm against the
# runtime headers.
#     0  data pointer         8  device type (i32)   12  device id (i32)
#    16  ndim (i32)          20  dtype code (u8)     21  dtype bits (u8)
#    22  dtype lanes (u16)   24  shape pointer       32  strides pointer or 0
#    40  byte offset
#
# Checks performed (shape/stride elements are 8 bytes apart and only their
# low 32 bits are compared; stride checks are skipped when the pointer is 0):
#   type codes  each of the four must be one of 3, 4, 7, 13
#   arg0        ndim 4, shape 1,32,14,14,  strides 6272,196,14,1
#   arg1        ndim 4, shape 64,32,5,5,   strides 800,25,5,1
#   arg2        ndim 1, shape 64,          strides 1
#   arg3        ndim 4, shape 1,64,14,14,  strides 12544,196,14,1
#   every arg   dtype code 2 / bits 32 / lanes 1, field +40 == 0,
#               field +8 == 1, field +12 equal to arg0's field +12
#
# On success the compute routine is called with
#   a0 = arg0 data, a1 = arg1 data, a2 = arg3 data, a3 = arg2 data.
# ---------------------------------------------------------------------------
.globl fuse_conv2d_1 # -- Begin function fuse_conv2d_1
.p2align 2
.type fuse_conv2d_1,@function
fuse_conv2d_1: # @fuse_conv2d_1
.cfi_startproc
# %bb.0: # %entry
addi sp, sp, -64
.cfi_def_cfa_offset 64
sd ra, 56(sp)
sd s0, 48(sp)
sd s1, 40(sp)
sd s2, 32(sp)
sd s3, 24(sp)
sd s4, 16(sp)
sd s5, 8(sp)
.cfi_offset ra, -8
.cfi_offset s0, -16
.cfi_offset s1, -24
.cfi_offset s2, -32
.cfi_offset s3, -40
.cfi_offset s4, -48
.cfi_offset s5, -56
# Argument count: zero-extend the low word and require exactly 4.
slli a2, a2, 32
srli a2, a2, 32
addi a3, zero, 4
bne a2, a3, .LBB8_74
# %bb.1: # %assert_end
# Type codes -> s4, s3, t6, t5 (arg0..arg3); descriptors -> s5, t3, a7, a6.
lwu t5, 12(a1)
ld a6, 24(a0)
lwu t6, 8(a1)
ld a7, 16(a0)
lwu s3, 4(a1)
ld t3, 8(a0)
lwu s4, 0(a1)
ld s5, 0(a0)
# arg0: t4 = shape pointer, a0 = data pointer (kept for the compute call),
# a1 = strides pointer.
ld t4, 24(s5)
ld a0, 0(s5)
ld a1, 32(s5)
beqz a1, .LBB8_6
# %bb.2: # %if_then
# arg0 strides must be 6272 (= 2*4096 - 1920), 196, 14, 1.
lui a2, 2
addiw a2, a2, -1920
lw a3, 0(a1)
bne a3, a2, .LBB8_75
# %bb.3: # %if_then
ld a2, 8(a1)
slli a2, a2, 32
srli a2, a2, 32
addi a3, zero, 196
bne a2, a3, .LBB8_75
# %bb.4: # %if_then
ld a2, 16(a1)
slli a2, a2, 32
srli a2, a2, 32
addi a3, zero, 14
bne a2, a3, .LBB8_75
# %bb.5: # %if_then
ld a1, 24(a1)
slli a1, a1, 32
srli a1, a1, 32
addi a2, zero, 1
bne a1, a2, .LBB8_75
.LBB8_6: # %if_end
# arg1: t2 = shape pointer, a1 = data pointer (kept for the compute call).
# Also fetch arg0's fields +12 (a4) and +8 (s2) for the later device checks.
ld t2, 24(t3)
ld a1, 0(t3)
lwu a4, 12(s5)
lwu s2, 8(s5)
ld a2, 32(t3)
beqz a2, .LBB8_11
# %bb.7: # %if_then3
# arg1 strides must be 800, 25, 5, 1.
lw a3, 0(a2)
addi s0, zero, 800
bne a3, s0, .LBB8_76
# %bb.8: # %if_then3
ld a3, 8(a2)
slli a3, a3, 32
srli a3, a3, 32
addi s0, zero, 25
bne a3, s0, .LBB8_76
# %bb.9: # %if_then3
ld a3, 16(a2)
slli a3, a3, 32
srli a3, a3, 32
addi s0, zero, 5
bne a3, s0, .LBB8_76
# %bb.10: # %if_then3
ld a2, 24(a2)
slli a2, a2, 32
srli a2, a2, 32
addi a3, zero, 1
bne a2, a3, .LBB8_76
.LBB8_11: # %if_end4
# arg2: t1 = shape pointer, a3 = data pointer (kept for the compute call).
ld t1, 24(a7)
ld a3, 0(a7)
ld a2, 32(a7)
beqz a2, .LBB8_13
# %bb.12: # %if_then7
# arg2 has a single stride, which must be 1.
lw a2, 0(a2)
addi s0, zero, 1
bne a2, s0, .LBB8_77
.LBB8_13: # %if_end8
# arg3: t0 = shape pointer, a2 = data pointer (kept for the compute call).
ld t0, 24(a6)
ld a2, 0(a6)
ld s0, 32(a6)
beqz s0, .LBB8_18
# %bb.14: # %if_then11
# arg3 strides must be 12544 (= 3*4096 + 256), 196, 14, 1.
lui s1, 3
addiw s1, s1, 256
lw a5, 0(s0)
bne a5, s1, .LBB8_78
# %bb.15: # %if_then11
ld a5, 8(s0)
slli a5, a5, 32
srli a5, a5, 32
addi s1, zero, 196
bne a5, s1, .LBB8_78
# %bb.16: # %if_then11
ld a5, 16(s0)
slli a5, a5, 32
srli a5, a5, 32
addi s1, zero, 14
bne a5, s1, .LBB8_78
# %bb.17: # %if_then11
ld a5, 24(s0)
slli a5, a5, 32
srli a5, a5, 32
addi s0, zero, 1
bne a5, s0, .LBB8_78
.LBB8_18: # %if_end12
# Type-code checks. A code is accepted when it is <= 13 and its bit is set in
# the mask 2*4096 + 152 = 0x2098, i.e. when it is 3, 4, 7 or 13.
addi a5, zero, 13
bltu a5, s4, .LBB8_67
# %bb.19: # %if_end12
addi a5, zero, 1
sll a5, a5, s4
lui s0, 2
addiw s0, s0, 152
and a5, a5, s0
beqz a5, .LBB8_67
# %bb.20: # %assert_end16
addi a5, zero, 13
bltu a5, s3, .LBB8_68
# %bb.21: # %assert_end16
addi a5, zero, 1
sll a5, a5, s3
lui s0, 2
addiw s0, s0, 152
and a5, a5, s0
beqz a5, .LBB8_68
# %bb.22: # %assert_end18
addi a5, zero, 13
bltu a5, t6, .LBB8_69
# %bb.23: # %assert_end18
addi a5, zero, 1
sll a5, a5, t6
lui s1, 2
addiw s1, s1, 152
and a5, a5, s1
beqz a5, .LBB8_69
# %bb.24: # %assert_end20
addi a5, zero, 13
bltu a5, t5, .LBB8_70
# %bb.25: # %assert_end20
addi s1, zero, 1
sll a5, s1, t5
lui s0, 2
addiw s0, s0, 152
and a5, a5, s0
beqz a5, .LBB8_70
# %bb.26: # %assert_end22
# arg0 field +8 (loaded into s2 above) must be 1; s1 still holds 1.
bne s2, s1, .LBB8_79
# %bb.27: # %assert_end24
# arg0: ndim 4, lanes 1, bits 32, code 2.
lw a5, 16(s5)
addi s1, zero, 4
bne a5, s1, .LBB8_80
# %bb.28: # %assert_end26
lhu a5, 22(s5)
addi s0, zero, 1
bne a5, s0, .LBB8_81
# %bb.29: # %assert_end26
lbu a5, 21(s5)
addi s1, zero, 32
bne a5, s1, .LBB8_81
# %bb.30: # %assert_end26
lbu a5, 20(s5)
addi s1, zero, 2
bne a5, s1, .LBB8_81
# %bb.31: # %assert_end28
# arg0 shape: 1, 32, 14, 14.
lw a5, 0(t4)
addi s0, zero, 1
bne a5, s0, .LBB8_82
# %bb.32: # %assert_end30
lw a5, 8(t4)
addi s1, zero, 32
bne a5, s1, .LBB8_83
# %bb.33: # %assert_end32
lw a5, 16(t4)
addi s1, zero, 14
bne a5, s1, .LBB8_84
# %bb.34: # %assert_end34
lw a5, 24(t4)
bne a5, s1, .LBB8_85
# %bb.35: # %assert_end36
# arg0 field +40 must be zero.
ld a5, 40(s5)
bnez a5, .LBB8_86
# %bb.36: # %assert_end38
# arg1: ndim 4, lanes 1, bits 32, code 2.
lw a5, 16(t3)
addi s1, zero, 4
bne a5, s1, .LBB8_87
# %bb.37: # %assert_end40
lhu a5, 22(t3)
addi s0, zero, 1
bne a5, s0, .LBB8_88
# %bb.38: # %assert_end40
lbu a5, 21(t3)
addi s1, zero, 32
bne a5, s1, .LBB8_88
# %bb.39: # %assert_end40
lbu a5, 20(t3)
addi s1, zero, 2
bne a5, s1, .LBB8_88
# %bb.40: # %assert_end42
# arg1 shape: 64, 32, 5, 5.
lw a5, 0(t2)
addi s1, zero, 64
bne a5, s1, .LBB8_89
# %bb.41: # %assert_end44
lw a5, 8(t2)
addi s1, zero, 32
bne a5, s1, .LBB8_90
# %bb.42: # %assert_end46
lw s1, 16(t2)
addi a5, zero, 5
bne s1, a5, .LBB8_91
# %bb.43: # %assert_end48
lw s1, 24(t2)
bne s1, a5, .LBB8_92
# %bb.44: # %assert_end50
# arg1: field +40 zero, field +8 == 1, field +12 equal to arg0's.
ld a5, 40(t3)
bnez a5, .LBB8_93
# %bb.45: # %assert_end52
lw a5, 8(t3)
addi s0, zero, 1
bne a5, s0, .LBB8_94
# %bb.46: # %assert_end54
lw s1, 12(t3)
# a5 = sign-extended arg0 field +12; reused for the arg2 and arg3 comparisons.
sext.w a5, a4
bne a5, s1, .LBB8_95
# %bb.47: # %assert_end56
# arg2: ndim 1, lanes 1, bits 32, code 2.
lw s1, 16(a7)
addi s0, zero, 1
bne s1, s0, .LBB8_96
# %bb.48: # %assert_end58
lhu s1, 22(a7)
bne s1, s0, .LBB8_97
# %bb.49: # %assert_end58
lbu s1, 21(a7)
addi s0, zero, 32
bne s1, s0, .LBB8_97
# %bb.50: # %assert_end58
lbu s1, 20(a7)
addi s0, zero, 2
bne s1, s0, .LBB8_97
# %bb.51: # %assert_end60
# arg2 shape: 64.
lw s1, 0(t1)
addi s0, zero, 64
bne s1, s0, .LBB8_98
# %bb.52: # %assert_end62
# arg2: field +40 zero, field +8 == 1, field +12 equal to arg0's.
ld s1, 40(a7)
bnez s1, .LBB8_99
# %bb.53: # %assert_end64
lw s1, 8(a7)
addi s0, zero, 1
bne s1, s0, .LBB8_100
# %bb.54: # %assert_end66
lw s1, 12(a7)
bne a5, s1, .LBB8_101
# %bb.55: # %assert_end68
# arg3: ndim 4, lanes 1, bits 32, code 2.
lw s1, 16(a6)
addi s0, zero, 4
bne s1, s0, .LBB8_102
# %bb.56: # %assert_end70
lhu s1, 22(a6)
addi s2, zero, 1
bne s1, s2, .LBB8_103
# %bb.57: # %assert_end70
lbu s1, 21(a6)
addi s0, zero, 32
bne s1, s0, .LBB8_103
# %bb.58: # %assert_end70
lbu s1, 20(a6)
addi s0, zero, 2
bne s1, s0, .LBB8_103
# %bb.59: # %assert_end72
# arg3 shape: 1, 64, 14, 14.
lw s1, 0(t0)
addi s0, zero, 1
bne s1, s0, .LBB8_104
# %bb.60: # %assert_end74
lw s1, 8(t0)
addi s0, zero, 64
bne s1, s0, .LBB8_105
# %bb.61: # %assert_end76
lw s0, 16(t0)
addi s1, zero, 14
bne s0, s1, .LBB8_106
# %bb.62: # %assert_end78
lw s0, 24(t0)
bne s0, s1, .LBB8_107
# %bb.63: # %assert_end80
# arg3: field +40 zero, field +8 == 1, field +12 equal to arg0's.
ld s1, 40(a6)
bnez s1, .LBB8_108
# %bb.64: # %assert_end82
lw s1, 8(a6)
addi s0, zero, 1
bne s1, s0, .LBB8_109
# %bb.65: # %assert_end84
lw s1, 12(a6)
bne a5, s1, .LBB8_111
# %bb.66: # %assert_end86
# All checks passed: a0..a3 still hold the four data pointers loaded above.
call fuse_conv2d_1_compute_
mv a0, zero
j .LBB8_73
# ---------------------------------------------------------------------------
# Failure stubs. Each one loads the address of its message string into a0 and
# transfers to the shared tail at .LBB8_71, which reports it and returns -1.
# ---------------------------------------------------------------------------
.LBB8_67: # %assert_fail15
lui a0, %hi(.L.str.73)
addi a0, a0, %lo(.L.str.73)
j .LBB8_71
.LBB8_68: # %assert_fail17
lui a0, %hi(.L.str.74)
addi a0, a0, %lo(.L.str.74)
j .LBB8_71
.LBB8_69: # %assert_fail19
lui a0, %hi(.L.str.75)
addi a0, a0, %lo(.L.str.75)
j .LBB8_71
.LBB8_70: # %assert_fail21
lui a0, %hi(.L.str.76)
addi a0, a0, %lo(.L.str.76)
# Falls through into the shared failure tail.
.LBB8_71: # %assert_fail
# Shared failure tail: a0 = message address. Load the handler pointer stored
# in __TVMAPISetLastError, call it, then return a sign-extended -1.
lui a1, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a1)
jalr a1
addi a0, zero, -1
.LBB8_73: # %return
# Common epilogue for the success and failure paths; a0 holds the result.
ld s5, 8(sp)
ld s4, 16(sp)
ld s3, 24(sp)
ld s2, 32(sp)
ld s1, 40(sp)
ld s0, 48(sp)
ld ra, 56(sp)
.cfi_restore ra
.cfi_restore s0
.cfi_restore s1
.cfi_restore s2
.cfi_restore s3
.cfi_restore s4
.cfi_restore s5
addi sp, sp, 64
.cfi_def_cfa_offset 0
ret
.LBB8_74: # %assert_fail
lui a0, %hi(.L.str.69)
addi a0, a0, %lo(.L.str.69)
j .LBB8_71
.LBB8_75: # %assert_fail1
lui a0, %hi(.L.str.70)
addi a0, a0, %lo(.L.str.70)
j .LBB8_71
.LBB8_76: # %assert_fail5
lui a0, %hi(.L.str.71)
addi a0, a0, %lo(.L.str.71)
j .LBB8_71
.LBB8_77: # %assert_fail9
lui a0, %hi(.L.str.23)
addi a0, a0, %lo(.L.str.23)
j .LBB8_71
.LBB8_78: # %assert_fail13
lui a0, %hi(.L.str.72)
addi a0, a0, %lo(.L.str.72)
j .LBB8_71
.LBB8_79: # %assert_fail23
lui a0, %hi(.L.str.5)
addi a0, a0, %lo(.L.str.5)
j .LBB8_71
.LBB8_80: # %assert_fail25
lui a0, %hi(.L.str.29)
addi a0, a0, %lo(.L.str.29)
j .LBB8_71
.LBB8_81: # %assert_fail27
lui a0, %hi(.L.str.7)
addi a0, a0, %lo(.L.str.7)
j .LBB8_71
.LBB8_82: # %assert_fail29
lui a0, %hi(.L.str.8)
addi a0, a0, %lo(.L.str.8)
j .LBB8_71
.LBB8_83: # %assert_fail31
lui a0, %hi(.L.str.65)
addi a0, a0, %lo(.L.str.65)
j .LBB8_71
.LBB8_84: # %assert_fail33
lui a0, %hi(.L.str.77)
addi a0, a0, %lo(.L.str.77)
j .LBB8_71
.LBB8_85: # %assert_fail35
lui a0, %hi(.L.str.78)
addi a0, a0, %lo(.L.str.78)
j .LBB8_71
.LBB8_86: # %assert_fail37
lui a0, %hi(.L.str.10)
addi a0, a0, %lo(.L.str.10)
j .LBB8_71
.LBB8_87: # %assert_fail39
lui a0, %hi(.L.str.11)
addi a0, a0, %lo(.L.str.11)
j .LBB8_71
.LBB8_88: # %assert_fail41
lui a0, %hi(.L.str.12)
addi a0, a0, %lo(.L.str.12)
j .LBB8_71
.LBB8_89: # %assert_fail43
lui a0, %hi(.L.str.79)
addi a0, a0, %lo(.L.str.79)
j .LBB8_71
.LBB8_90: # %assert_fail45
lui a0, %hi(.L.str.66)
addi a0, a0, %lo(.L.str.66)
j .LBB8_71
.LBB8_91: # %assert_fail47
lui a0, %hi(.L.str.34)
addi a0, a0, %lo(.L.str.34)
j .LBB8_71
.LBB8_92: # %assert_fail49
lui a0, %hi(.L.str.35)
addi a0, a0, %lo(.L.str.35)
j .LBB8_71
.LBB8_93: # %assert_fail51
lui a0, %hi(.L.str.17)
addi a0, a0, %lo(.L.str.17)
j .LBB8_71
.LBB8_94: # %assert_fail53
lui a0, %hi(.L.str.18)
addi a0, a0, %lo(.L.str.18)
j .LBB8_71
.LBB8_95: # %assert_fail55
lui a0, %hi(.L.str.19)
addi a0, a0, %lo(.L.str.19)
j .LBB8_71
.LBB8_96: # %assert_fail57
lui a0, %hi(.L.str.36)
addi a0, a0, %lo(.L.str.36)
j .LBB8_71
.LBB8_97: # %assert_fail59
lui a0, %hi(.L.str.37)
addi a0, a0, %lo(.L.str.37)
j .LBB8_71
.LBB8_98: # %assert_fail61
lui a0, %hi(.L.str.80)
addi a0, a0, %lo(.L.str.80)
j .LBB8_71
.LBB8_99: # %assert_fail63
lui a0, %hi(.L.str.39)
addi a0, a0, %lo(.L.str.39)
j .LBB8_71
.LBB8_100: # %assert_fail65
lui a0, %hi(.L.str.40)
addi a0, a0, %lo(.L.str.40)
j .LBB8_71
.LBB8_101: # %assert_fail67
lui a0, %hi(.L.str.41)
addi a0, a0, %lo(.L.str.41)
j .LBB8_71
.LBB8_102: # %assert_fail69
lui a0, %hi(.L.str.42)
addi a0, a0, %lo(.L.str.42)
j .LBB8_71
.LBB8_103: # %assert_fail71
lui a0, %hi(.L.str.43)
addi a0, a0, %lo(.L.str.43)
j .LBB8_71
.LBB8_104: # %assert_fail73
lui a0, %hi(.L.str.44)
addi a0, a0, %lo(.L.str.44)
j .LBB8_71
.LBB8_105: # %assert_fail75
lui a0, %hi(.L.str.81)
addi a0, a0, %lo(.L.str.81)
j .LBB8_71
.LBB8_106: # %assert_fail77
lui a0, %hi(.L.str.82)
addi a0, a0, %lo(.L.str.82)
j .LBB8_71
.LBB8_107: # %assert_fail79
lui a0, %hi(.L.str.83)
addi a0, a0, %lo(.L.str.83)
j .LBB8_71
.LBB8_108: # %assert_fail81
lui a0, %hi(.L.str.48)
addi a0, a0, %lo(.L.str.48)
j .LBB8_71
.LBB8_109: # %assert_fail83
lui a0, %hi(.L.str.49)
addi a0, a0, %lo(.L.str.49)
j .LBB8_71
.LBB8_111: # %assert_fail85
lui a0, %hi(.L.str.50)
addi a0, a0, %lo(.L.str.50)
j .LBB8_71
.Lfunc_end8:
.size fuse_conv2d_1, .Lfunc_end8-fuse_conv2d_1
.cfi_endproc
# -- End function
.globl fuse_conv2d_1_compute_ # -- Begin function fuse_conv2d_1_compute_
.p2align 2
.type fuse_conv2d_1_compute_,@function
fuse_conv2d_1_compute_: # @fuse_conv2d_1_compute_
.cfi_startproc
# %bb.0: # %entry
addi sp, sp, -320
.cfi_def_cfa_offset 320
sd ra, 312(sp)
sd s0, 304(sp)
sd s1, 296(sp)
sd s2, 288(sp)
sd s3, 280(sp)
sd s4, 272(sp)
sd s5, 264(sp)
sd s6, 256(sp)
sd s7, 248(sp)
sd s8, 240(sp)
sd s9, 232(sp)
sd s10, 224(sp)
sd s11, 216(sp)
.cfi_offset ra, -8
.cfi_offset s0, -16
.cfi_offset s1, -24
.cfi_offset s2, -32
.cfi_offset s3, -40
.cfi_offset s4, -48
.cfi_offset s5, -56
.cfi_offset s6, -64
.cfi_offset s7, -72
.cfi_offset s8, -80
.cfi_offset s9, -88
.cfi_offset s10, -96
.cfi_offset s11, -104
sd a3, 32(sp)
sd a2, 24(sp)
mv s11, a1
mv s6, a0
lui a0, 50
call _Znam
mv s0, a0
lui a0, 10
addiw a0, a0, 512
call _Znam
mv s8, a0
lui a0, 12
addiw a0, a0, 1024
call _Znam
mv s9, a0
addi s2, s6, -112
sd s0, 56(sp)
addi s4, s0, 36
addi s5, zero, 14
addi s6, zero, 18
addi s7, zero, 32
mv s3, zero
.LBB9_1: # %for_begin5.preheader
# =>This Inner Loop Header: Depth=1
mv s0, s2
mv s1, s4
mv s10, zero
addiw a0, s10, -2
bltu a0, s5, .LBB9_5
.LBB9_2: # %for_body9.preheader
# in Loop: Header=BB9_1 Depth=1
addi a0, s1, -36
mv a1, zero
addi a2, zero, 72
call memset
.LBB9_3: # %for_end10
# in Loop: Header=BB9_1 Depth=1
addi s0, s0, 56
addi s1, s1, 72
addi s10, s10, 1
beq s10, s6, .LBB9_6
# %bb.4: # %for_begin8.preheader
# in Loop: Header=BB9_1 Depth=1
addiw a0, s10, -2
bgeu a0, s5, .LBB9_2
.LBB9_5: # %if_end12.us.17
# in Loop: Header=BB9_1 Depth=1
sw zero, -32(s1)
sw zero, -36(s1)
flw ft0, 0(s0)
fsw ft0, -28(s1)
flw ft0, 4(s0)
fsw ft0, -24(s1)
flw ft0, 8(s0)
fsw ft0, -20(s1)
flw ft0, 12(s0)
fsw ft0, -16(s1)
flw ft0, 16(s0)
fsw ft0, -12(s1)
flw ft0, 20(s0)
fsw ft0, -8(s1)
flw ft0, 24(s0)
fsw ft0, -4(s1)
flw ft0, 28(s0)
fsw ft0, 0(s1)
flw ft0, 32(s0)
fsw ft0, 4(s1)
flw ft0, 36(s0)
fsw ft0, 8(s1)
flw ft0, 40(s0)
fsw ft0, 12(s1)
flw ft0, 44(s0)
fsw ft0, 16(s1)
flw ft0, 48(s0)
fsw ft0, 20(s1)
flw ft0, 52(s0)
sw zero, 32(s1)
sw zero, 28(s1)
fsw ft0, 24(s1)
j .LBB9_3
.LBB9_6: # %for_end7
# in Loop: Header=BB9_1 Depth=1
addi s2, s2, 784
addi s4, s4, 1296
addi s3, s3, 1
bne s3, s7, .LBB9_1
# %bb.7: # %for_begin13.preheader
ld a0, 56(sp)
addi t0, a0, 36
addi a1, zero, 644
addi t3, zero, 18
lui a0, 3
addiw a7, a0, -1920
addi a6, zero, 4
mv t2, zero
mv t1, zero
.LBB9_8: # %for_begin16.preheader
# =>This Loop Header: Depth=1
# Child Loop BB9_9 Depth 2
# Child Loop BB9_10 Depth 3
mv a4, t0
mv a5, t2
mv a3, zero
.LBB9_9: # %for_begin19.preheader
# Parent Loop BB9_8 Depth=1
# => This Loop Header: Depth=2
# Child Loop BB9_10 Depth 3
add s0, s8, a5
addi s1, zero, 68
mv a0, a4
.LBB9_10: # %for_begin22.preheader
# Parent Loop BB9_8 Depth=1
# Parent Loop BB9_9 Depth=2
# => This Inner Loop Header: Depth=3
add a2, s0, s1
flw ft0, -36(a0)
fsw ft0, -68(a2)
flw ft0, -32(a0)
fsw ft0, -64(a2)
flw ft0, -28(a0)
fsw ft0, -60(a2)
flw ft0, -24(a0)
fsw ft0, -56(a2)
flw ft0, -20(a0)
fsw ft0, -52(a2)
flw ft0, -16(a0)
fsw ft0, -48(a2)
flw ft0, -12(a0)
fsw ft0, -44(a2)
flw ft0, -8(a0)
fsw ft0, -40(a2)
flw ft0, -4(a0)
fsw ft0, -36(a2)
flw ft0, 0(a0)
fsw ft0, -32(a2)
flw ft0, 4(a0)
fsw ft0, -28(a2)
flw ft0, 8(a0)
fsw ft0, -24(a2)
flw ft0, 12(a0)
fsw ft0, -20(a2)
flw ft0, 16(a0)
fsw ft0, -16(a2)
flw ft0, 20(a0)
fsw ft0, -12(a2)
flw ft0, 24(a0)
fsw ft0, -8(a2)
flw ft0, 28(a0)
fsw ft0, -4(a2)
flw ft0, 32(a0)
fsw ft0, 0(a2)
addi a0, a0, 1296
addi s1, s1, 72
bne s1, a1, .LBB9_10
# %bb.11: # %for_end21
# in Loop: Header=BB9_9 Depth=2
addi a4, a4, 72
addi a5, a5, 576
addi a3, a3, 1
bne a3, t3, .LBB9_9
# %bb.12: # %for_end18
# in Loop: Header=BB9_8 Depth=1
add t0, t0, a7
add t2, t2, a7
addi t1, t1, 1
bne t1, a6, .LBB9_8
# %bb.13: # %for_begin25.preheader
lui a0, 1
addiw a0, a0, -896
lui a1, 3
addiw a6, a1, 512
add t0, s11, a0
lui a0, 5
addiw a7, a0, 1920
addiw a0, a0, -1280
lui a3, 4
addiw a3, a3, -384
lui a4, 2
addiw a5, a4, 1408
addiw a4, a4, -1792
sd a4, 120(sp)
add t1, s11, a4
add s2, s11, a5
add s4, s11, a6
add t5, s11, a3
add s1, s11, a0
add s6, s11, a7
ld a0, 56(sp)
addi t6, a0, 16
addi a4, zero, 800
addi a5, zero, 5
lui a0, 6
addiw a0, a0, 1024
sd a0, 16(sp)
mv a2, zero
.LBB9_14: # %for_begin28.preheader
# =>This Loop Header: Depth=1
# Child Loop BB9_15 Depth 2
# Child Loop BB9_16 Depth 3
# Child Loop BB9_17 Depth 4
# Child Loop BB9_18 Depth 5
sd a2, 8(sp)
sd t6, 40(sp)
sd s11, 112(sp)
mv s5, s11
sd t0, 104(sp)
sd t1, 96(sp)
sd s2, 88(sp)
sd s4, 80(sp)
sd t5, 72(sp)
sd s1, 64(sp)
mv a7, s1
sd s6, 48(sp)
mv a2, zero
.LBB9_15: # %for_begin31.preheader
# Parent Loop BB9_14 Depth=1
# => This Loop Header: Depth=2
# Child Loop BB9_16 Depth 3
# Child Loop BB9_17 Depth 4
# Child Loop BB9_18 Depth 5
sd a2, 128(sp)
sd t6, 200(sp)
sd s5, 192(sp)
sd t0, 184(sp)
sd t1, 176(sp)
sd s2, 168(sp)
sd s4, 160(sp)
sd t5, 152(sp)
sd a7, 144(sp)
sd s6, 136(sp)
mv s7, zero
.LBB9_16: # %for_begin34.preheader
# Parent Loop BB9_14 Depth=1
# Parent Loop BB9_15 Depth=2
# => This Loop Header: Depth=3
# Child Loop BB9_17 Depth 4
# Child Loop BB9_18 Depth 5
sd t6, 208(sp)
mv s11, s5
mv a2, t0
mv a1, t1
mv a3, s2
mv a0, s4
mv t2, t5
mv t3, a7
mv t4, s6
mv s1, zero
.LBB9_17: # %for_begin37.preheader
# Parent Loop BB9_14 Depth=1
# Parent Loop BB9_15 Depth=2
# Parent Loop BB9_16 Depth=3
# => This Loop Header: Depth=4
# Child Loop BB9_18 Depth 5
mv s10, t6
mv a6, zero
.LBB9_18: # %for_begin40.preheader
# Parent Loop BB9_14 Depth=1
# Parent Loop BB9_15 Depth=2
# Parent Loop BB9_16 Depth=3
# Parent Loop BB9_17 Depth=4
# => This Inner Loop Header: Depth=5
add s3, s11, a6
flw ft0, 0(s3)
fsw ft0, -16(s10)
add s0, a2, a6
flw ft0, 0(s0)
fsw ft0, -12(s10)
add s0, a1, a6
flw ft0, 0(s0)
fsw ft0, -8(s10)
add s0, a3, a6
flw ft0, 0(s0)
fsw ft0, -4(s10)
add s0, a0, a6
flw ft0, 0(s0)
fsw ft0, 0(s10)
add s0, t2, a6
flw ft0, 0(s0)
fsw ft0, 4(s10)
add s0, t3, a6
flw ft0, 0(s0)
fsw ft0, 8(s10)
add s0, t4, a6
flw ft0, 0(s0)
fsw ft0, 12(s10)
addi s10, s10, 32
addi a6, a6, 100
bne a6, a4, .LBB9_18
# %bb.19: # %for_end39
# in Loop: Header=BB9_17 Depth=4
addi t6, t6, 256
addi s11, s11, 4
addi a2, a2, 4
addi a1, a1, 4
addi a3, a3, 4
addi a0, a0, 4
addi t2, t2, 4
addi t3, t3, 4
addi t4, t4, 4
addi s1, s1, 1
bne s1, a5, .LBB9_17
# %bb.20: # %for_end36
# in Loop: Header=BB9_16 Depth=3
ld t6, 208(sp)
addi t6, t6, 1280
addi s5, s5, 20
addi t0, t0, 20
addi t1, t1, 20
addi s2, s2, 20
addi s4, s4, 20
addi t5, t5, 20
addi a7, a7, 20
addi s6, s6, 20
addi s7, s7, 1
bne s7, a5, .LBB9_16
# %bb.21: # %for_end33
# in Loop: Header=BB9_15 Depth=2
ld a0, 120(sp)
ld t6, 200(sp)
add t6, t6, a0
ld s5, 192(sp)
addi s5, s5, 800
ld t0, 184(sp)
addi t0, t0, 800
ld t1, 176(sp)
addi t1, t1, 800
ld s2, 168(sp)
addi s2, s2, 800
ld s4, 160(sp)
addi s4, s4, 800
ld t5, 152(sp)
addi t5, t5, 800
ld a7, 144(sp)
addi a7, a7, 800
ld s6, 136(sp)
addi s6, s6, 800
ld a2, 128(sp)
addi a2, a2, 1
addi a0, zero, 4
bne a2, a0, .LBB9_15
# %bb.22: # %for_end30
# in Loop: Header=BB9_14 Depth=1
ld t6, 40(sp)
ld a0, 16(sp)
add t6, t6, a0
ld s11, 112(sp)
add s11, s11, a0
ld t0, 104(sp)
add t0, t0, a0
ld t1, 96(sp)
add t1, t1, a0
ld s2, 88(sp)
add s2, s2, a0
ld s4, 80(sp)
add s4, s4, a0
ld t5, 72(sp)
add t5, t5, a0
ld s1, 64(sp)
add s1, s1, a0
ld s6, 48(sp)
add s6, s6, a0
ld a2, 8(sp)
addi a2, a2, 1
addi a0, zero, 8
bne a2, a0, .LBB9_14
# %bb.23: # %for_begin43.preheader
lui a0, 131072
addiw a0, a0, -1
sd a0, 48(sp)
addi t6, zero, 14
addi a3, zero, 112
addi s2, zero, 18
lui a5, 1
mv a2, zero
.LBB9_24: # %for_begin46.preheader
# =>This Loop Header: Depth=1
# Child Loop BB9_25 Depth 2
# Child Loop BB9_27 Depth 2
# Child Loop BB9_28 Depth 3
# Child Loop BB9_29 Depth 4
srli a0, a2, 3
ld a1, 48(sp)
and t4, a0, a1
sd a2, 16(sp)
andi s11, a2, 7
mul s4, t4, t6
mv a1, zero
.LBB9_25: # %for_begin49.preheader
# Parent Loop BB9_24 Depth=1
# => This Inner Loop Header: Depth=2
add a2, a1, s4
mul a2, a2, a3
or a2, a2, s11
sext.w a4, a2
slli a4, a4, 2
add a4, s9, a4
sw zero, 0(a4)
ori a4, a2, 8
sext.w a4, a4
slli a4, a4, 2
add a4, s9, a4
sw zero, 0(a4)
addiw a4, a2, 16
slli a4, a4, 2
add a4, s9, a4
sw zero, 0(a4)
addiw a4, a2, 24
slli a4, a4, 2
add a4, s9, a4
sw zero, 0(a4)
addiw a4, a2, 32
slli a4, a4, 2
add a4, s9, a4
sw zero, 0(a4)
addiw a4, a2, 40
slli a4, a4, 2
add a4, s9, a4
sw zero, 0(a4)
addiw a4, a2, 64
slli t5, a4, 2
addiw s1, a2, 72
slli s3, s1, 2
addiw s0, a2, 80
slli s0, s0, 2
addiw a0, a2, 88
slli a0, a0, 2
addiw a4, a2, 96
slli a4, a4, 2
addiw s1, a2, 104
slli s1, s1, 2
add s5, s9, s1
add s6, s9, a4
add s7, s9, a0
add s0, s9, s0
add s1, s9, s3
add a4, s9, t5
addiw a0, a2, 56
slli a0, a0, 2
add a0, s9, a0
addiw a2, a2, 48
slli a2, a2, 2
add a2, s9, a2
sw zero, 0(a2)
sw zero, 0(a0)
sw zero, 0(a4)
sw zero, 0(s1)
sw zero, 0(s0)
sw zero, 0(s7)
sw zero, 0(s6)
sw zero, 0(s5)
addi a0, a1, 1
addiw a2, a1, 1
mv a1, a0
bltu a2, t6, .LBB9_25
# %bb.26: # %for_begin52.preheader
# in Loop: Header=BB9_24 Depth=1
slli a0, t4, 2
sd a0, 40(sp)
mv a3, zero
.LBB9_27: # %for_begin55.preheader
# Parent Loop BB9_24 Depth=1
# => This Loop Header: Depth=2
# Child Loop BB9_28 Depth 3
# Child Loop BB9_29 Depth 4
srli a0, a3, 3
ld a1, 48(sp)
and a0, a0, a1
ld a1, 40(sp)
add a1, a0, a1
addi a2, zero, 200
mul a1, a1, a2
sd a3, 64(sp)
andi s5, a3, 7
or a1, a1, s5
slli a1, a1, 3
or a1, a1, s11
mul s6, a0, s2
addiw a0, a1, 192
slli a0, a0, 2
sd a0, 208(sp)
addiw a2, a1, 128
slli a0, a2, 2
sd a0, 184(sp)
addiw a4, a1, 64
slli a0, a4, 2
sd a0, 176(sp)
sext.w s0, a1
slli a3, s0, 2
addiw s1, a1, 1536
slli s10, s1, 2
addiw a0, a1, 1472
slli s7, a0, 2
addiw a2, a1, 640
slli a0, a2, 2
sd a0, 200(sp)
addiw a2, a1, 576
slli a0, a2, 2
sd a0, 168(sp)
addiw a4, a1, 512
slli a0, a4, 2
sd a0, 160(sp)
addiw a7, a1, 448
slli a0, a7, 2
sd a0, 144(sp)
addiw t0, a1, 384
slli a0, t0, 2
sd a0, 136(sp)
addiw a6, a1, 320
slli s1, a6, 2
addiw t1, a1, 256
slli t1, t1, 2
addiw t2, a1, 1408
addiw t3, a1, 1280
addiw t4, a1, 704
addiw t5, a1, 768
addiw s3, a1, 832
addiw a6, a1, 896
addiw a4, a1, 960
addiw a2, a1, 1024
addiw a0, a1, 1088
addiw t0, a1, 1152
addiw a7, a1, 1216
addiw a1, a1, 1344
slli s0, a0, 2
slli a2, a2, 2
slli a4, a4, 2
slli a6, a6, 2
slli s3, s3, 2
slli t5, t5, 2
slli t4, t4, 2
slli t3, t3, 2
slli a7, a7, 2
slli t0, t0, 2
ld a0, 56(sp)
add s7, a0, s7
add s10, a0, s10
slli t2, t2, 2
slli a1, a1, 2
add a3, a0, a3
sd a3, 192(sp)
ld a3, 176(sp)
add a3, a0, a3
sd a3, 176(sp)
ld a3, 184(sp)
add a3, a0, a3
sd a3, 184(sp)
ld a3, 208(sp)
add a3, a0, a3
sd a3, 208(sp)
add a3, a0, t1
sd a3, 152(sp)
add a3, a0, s1
sd a3, 112(sp)
ld a3, 136(sp)
add a3, a0, a3
sd a3, 120(sp)
ld a3, 144(sp)
add a3, a0, a3
sd a3, 144(sp)
ld a3, 160(sp)
add s1, a0, a3
ld a3, 168(sp)
add t1, a0, a3
ld a3, 200(sp)
add a3, a0, a3
add t4, a0, t4
add t5, a0, t5
add s3, a0, s3
add a6, a0, a6
add a4, a0, a4
add a2, a0, a2
add s0, a0, s0
add t0, a0, t0
add a7, a0, a7
add t3, a0, t3
add a1, a0, a1
add t2, a0, t2
flw ft0, 0(s10)
flw ft1, 0(s7)
flw ft2, 0(t2)
flw ft3, 0(a1)
flw ft4, 0(t3)
flw ft5, 0(a7)
flw fs3, 0(t0)
flw fs4, 0(s0)
flw fa0, 0(a2)
flw fa1, 0(a4)
flw fa2, 0(a6)
flw fa3, 0(s3)
flw fa4, 0(t5)
flw fa5, 0(t4)
flw fa6, 0(a3)
flw fa7, 0(t1)
flw ft8, 0(s1)
ld a0, 144(sp)
flw ft9, 0(a0)
fsw ft9, 128(sp)
ld a0, 120(sp)
flw ft9, 0(a0)
fsw ft9, 120(sp)
ld a0, 112(sp)
flw ft9, 0(a0)
fsw ft9, 112(sp)
ld a0, 152(sp)
flw ft9, 0(a0)
fsw ft9, 104(sp)
ld a0, 208(sp)
flw ft9, 0(a0)
fsw ft9, 96(sp)
ld a0, 184(sp)
flw ft9, 0(a0)
fsw ft9, 88(sp)
ld a0, 176(sp)
flw ft9, 0(a0)
ld a0, 192(sp)
flw fs0, 0(a0)
mv s7, zero
fsw ft0, 136(sp)
fsw ft1, 80(sp)
fsw ft2, 72(sp)
.LBB9_28: # %for_begin58.preheader
# Parent Loop BB9_24 Depth=1
# Parent Loop BB9_27 Depth=2
# => This Loop Header: Depth=3
# Child Loop BB9_29 Depth 4
add a0, s7, s6
slli a0, a0, 3
or a0, a0, s5
mul a1, a0, s2
add a0, s7, s4
addi a2, zero, 14
mul a0, a0, a2
slli a1, a1, 32
srli a1, a1, 32
slli a1, a1, 2
mv a4, zero
.LBB9_29: # %for_body59
# Parent Loop BB9_24 Depth=1
# Parent Loop BB9_27 Depth=2
# Parent Loop BB9_28 Depth=3
# => This Inner Loop Header: Depth=4
add s0, s8, a1
flw fs5, 0(s0)
fmul.s fs5, fs5, fs0
add s1, a4, a0
slli s1, s1, 3
or s1, s1, s11
sext.w s1, s1
slli s1, s1, 2
add s1, s9, s1
flw fs6, 0(s1)
fadd.s fs5, fs5, fs6
flw fs6, 4(s0)
fmul.s fs6, fs6, ft9
fadd.s ft11, fs6, fs5
fsw ft11, 176(sp)
addiw a3, a5, -1776
add a3, s0, a3
flw fs5, 0(a3)
fmul.s ft0, fs5, ft0
fsw ft0, 208(sp)
addiw a3, a5, -1780
add a3, s0, a3
flw fs6, 0(a3)
fmul.s ft0, fs6, ft1
fsw ft0, 200(sp)
addiw a3, a5, -1784
add a3, s0, a3
flw fs7, 0(a3)
fmul.s ft0, fs7, ft2
fsw ft0, 192(sp)
addiw a3, a5, -1788
add a3, s0, a3
flw fs9, 0(a3)
fmul.s ft0, fs9, ft3
fsw ft0, 184(sp)
addiw a3, a5, -1792
add a3, s0, a3
flw fs10, 0(a3)
fmul.s ft0, fs10, ft4
fsw ft0, 168(sp)
flw fs11, 1744(s0)
fmul.s ft0, fs11, ft5
fsw ft0, 160(sp)
flw ft0, 1740(s0)
fmul.s ft0, ft0, fs3
fsw ft0, 152(sp)
flw ft1, 1736(s0)
fmul.s ft0, ft1, fs4
fsw ft0, 144(sp)
flw ft2, 1732(s0)
fmul.s fs10, ft2, fa0
fmv.s fs9, ft3
flw ft3, 1728(s0)
fmul.s fs8, ft3, fa1
fmv.s fs7, ft4
flw ft4, 1168(s0)
fmul.s fs6, ft4, fa2
fmv.s fs5, ft5
flw ft5, 1164(s0)
fmul.s fs2, ft5, fa3
flw ft6, 1160(s0)
fmul.s fs1, ft6, fa4
flw ft7, 1156(s0)
fmul.s ft11, ft7, fa5
fmv.s ft10, ft9
fmv.s ft9, fa0
flw fa0, 1152(s0)
fmul.s fa0, fa0, fa6
fmv.s ft7, fa1
flw fa1, 592(s0)
fmul.s fa1, fa1, fa7
fmv.s ft6, fa2
flw fa2, 588(s0)
fmul.s fa2, fa2, ft8
fmv.s ft5, fa3
flw fa3, 584(s0)
flw ft0, 128(sp)
fmul.s fa3, fa3, ft0
fmv.s ft4, fa4
flw fa4, 580(s0)
flw ft0, 120(sp)
fmul.s fa4, fa4, ft0
fmv.s ft3, fa5
flw fa5, 576(s0)
flw ft0, 112(sp)
fmul.s fa5, fa5, ft0
fmv.s ft2, fa6
flw fa6, 16(s0)
flw ft0, 104(sp)
fmul.s fa6, fa6, ft0
fmv.s ft1, fa7
flw fa7, 12(s0)
flw ft0, 96(sp)
fmul.s fa7, fa7, ft0
fmv.s ft0, ft8
flw ft8, 8(s0)
flw fs11, 88(sp)
fmul.s ft8, ft8, fs11
flw fs11, 176(sp)
fadd.s ft8, ft8, fs11
fadd.s fa7, fa7, ft8
fmv.s ft8, ft0
fadd.s fa6, fa6, fa7
fmv.s fa7, ft1
fadd.s fa5, fa5, fa6
fmv.s fa6, ft2
fadd.s fa4, fa4, fa5
fmv.s fa5, ft3
fadd.s fa3, fa3, fa4
fmv.s fa4, ft4
fadd.s fa2, fa2, fa3
fmv.s fa3, ft5
fadd.s fa1, fa1, fa2
fmv.s fa2, ft6
fadd.s fa0, fa0, fa1
fmv.s fa1, ft7
fadd.s ft7, ft11, fa0
fmv.s fa0, ft9
fmv.s ft9, ft10
fadd.s ft6, fs1, ft7
fadd.s ft5, fs2, ft6
fadd.s ft4, fs6, ft5
fmv.s ft5, fs5
fadd.s ft3, fs8, ft4
fmv.s ft4, fs7
fadd.s ft2, fs10, ft3
fmv.s ft3, fs9
flw ft0, 144(sp)
fadd.s ft1, ft0, ft2
flw ft2, 72(sp)
flw ft0, 152(sp)
fadd.s ft0, ft0, ft1
flw ft1, 80(sp)
flw ft11, 160(sp)
fadd.s ft0, ft11, ft0
flw ft11, 168(sp)
fadd.s ft0, ft11, ft0
flw ft11, 184(sp)
fadd.s ft0, ft11, ft0
flw ft11, 192(sp)
fadd.s ft0, ft11, ft0
flw ft11, 200(sp)
fadd.s ft0, ft11, ft0
flw ft11, 208(sp)
fadd.s ft0, ft11, ft0
fsw ft0, 0(s1)
flw ft0, 136(sp)
addi a1, a1, 4
addi a4, a4, 1
addi a2, a2, -1
bnez a2, .LBB9_29
# %bb.30: # %for_end60
# in Loop: Header=BB9_28 Depth=3
addi a0, s7, 1
addiw a1, s7, 1
mv s7, a0
bltu a1, t6, .LBB9_28
# %bb.31: # %for_end57
# in Loop: Header=BB9_27 Depth=2
ld a1, 64(sp)
addi a0, a1, 1
addiw a1, a1, 1
mv a3, a0
addi a0, zero, 32
bltu a1, a0, .LBB9_27
# %bb.32: # %for_end54
# in Loop: Header=BB9_24 Depth=1
ld a1, 16(sp)
addi a0, a1, 1
addiw a1, a1, 1
mv a2, a0
addi a3, zero, 112
addi a0, zero, 64
bltu a1, a0, .LBB9_24
# %bb.33: # %for_begin64.preheader.preheader
ld a0, 56(sp)
addi t5, a0, 28
addi a6, zero, 14
addi t0, zero, 112
addi t1, zero, 784
addi a7, zero, 64
mv t2, zero
.LBB9_34: # %for_begin64.preheader
# =>This Loop Header: Depth=1
# Child Loop BB9_35 Depth 2
srliw a1, t2, 3
mul t3, a1, a6
andi t4, t2, 7
mv a2, zero
mv a3, zero
.LBB9_35: # %for_begin67.preheader
# Parent Loop BB9_34 Depth=1
# => This Inner Loop Header: Depth=2
add s1, a3, t3
mul s1, s1, t0
or s0, s1, t4
add s1, t5, a2
sext.w a5, s0
slli a5, a5, 2
add a5, s9, a5
flw ft0, 0(a5)
fsw ft0, -28(s1)
ori a5, s0, 8
sext.w a5, a5
slli a5, a5, 2
add a5, s9, a5
flw ft0, 0(a5)
fsw ft0, -24(s1)
addiw a5, s0, 16
slli a5, a5, 2
add a5, s9, a5
flw ft0, 0(a5)
fsw ft0, -20(s1)
addiw a5, s0, 48
slli t6, a5, 2
addiw a1, s0, 56
slli s2, a1, 2
addiw a4, s0, 64
slli s3, a4, 2
addiw a0, s0, 72
slli s4, a0, 2
addiw a5, s0, 80
slli s5, a5, 2
addiw a1, s0, 88
slli a1, a1, 2
addiw a4, s0, 96
slli a4, a4, 2
addiw a0, s0, 104
slli a0, a0, 2
addiw a5, s0, 32
slli s6, a5, 2
addiw a5, s0, 40
slli a5, a5, 2
add s7, s9, a0
add s10, s9, a4
add s11, s9, a1
add s5, s9, s5
add s4, s9, s4
add s3, s9, s3
add a0, s9, s2
add a4, s9, t6
add a5, s9, a5
add a1, s9, s6
addiw s0, s0, 24
slli s0, s0, 2
add s0, s9, s0
flw ft0, 0(s0)
fsw ft0, -16(s1)
flw ft0, 0(a1)
fsw ft0, -12(s1)
flw ft0, 0(a5)
fsw ft0, -8(s1)
flw ft0, 0(a4)
fsw ft0, -4(s1)
flw ft0, 0(a0)
fsw ft0, 0(s1)
flw ft0, 0(s3)
fsw ft0, 4(s1)
flw ft0, 0(s4)
fsw ft0, 8(s1)
flw ft0, 0(s5)
fsw ft0, 12(s1)
flw ft0, 0(s11)
fsw ft0, 16(s1)
flw ft0, 0(s10)
fsw ft0, 20(s1)
flw ft0, 0(s7)
fsw ft0, 24(s1)
addi a3, a3, 1
addi a2, a2, 56
bne a2, t1, .LBB9_35
# %bb.36: # %for_end66
# in Loop: Header=BB9_34 Depth=1
addi t5, t5, 784
addi t2, t2, 1
bne t2, a7, .LBB9_34
# %bb.37: # %for_begin70.preheader
ld a0, 24(sp)
addi a0, a0, 28
ld a1, 56(sp)
addi a1, a1, 28
addi a2, zero, 784
addi a3, zero, 64
mv a4, zero
.LBB9_38: # %for_begin73.preheader
# =>This Loop Header: Depth=1
# Child Loop BB9_39 Depth 2
slli a5, a4, 2
ld s1, 32(sp)
add a5, s1, a5
flw ft0, 0(a5)
mv a5, zero
.LBB9_39: # %for_begin76.preheader
# Parent Loop BB9_38 Depth=1
# => This Inner Loop Header: Depth=2
add s1, a0, a5
add s0, a1, a5
flw ft1, -28(s0)
fadd.s ft1, ft0, ft1
fsw ft1, -28(s1)
flw ft1, -24(s0)
fadd.s ft1, ft0, ft1
fsw ft1, -24(s1)
flw ft1, -20(s0)
fadd.s ft1, ft0, ft1
fsw ft1, -20(s1)
flw ft1, -16(s0)
fadd.s ft1, ft0, ft1
fsw ft1, -16(s1)
flw ft1, -12(s0)
fadd.s ft1, ft0, ft1
fsw ft1, -12(s1)
flw ft1, -8(s0)
fadd.s ft1, ft0, ft1
fsw ft1, -8(s1)
flw ft1, -4(s0)
fadd.s ft1, ft0, ft1
fsw ft1, -4(s1)
flw ft1, 0(s0)
fadd.s ft1, ft0, ft1
fsw ft1, 0(s1)
flw ft1, 4(s0)
fadd.s ft1, ft0, ft1
fsw ft1, 4(s1)
flw ft1, 8(s0)
fadd.s ft1, ft0, ft1
fsw ft1, 8(s1)
flw ft1, 12(s0)
fadd.s ft1, ft0, ft1
fsw ft1, 12(s1)
flw ft1, 16(s0)
fadd.s ft1, ft0, ft1
fsw ft1, 16(s1)
flw ft1, 20(s0)
fadd.s ft1, ft0, ft1
fsw ft1, 20(s1)
flw ft1, 24(s0)
fadd.s ft1, ft0, ft1
fsw ft1, 24(s1)
addi a5, a5, 56
bne a5, a2, .LBB9_39
# %bb.40: # %for_end75
# in Loop: Header=BB9_38 Depth=1
addi a0, a0, 784
addi a1, a1, 784
addi a4, a4, 1
bne a4, a3, .LBB9_38
# %bb.41: # %for_end72
mv a0, s9
call _ZdaPv
mv a0, s8
call _ZdaPv
ld a0, 56(sp)
call _ZdaPv
ld s11, 216(sp)
ld s10, 224(sp)
ld s9, 232(sp)
ld s8, 240(sp)
ld s7, 248(sp)
ld s6, 256(sp)
ld s5, 264(sp)
ld s4, 272(sp)
ld s3, 280(sp)
ld s2, 288(sp)
ld s1, 296(sp)
ld s0, 304(sp)
ld ra, 312(sp)
.cfi_restore ra
.cfi_restore s0
.cfi_restore s1
.cfi_restore s2
.cfi_restore s3
.cfi_restore s4
.cfi_restore s5
.cfi_restore s6
.cfi_restore s7
.cfi_restore s8
.cfi_restore s9
.cfi_restore s10
.cfi_restore s11
addi sp, sp, 320
.cfi_def_cfa_offset 0
ret
.Lfunc_end9:
.size fuse_conv2d_1_compute_, .Lfunc_end9-fuse_conv2d_1_compute_
.cfi_endproc
# -- End function
#-----------------------------------------------------------------------
# fuse_relu_1 -- argument-validating entry point for the fused ReLU kernel.
#
# In:    a0 = pointer to the argument value array (two 8-byte slots read)
#        a1 = pointer to the argument type-code array (two 32-bit codes)
#        a2 = argument count (only the low 32 bits are examined)
# Out:   a0 = 0 after a successful call to fuse_relu_1_compute_,
#             -1 after any failed check (the message is first handed to
#             the function pointer stored at __TVMAPISetLastError)
# Frame: 32 bytes; ra, s0 and s1 are saved and restored.
#
# NOTE(review): the field offsets used on the two handles (data @0,
# @8/@12 device, ndim @16, dtype code/bits/lanes @20/@21/@22, shape @24,
# strides @32, byte offset @40) look like the DLPack DLTensor layout --
# confirm against the header this module was generated for.
#
# Fix: the failure paths used to build the status as (1 << 32) - 1, i.e.
# 0x00000000FFFFFFFF.  Presumably the status is a 32-bit int; the RV64
# calling convention keeps such values sign-extended in registers, so the
# status is now materialised as a genuine -1 in one shared failure tail.
#-----------------------------------------------------------------------
    .globl fuse_relu_1 # -- Begin function fuse_relu_1
    .p2align 2
    .type fuse_relu_1,@function
fuse_relu_1: # @fuse_relu_1
    .cfi_startproc
# %bb.0: # %entry
    addi sp, sp, -32
    .cfi_def_cfa_offset 32
    sd ra, 24(sp)
    sd s0, 16(sp)
    sd s1, 8(sp)
    .cfi_offset ra, -8
    .cfi_offset s0, -16
    .cfi_offset s1, -24
    # Zero-extend the argument count and require exactly two arguments.
    slli a2, a2, 32
    srli a2, a2, 32
    addi a3, zero, 2
    bne a2, a3, .LBB10_30
# %bb.1: # %assert_end
    lwu a4, 4(a1)               # a4 = type code of argument 1
    ld a2, 8(a0)                # a2 = argument 1 handle
    lwu a3, 0(a1)               # a3 = type code of argument 0
    ld a5, 0(a0)                # a5 = argument 0 handle
    ld t0, 24(a5)               # t0 = argument 0 shape pointer
    ld a1, 0(a5)                # a1 = argument 0 data pointer (kernel source)
    ld a0, 32(a5)               # a0 = argument 0 strides pointer (may be null)
    beqz a0, .LBB10_3
# %bb.2: # %if_then
    # Strides present: the low word of strides[0] must be 1.
    lw a0, 0(a0)
    addi s0, zero, 1
    bne a0, s0, .LBB10_31
.LBB10_3: # %if_end
    ld a7, 24(a2)               # a7 = argument 1 shape pointer
    ld a0, 0(a2)                # a0 = argument 1 data pointer (kernel destination)
    lwu a6, 12(a5)              # a6 = argument 0 field @12
    lwu t1, 8(a5)               # t1 = argument 0 field @8
    ld s0, 32(a2)               # s0 = argument 1 strides pointer (may be null)
    beqz s0, .LBB10_5
# %bb.4: # %if_then3
    lw s0, 0(s0)
    addi s1, zero, 1
    bne s0, s1, .LBB10_32
.LBB10_5: # %if_end4
    # Type code of argument 0 must be one of {3, 4, 7, 13}:
    # range check first, then test against bit mask 0x2098.
    addi s1, zero, 13
    bltu s1, a3, .LBB10_25
# %bb.6: # %if_end4
    addi s1, zero, 1
    sll a3, s1, a3
    lui s1, 2
    addiw s1, s1, 152
    and a3, a3, s1
    beqz a3, .LBB10_25
# %bb.7: # %assert_end8
    # Same type-code test for argument 1.
    addi a3, zero, 13
    bltu a3, a4, .LBB10_26
# %bb.8: # %assert_end8
    addi a3, zero, 1
    sll a4, a3, a4
    lui s1, 2
    addiw s1, s1, 152
    and a4, a4, s1
    beqz a4, .LBB10_26
# %bb.9: # %assert_end10
    bne t1, a3, .LBB10_33       # argument 0 field @8 must equal 1
# %bb.10: # %assert_end12
    lw a3, 16(a5)               # argument 0 field @16 must equal 1
    addi s0, zero, 1
    bne a3, s0, .LBB10_34
# %bb.11: # %assert_end14
    lhu a3, 22(a5)              # halfword @22 must be 1
    bne a3, s0, .LBB10_35
# %bb.12: # %assert_end14
    lbu a3, 21(a5)              # byte @21 must be 32
    addi a4, zero, 32
    bne a3, a4, .LBB10_35
# %bb.13: # %assert_end14
    lbu a3, 20(a5)              # byte @20 must be 2
    addi a4, zero, 2
    bne a3, a4, .LBB10_35
# %bb.14: # %assert_end16
    lui a3, 3
    addiw a3, a3, 256           # a3 = 12544
    lw a4, 0(t0)                # low word of argument 0 shape[0]
    bne a4, a3, .LBB10_36
# %bb.15: # %assert_end18
    ld a3, 40(a5)               # argument 0 field @40 must be 0
    bnez a3, .LBB10_37
# %bb.16: # %assert_end20
    # The same sequence of checks, now on argument 1.
    lw a3, 16(a2)
    addi s0, zero, 1
    bne a3, s0, .LBB10_38
# %bb.17: # %assert_end22
    lhu a3, 22(a2)
    bne a3, s0, .LBB10_39
# %bb.18: # %assert_end22
    lbu a3, 21(a2)
    addi a4, zero, 32
    bne a3, a4, .LBB10_39
# %bb.19: # %assert_end22
    lbu a3, 20(a2)
    addi a4, zero, 2
    bne a3, a4, .LBB10_39
# %bb.20: # %assert_end24
    lui a3, 3
    addiw a3, a3, 256           # a3 = 12544
    lw a4, 0(a7)
    bne a4, a3, .LBB10_40
# %bb.21: # %assert_end26
    ld a3, 40(a2)
    bnez a3, .LBB10_41
# %bb.22: # %assert_end28
    lw a3, 8(a2)                # argument 1 field @8 must equal 1
    addi s0, zero, 1
    bne a3, s0, .LBB10_42
# %bb.23: # %assert_end30
    lw a2, 12(a2)               # field @12 must match between both arguments
    sext.w a3, a6
    bne a3, a2, .LBB10_44
# %bb.24: # %assert_end32
    # All checks passed: a0 = destination data, a1 = source data.
    call fuse_relu_1_compute_
    mv a0, zero
    j .LBB10_29
.LBB10_25: # %assert_fail7
    lui a0, %hi(__TVMAPISetLastError)
    ld a1, %lo(__TVMAPISetLastError)(a0)
    lui a0, %hi(.L.str.85)
    addi a0, a0, %lo(.L.str.85)
    j .LBB10_27
.LBB10_26: # %assert_fail9
    lui a0, %hi(__TVMAPISetLastError)
    ld a1, %lo(__TVMAPISetLastError)(a0)
    lui a0, %hi(.L.str.86)
    addi a0, a0, %lo(.L.str.86)
.LBB10_27: # %assert_fail
    # Shared failure tail: a1 = error reporter, a0 = message string.
    jalr a1
    addi a0, zero, -1           # sign-extended -1 status
.LBB10_29: # %assert_fail1
    ld s1, 8(sp)
    ld s0, 16(sp)
    ld ra, 24(sp)
    .cfi_restore ra
    .cfi_restore s0
    .cfi_restore s1
    addi sp, sp, 32
    .cfi_def_cfa_offset 0
    ret
.LBB10_30: # %assert_fail
    lui a0, %hi(__TVMAPISetLastError)
    ld a1, %lo(__TVMAPISetLastError)(a0)
    lui a0, %hi(.L.str.84)
    addi a0, a0, %lo(.L.str.84)
    j .LBB10_27
.LBB10_31: # %assert_fail1
    lui a0, %hi(__TVMAPISetLastError)
    ld a1, %lo(__TVMAPISetLastError)(a0)
    lui a0, %hi(.L.str.52)
    addi a0, a0, %lo(.L.str.52)
    j .LBB10_27
.LBB10_32: # %assert_fail5
    lui a0, %hi(__TVMAPISetLastError)
    ld a1, %lo(__TVMAPISetLastError)(a0)
    lui a0, %hi(.L.str.53)
    addi a0, a0, %lo(.L.str.53)
    j .LBB10_27
.LBB10_33: # %assert_fail11
    lui a0, %hi(__TVMAPISetLastError)
    ld a1, %lo(__TVMAPISetLastError)(a0)
    lui a0, %hi(.L.str.5)
    addi a0, a0, %lo(.L.str.5)
    j .LBB10_27
.LBB10_34: # %assert_fail13
    lui a0, %hi(__TVMAPISetLastError)
    ld a1, %lo(__TVMAPISetLastError)(a0)
    lui a0, %hi(.L.str.56)
    addi a0, a0, %lo(.L.str.56)
    j .LBB10_27
.LBB10_35: # %assert_fail15
    lui a0, %hi(__TVMAPISetLastError)
    ld a1, %lo(__TVMAPISetLastError)(a0)
    lui a0, %hi(.L.str.7)
    addi a0, a0, %lo(.L.str.7)
    j .LBB10_27
.LBB10_36: # %assert_fail17
    lui a0, %hi(__TVMAPISetLastError)
    ld a1, %lo(__TVMAPISetLastError)(a0)
    lui a0, %hi(.L.str.87)
    addi a0, a0, %lo(.L.str.87)
    j .LBB10_27
.LBB10_37: # %assert_fail19
    lui a0, %hi(__TVMAPISetLastError)
    ld a1, %lo(__TVMAPISetLastError)(a0)
    lui a0, %hi(.L.str.10)
    addi a0, a0, %lo(.L.str.10)
    j .LBB10_27
.LBB10_38: # %assert_fail21
    lui a0, %hi(__TVMAPISetLastError)
    ld a1, %lo(__TVMAPISetLastError)(a0)
    lui a0, %hi(.L.str.58)
    addi a0, a0, %lo(.L.str.58)
    j .LBB10_27
.LBB10_39: # %assert_fail23
    lui a0, %hi(__TVMAPISetLastError)
    ld a1, %lo(__TVMAPISetLastError)(a0)
    lui a0, %hi(.L.str.12)
    addi a0, a0, %lo(.L.str.12)
    j .LBB10_27
.LBB10_40: # %assert_fail25
    lui a0, %hi(__TVMAPISetLastError)
    ld a1, %lo(__TVMAPISetLastError)(a0)
    lui a0, %hi(.L.str.88)
    addi a0, a0, %lo(.L.str.88)
    j .LBB10_27
.LBB10_41: # %assert_fail27
    lui a0, %hi(__TVMAPISetLastError)
    ld a1, %lo(__TVMAPISetLastError)(a0)
    lui a0, %hi(.L.str.17)
    addi a0, a0, %lo(.L.str.17)
    j .LBB10_27
.LBB10_42: # %assert_fail29
    lui a0, %hi(__TVMAPISetLastError)
    ld a1, %lo(__TVMAPISetLastError)(a0)
    lui a0, %hi(.L.str.18)
    addi a0, a0, %lo(.L.str.18)
    j .LBB10_27
.LBB10_44: # %assert_fail31
    lui a0, %hi(__TVMAPISetLastError)
    ld a1, %lo(__TVMAPISetLastError)(a0)
    lui a0, %hi(.L.str.19)
    addi a0, a0, %lo(.L.str.19)
    j .LBB10_27
.Lfunc_end10:
    .size fuse_relu_1, .Lfunc_end10-fuse_relu_1
    .cfi_endproc
# -- End function
#-----------------------------------------------------------------------
# fuse_relu_1_compute_ -- element-wise max(x, 0.0f) over 12544 floats.
#
# In:    a0 = destination float buffer
#        a1 = source float buffer
# Uses:  a2 (elements remaining), a3 (constant address), ft0, ft1
# Leaf routine: no stack frame, no calls.  a0 and a1 are advanced past
# the last element processed.
#-----------------------------------------------------------------------
    .section .sdata,"aw",@progbits
    .p2align 2 # -- Begin function fuse_relu_1_compute_
.LCPI11_0:
    .word 0 # float 0
    .text
    .globl fuse_relu_1_compute_
    .p2align 2
    .type fuse_relu_1_compute_,@function
fuse_relu_1_compute_: # @fuse_relu_1_compute_
    # ft0 = 0.0f, the lower clamp applied to every element.
    lui a3, %hi(.LCPI11_0)
    addi a3, a3, %lo(.LCPI11_0)
    flw ft0, 0(a3)
    li a2, 12544                # element count (lui 3 / addiw 256 on RV64)
.Lfuse_relu_1_compute_next:
    flw ft1, 0(a1)              # load one source element
    addi a1, a1, 4
    fmax.s ft1, ft1, ft0        # clamp below at 0.0f
    fsw ft1, 0(a0)
    addi a0, a0, 4
    addi a2, a2, -1
    bnez a2, .Lfuse_relu_1_compute_next
    ret
.Lfunc_end11:
    .size fuse_relu_1_compute_, .Lfunc_end11-fuse_relu_1_compute_
# -- End function
#-----------------------------------------------------------------------
# fuse_max_pool2d_1 -- argument-validating entry point for the fused
# max-pool kernel.
#
# In:    a0 = pointer to the argument value array (two 8-byte slots read)
#        a1 = pointer to the argument type-code array (two 32-bit codes)
#        a2 = argument count (only the low 32 bits are examined)
# Out:   a0 = 0 after a successful call to fuse_max_pool2d_1_compute_,
#             -1 after any failed check (the message is first handed to
#             the function pointer stored at __TVMAPISetLastError)
# Frame: 16 bytes; ra and s0 are saved and restored.
#
# Checked values: argument 0 shape words {1, 64, 14, 14} and, if a
# strides array is present, strides {12544, 196, 14, 1}; argument 1 shape
# words {1, 64, 7, 7} and optional strides {3136, 49, 7, 1}.
#
# NOTE(review): the field offsets used on the two handles (data @0,
# @8/@12 device, ndim @16, dtype code/bits/lanes @20/@21/@22, shape @24,
# strides @32, byte offset @40) look like the DLPack DLTensor layout --
# confirm against the header this module was generated for.
#
# Fix: the failure paths used to build the status as (1 << 32) - 1, i.e.
# 0x00000000FFFFFFFF.  Presumably the status is a 32-bit int; the RV64
# calling convention keeps such values sign-extended in registers, so the
# status is now materialised as a genuine -1 in one shared failure tail.
#-----------------------------------------------------------------------
    .globl fuse_max_pool2d_1 # -- Begin function fuse_max_pool2d_1
    .p2align 2
    .type fuse_max_pool2d_1,@function
fuse_max_pool2d_1: # @fuse_max_pool2d_1
    .cfi_startproc
# %bb.0: # %entry
    addi sp, sp, -16
    .cfi_def_cfa_offset 16
    sd ra, 8(sp)
    sd s0, 0(sp)
    .cfi_offset ra, -8
    .cfi_offset s0, -16
    # Zero-extend the argument count and require exactly two arguments.
    slli a2, a2, 32
    srli a2, a2, 32
    addi a3, zero, 2
    bne a2, a3, .LBB12_42
# %bb.1: # %assert_end
    lwu t0, 4(a1)               # t0 = type code of argument 1
    ld a2, 8(a0)                # a2 = argument 1 handle
    lwu t3, 0(a1)               # t3 = type code of argument 0
    ld a5, 0(a0)                # a5 = argument 0 handle
    ld t2, 24(a5)               # t2 = argument 0 shape pointer
    ld a1, 0(a5)                # a1 = argument 0 data pointer (kernel source)
    ld a0, 32(a5)               # a0 = argument 0 strides pointer (may be null)
    beqz a0, .LBB12_6
# %bb.2: # %if_then
    # Strides present on argument 0: expect 12544, 196, 14, 1.
    lui a3, 3
    addiw a3, a3, 256           # a3 = 12544
    lw s0, 0(a0)
    bne s0, a3, .LBB12_43
# %bb.3: # %if_then
    ld a3, 8(a0)
    slli a3, a3, 32
    srli a3, a3, 32
    addi s0, zero, 196
    bne a3, s0, .LBB12_43
# %bb.4: # %if_then
    ld a3, 16(a0)
    slli a3, a3, 32
    srli a3, a3, 32
    addi s0, zero, 14
    bne a3, s0, .LBB12_43
# %bb.5: # %if_then
    ld a0, 24(a0)
    slli a0, a0, 32
    srli a0, a0, 32
    addi a3, zero, 1
    bne a0, a3, .LBB12_43
.LBB12_6: # %if_end
    ld a7, 24(a2)               # a7 = argument 1 shape pointer
    ld a0, 0(a2)                # a0 = argument 1 data pointer (kernel destination)
    lwu a6, 12(a5)              # a6 = argument 0 field @12
    lwu t1, 8(a5)               # t1 = argument 0 field @8
    ld a3, 32(a2)               # a3 = argument 1 strides pointer (may be null)
    beqz a3, .LBB12_11
# %bb.7: # %if_then3
    # Strides present on argument 1: expect 3136, 49, 7, 1.
    lui s0, 1
    addiw s0, s0, -960          # s0 = 3136
    lw a4, 0(a3)
    bne a4, s0, .LBB12_44
# %bb.8: # %if_then3
    ld a4, 8(a3)
    slli a4, a4, 32
    srli a4, a4, 32
    addi s0, zero, 49
    bne a4, s0, .LBB12_44
# %bb.9: # %if_then3
    ld a4, 16(a3)
    slli a4, a4, 32
    srli a4, a4, 32
    addi s0, zero, 7
    bne a4, s0, .LBB12_44
# %bb.10: # %if_then3
    ld a3, 24(a3)
    slli a3, a3, 32
    srli a3, a3, 32
    addi a4, zero, 1
    bne a3, a4, .LBB12_44
.LBB12_11: # %if_end4
    # Type code of argument 0 must be one of {3, 4, 7, 13}:
    # range check first, then test against bit mask 0x2098.
    addi a3, zero, 13
    bltu a3, t3, .LBB12_37
# %bb.12: # %if_end4
    addi a3, zero, 1
    sll a3, a3, t3
    lui a4, 2
    addiw a4, a4, 152
    and a3, a3, a4
    beqz a3, .LBB12_37
# %bb.13: # %assert_end8
    # Same type-code test for argument 1.
    addi a3, zero, 13
    bltu a3, t0, .LBB12_38
# %bb.14: # %assert_end8
    addi a3, zero, 1
    sll a4, a3, t0
    lui s0, 2
    addiw s0, s0, 152
    and a4, a4, s0
    beqz a4, .LBB12_38
# %bb.15: # %assert_end10
    bne t1, a3, .LBB12_45       # argument 0 field @8 must equal 1
# %bb.16: # %assert_end12
    lw a3, 16(a5)               # argument 0 field @16 must equal 4
    addi a4, zero, 4
    bne a3, a4, .LBB12_46
# %bb.17: # %assert_end14
    lhu a3, 22(a5)              # halfword @22 must be 1
    addi s0, zero, 1
    bne a3, s0, .LBB12_47
# %bb.18: # %assert_end14
    lbu a3, 21(a5)              # byte @21 must be 32
    addi a4, zero, 32
    bne a3, a4, .LBB12_47
# %bb.19: # %assert_end14
    lbu a3, 20(a5)              # byte @20 must be 2
    addi a4, zero, 2
    bne a3, a4, .LBB12_47
# %bb.20: # %assert_end16
    # Argument 0 shape words must be 1, 64, 14, 14.
    lw a3, 0(t2)
    addi s0, zero, 1
    bne a3, s0, .LBB12_48
# %bb.21: # %assert_end18
    lw a3, 8(t2)
    addi a4, zero, 64
    bne a3, a4, .LBB12_49
# %bb.22: # %assert_end20
    lw a4, 16(t2)
    addi a3, zero, 14
    bne a4, a3, .LBB12_50
# %bb.23: # %assert_end22
    lw a4, 24(t2)
    bne a4, a3, .LBB12_51
# %bb.24: # %assert_end24
    ld a3, 40(a5)               # argument 0 field @40 must be 0
    bnez a3, .LBB12_52
# %bb.25: # %assert_end26
    # The same sequence of checks, now on argument 1.
    lw a3, 16(a2)
    addi a4, zero, 4
    bne a3, a4, .LBB12_53
# %bb.26: # %assert_end28
    lhu a3, 22(a2)
    addi s0, zero, 1
    bne a3, s0, .LBB12_54
# %bb.27: # %assert_end28
    lbu a3, 21(a2)
    addi a4, zero, 32
    bne a3, a4, .LBB12_54
# %bb.28: # %assert_end28
    lbu a3, 20(a2)
    addi a4, zero, 2
    bne a3, a4, .LBB12_54
# %bb.29: # %assert_end30
    # Argument 1 shape words must be 1, 64, 7, 7.
    lw a3, 0(a7)
    addi s0, zero, 1
    bne a3, s0, .LBB12_55
# %bb.30: # %assert_end32
    lw a3, 8(a7)
    addi a4, zero, 64
    bne a3, a4, .LBB12_56
# %bb.31: # %assert_end34
    lw a4, 16(a7)
    addi a3, zero, 7
    bne a4, a3, .LBB12_57
# %bb.32: # %assert_end36
    lw a4, 24(a7)
    bne a4, a3, .LBB12_58
# %bb.33: # %assert_end38
    ld a3, 40(a2)
    bnez a3, .LBB12_59
# %bb.34: # %assert_end40
    lw a3, 8(a2)                # argument 1 field @8 must equal 1
    addi s0, zero, 1
    bne a3, s0, .LBB12_60
# %bb.35: # %assert_end42
    lw a2, 12(a2)               # field @12 must match between both arguments
    sext.w a3, a6
    bne a3, a2, .LBB12_62
# %bb.36: # %assert_end44
    # All checks passed: a0 = destination data, a1 = source data.
    call fuse_max_pool2d_1_compute_
    mv a0, zero
    j .LBB12_41
.LBB12_37: # %assert_fail7
    lui a0, %hi(__TVMAPISetLastError)
    ld a1, %lo(__TVMAPISetLastError)(a0)
    lui a0, %hi(.L.str.92)
    addi a0, a0, %lo(.L.str.92)
    j .LBB12_39
.LBB12_38: # %assert_fail9
    lui a0, %hi(__TVMAPISetLastError)
    ld a1, %lo(__TVMAPISetLastError)(a0)
    lui a0, %hi(.L.str.93)
    addi a0, a0, %lo(.L.str.93)
.LBB12_39: # %assert_fail
    # Shared failure tail: a1 = error reporter, a0 = message string.
    jalr a1
    addi a0, zero, -1           # sign-extended -1 status
.LBB12_41: # %assert_fail15
    ld s0, 0(sp)
    ld ra, 8(sp)
    .cfi_restore ra
    .cfi_restore s0
    addi sp, sp, 16
    .cfi_def_cfa_offset 0
    ret
.LBB12_42: # %assert_fail
    lui a0, %hi(__TVMAPISetLastError)
    ld a1, %lo(__TVMAPISetLastError)(a0)
    lui a0, %hi(.L.str.89)
    addi a0, a0, %lo(.L.str.89)
    j .LBB12_39
.LBB12_43: # %assert_fail1
    lui a0, %hi(__TVMAPISetLastError)
    ld a1, %lo(__TVMAPISetLastError)(a0)
    lui a0, %hi(.L.str.90)
    addi a0, a0, %lo(.L.str.90)
    j .LBB12_39
.LBB12_44: # %assert_fail5
    lui a0, %hi(__TVMAPISetLastError)
    ld a1, %lo(__TVMAPISetLastError)(a0)
    lui a0, %hi(.L.str.91)
    addi a0, a0, %lo(.L.str.91)
    j .LBB12_39
.LBB12_45: # %assert_fail11
    lui a0, %hi(__TVMAPISetLastError)
    ld a1, %lo(__TVMAPISetLastError)(a0)
    lui a0, %hi(.L.str.5)
    addi a0, a0, %lo(.L.str.5)
    j .LBB12_39
.LBB12_46: # %assert_fail13
    lui a0, %hi(__TVMAPISetLastError)
    ld a1, %lo(__TVMAPISetLastError)(a0)
    lui a0, %hi(.L.str.29)
    addi a0, a0, %lo(.L.str.29)
    j .LBB12_39
.LBB12_47: # %assert_fail15
    lui a0, %hi(__TVMAPISetLastError)
    ld a1, %lo(__TVMAPISetLastError)(a0)
    lui a0, %hi(.L.str.7)
    addi a0, a0, %lo(.L.str.7)
    j .LBB12_39
.LBB12_48: # %assert_fail17
    lui a0, %hi(__TVMAPISetLastError)
    ld a1, %lo(__TVMAPISetLastError)(a0)
    lui a0, %hi(.L.str.8)
    addi a0, a0, %lo(.L.str.8)
    j .LBB12_39
.LBB12_49: # %assert_fail19
    lui a0, %hi(__TVMAPISetLastError)
    ld a1, %lo(__TVMAPISetLastError)(a0)
    lui a0, %hi(.L.str.94)
    addi a0, a0, %lo(.L.str.94)
    j .LBB12_39
.LBB12_50: # %assert_fail21
    lui a0, %hi(__TVMAPISetLastError)
    ld a1, %lo(__TVMAPISetLastError)(a0)
    lui a0, %hi(.L.str.77)
    addi a0, a0, %lo(.L.str.77)
    j .LBB12_39
.LBB12_51: # %assert_fail23
    lui a0, %hi(__TVMAPISetLastError)
    ld a1, %lo(__TVMAPISetLastError)(a0)
    lui a0, %hi(.L.str.78)
    addi a0, a0, %lo(.L.str.78)
    j .LBB12_39
.LBB12_52: # %assert_fail25
    lui a0, %hi(__TVMAPISetLastError)
    ld a1, %lo(__TVMAPISetLastError)(a0)
    lui a0, %hi(.L.str.10)
    addi a0, a0, %lo(.L.str.10)
    j .LBB12_39
.LBB12_53: # %assert_fail27
    lui a0, %hi(__TVMAPISetLastError)
    ld a1, %lo(__TVMAPISetLastError)(a0)
    lui a0, %hi(.L.str.11)
    addi a0, a0, %lo(.L.str.11)
    j .LBB12_39
.LBB12_54: # %assert_fail29
    lui a0, %hi(__TVMAPISetLastError)
    ld a1, %lo(__TVMAPISetLastError)(a0)
    lui a0, %hi(.L.str.12)
    addi a0, a0, %lo(.L.str.12)
    j .LBB12_39
.LBB12_55: # %assert_fail31
    lui a0, %hi(__TVMAPISetLastError)
    ld a1, %lo(__TVMAPISetLastError)(a0)
    lui a0, %hi(.L.str.13)
    addi a0, a0, %lo(.L.str.13)
    j .LBB12_39
.LBB12_56: # %assert_fail33
    lui a0, %hi(__TVMAPISetLastError)
    ld a1, %lo(__TVMAPISetLastError)(a0)
    lui a0, %hi(.L.str.95)
    addi a0, a0, %lo(.L.str.95)
    j .LBB12_39
.LBB12_57: # %assert_fail35
    lui a0, %hi(__TVMAPISetLastError)
    ld a1, %lo(__TVMAPISetLastError)(a0)
    lui a0, %hi(.L.str.96)
    addi a0, a0, %lo(.L.str.96)
    j .LBB12_39
.LBB12_58: # %assert_fail37
    lui a0, %hi(__TVMAPISetLastError)
    ld a1, %lo(__TVMAPISetLastError)(a0)
    lui a0, %hi(.L.str.97)
    addi a0, a0, %lo(.L.str.97)
    j .LBB12_39
.LBB12_59: # %assert_fail39
    lui a0, %hi(__TVMAPISetLastError)
    ld a1, %lo(__TVMAPISetLastError)(a0)
    lui a0, %hi(.L.str.17)
    addi a0, a0, %lo(.L.str.17)
    j .LBB12_39
.LBB12_60: # %assert_fail41
    lui a0, %hi(__TVMAPISetLastError)
    ld a1, %lo(__TVMAPISetLastError)(a0)
    lui a0, %hi(.L.str.18)
    addi a0, a0, %lo(.L.str.18)
    j .LBB12_39
.LBB12_62: # %assert_fail43
    lui a0, %hi(__TVMAPISetLastError)
    ld a1, %lo(__TVMAPISetLastError)(a0)
    lui a0, %hi(.L.str.19)
    addi a0, a0, %lo(.L.str.19)
    j .LBB12_39
.Lfunc_end12:
    .size fuse_max_pool2d_1, .Lfunc_end12-fuse_max_pool2d_1
    .cfi_endproc
# -- End function
#-----------------------------------------------------------------------
# fuse_max_pool2d_1_compute_ -- 2x2 maximum over 64 planes of 14x14
# floats, producing 64 planes of 7x7 floats.
#
# In:    a0 = destination float buffer (advanced 196 bytes per plane)
#        a1 = source float buffer
# Uses:  a1-a7, t0, ft0-ft2; leaf routine with no stack frame.
#
# Each output is the running maximum of four source floats: two adjacent
# values in one 56-byte source row and the two below them in the next
# row.  The running value starts at the constant .LCPI13_0 (-FLT_MAX) and
# is replaced whenever "candidate < running" is false, so a candidate
# that does not compare less (including an unordered compare) is taken.
#-----------------------------------------------------------------------
.section .sdata,"aw",@progbits
.p2align 2 # -- Begin function fuse_max_pool2d_1_compute_
.LCPI13_0:
.word 4286578687 # float -3.40282347E+38
.text
.globl fuse_max_pool2d_1_compute_
.p2align 2
.type fuse_max_pool2d_1_compute_,@function
fuse_max_pool2d_1_compute_: # @fuse_max_pool2d_1_compute_
# %bb.0: # %entry
# a7 = source + 56 bytes: the second row of the first two-row band.
addi a7, a1, 56
lui a1, %hi(.LCPI13_0)
addi a1, a1, %lo(.LCPI13_0)
# ft0 = -FLT_MAX, the initial value of every window maximum.
flw ft0, 0(a1)
# a2 = 220: value of a5 that ends the per-plane loop (24 + 7 * 28).
addi a2, zero, 220
# a6 = 64 planes; t0 counts planes done.
addi a6, zero, 64
mv t0, zero
j .LBB13_2
.LBB13_1: # %for_end3
# in Loop: Header=BB13_2 Depth=1
# Next plane: source advances 784 bytes, destination 196 bytes.
addi a7, a7, 784
addi a0, a0, 196
addi t0, t0, 1
beq t0, a6, .LBB13_60
.LBB13_2: # %for_begin1.preheader
# =>This Loop Header: Depth=1
# Child Loop BB13_4 Depth 2
# a5 = byte offset of the last output of the current row (starts at 24);
# a1 = cursor into the lower row of the current source band.
addi a5, zero, 24
mv a1, a7
j .LBB13_4
.LBB13_3: # %for_begin4.preheader
# in Loop: Header=BB13_4 Depth=2
# Store the seventh output of the row, then step to the next band:
# two source rows (112 bytes) and one output row (28 bytes).
fsw ft1, 0(a3)
addi a1, a1, 112
addi a5, a5, 28
beq a5, a2, .LBB13_1
.LBB13_4: # %for_begin4.preheader
# Parent Loop BB13_2 Depth=1
# => This Inner Loop Header: Depth=2
# ---- output 0: source offsets -56, -52, 0, 4 ----
flw ft2, -56(a1)
flt.s a3, ft2, ft0
fmv.s ft1, ft0
bnez a3, .LBB13_6
# %bb.5: # %for_begin4.preheader
# in Loop: Header=BB13_4 Depth=2
fmv.s ft1, ft2
.LBB13_6: # %for_begin4.preheader
# in Loop: Header=BB13_4 Depth=2
flw ft2, -52(a1)
flt.s a3, ft2, ft1
bnez a3, .LBB13_8
# %bb.7: # %for_begin4.preheader
# in Loop: Header=BB13_4 Depth=2
fmv.s ft1, ft2
.LBB13_8: # %for_begin4.preheader
# in Loop: Header=BB13_4 Depth=2
flw ft2, 0(a1)
flt.s a3, ft2, ft1
bnez a3, .LBB13_10
# %bb.9: # %for_begin4.preheader
# in Loop: Header=BB13_4 Depth=2
fmv.s ft1, ft2
.LBB13_10: # %for_begin4.preheader
# in Loop: Header=BB13_4 Depth=2
flw ft2, 4(a1)
flt.s a3, ft2, ft1
bnez a3, .LBB13_12
# %bb.11: # %for_begin4.preheader
# in Loop: Header=BB13_4 Depth=2
fmv.s ft1, ft2
.LBB13_12: # %for_begin4.preheader
# in Loop: Header=BB13_4 Depth=2
# a3 = destination + a5; the seven outputs of this row live at
# offsets -24 .. 0 from a3.
add a3, a0, a5
fsw ft1, -24(a3)
# ---- output 1: source offsets -48, -44, 8, 12 ----
flw ft2, -48(a1)
flt.s a4, ft2, ft0
fmv.s ft1, ft0
bnez a4, .LBB13_14
# %bb.13: # %for_begin4.preheader
# in Loop: Header=BB13_4 Depth=2
fmv.s ft1, ft2
.LBB13_14: # %for_begin4.preheader
# in Loop: Header=BB13_4 Depth=2
flw ft2, -44(a1)
flt.s a4, ft2, ft1
bnez a4, .LBB13_16
# %bb.15: # %for_begin4.preheader
# in Loop: Header=BB13_4 Depth=2
fmv.s ft1, ft2
.LBB13_16: # %for_begin4.preheader
# in Loop: Header=BB13_4 Depth=2
flw ft2, 8(a1)
flt.s a4, ft2, ft1
bnez a4, .LBB13_18
# %bb.17: # %for_begin4.preheader
# in Loop: Header=BB13_4 Depth=2
fmv.s ft1, ft2
.LBB13_18: # %for_begin4.preheader
# in Loop: Header=BB13_4 Depth=2
flw ft2, 12(a1)
flt.s a4, ft2, ft1
bnez a4, .LBB13_20
# %bb.19: # %for_begin4.preheader
# in Loop: Header=BB13_4 Depth=2
fmv.s ft1, ft2
.LBB13_20: # %for_begin4.preheader
# in Loop: Header=BB13_4 Depth=2
fsw ft1, -20(a3)
# ---- output 2: source offsets -40, -36, 16, 20 ----
flw ft2, -40(a1)
flt.s a4, ft2, ft0
fmv.s ft1, ft0
bnez a4, .LBB13_22
# %bb.21: # %for_begin4.preheader
# in Loop: Header=BB13_4 Depth=2
fmv.s ft1, ft2
.LBB13_22: # %for_begin4.preheader
# in Loop: Header=BB13_4 Depth=2
flw ft2, -36(a1)
flt.s a4, ft2, ft1
bnez a4, .LBB13_24
# %bb.23: # %for_begin4.preheader
# in Loop: Header=BB13_4 Depth=2
fmv.s ft1, ft2
.LBB13_24: # %for_begin4.preheader
# in Loop: Header=BB13_4 Depth=2
flw ft2, 16(a1)
flt.s a4, ft2, ft1
bnez a4, .LBB13_26
# %bb.25: # %for_begin4.preheader
# in Loop: Header=BB13_4 Depth=2
fmv.s ft1, ft2
.LBB13_26: # %for_begin4.preheader
# in Loop: Header=BB13_4 Depth=2
flw ft2, 20(a1)
flt.s a4, ft2, ft1
bnez a4, .LBB13_28
# %bb.27: # %for_begin4.preheader
# in Loop: Header=BB13_4 Depth=2
fmv.s ft1, ft2
.LBB13_28: # %for_begin4.preheader
# in Loop: Header=BB13_4 Depth=2
fsw ft1, -16(a3)
# ---- output 3: source offsets -32, -28, 24, 28 ----
flw ft2, -32(a1)
flt.s a4, ft2, ft0
fmv.s ft1, ft0
bnez a4, .LBB13_30
# %bb.29: # %for_begin4.preheader
# in Loop: Header=BB13_4 Depth=2
fmv.s ft1, ft2
.LBB13_30: # %for_begin4.preheader
# in Loop: Header=BB13_4 Depth=2
flw ft2, -28(a1)
flt.s a4, ft2, ft1
bnez a4, .LBB13_32
# %bb.31: # %for_begin4.preheader
# in Loop: Header=BB13_4 Depth=2
fmv.s ft1, ft2
.LBB13_32: # %for_begin4.preheader
# in Loop: Header=BB13_4 Depth=2
flw ft2, 24(a1)
flt.s a4, ft2, ft1
bnez a4, .LBB13_34
# %bb.33: # %for_begin4.preheader
# in Loop: Header=BB13_4 Depth=2
fmv.s ft1, ft2
.LBB13_34: # %for_begin4.preheader
# in Loop: Header=BB13_4 Depth=2
flw ft2, 28(a1)
flt.s a4, ft2, ft1
bnez a4, .LBB13_36
# %bb.35: # %for_begin4.preheader
# in Loop: Header=BB13_4 Depth=2
fmv.s ft1, ft2
.LBB13_36: # %for_begin4.preheader
# in Loop: Header=BB13_4 Depth=2
fsw ft1, -12(a3)
# ---- output 4: source offsets -24, -20, 32, 36 ----
flw ft2, -24(a1)
flt.s a4, ft2, ft0
fmv.s ft1, ft0
bnez a4, .LBB13_38
# %bb.37: # %for_begin4.preheader
# in Loop: Header=BB13_4 Depth=2
fmv.s ft1, ft2
.LBB13_38: # %for_begin4.preheader
# in Loop: Header=BB13_4 Depth=2
flw ft2, -20(a1)
flt.s a4, ft2, ft1
bnez a4, .LBB13_40
# %bb.39: # %for_begin4.preheader
# in Loop: Header=BB13_4 Depth=2
fmv.s ft1, ft2
.LBB13_40: # %for_begin4.preheader
# in Loop: Header=BB13_4 Depth=2
flw ft2, 32(a1)
flt.s a4, ft2, ft1
bnez a4, .LBB13_42
# %bb.41: # %for_begin4.preheader
# in Loop: Header=BB13_4 Depth=2
fmv.s ft1, ft2
.LBB13_42: # %for_begin4.preheader
# in Loop: Header=BB13_4 Depth=2
flw ft2, 36(a1)
flt.s a4, ft2, ft1
bnez a4, .LBB13_44
# %bb.43: # %for_begin4.preheader
# in Loop: Header=BB13_4 Depth=2
fmv.s ft1, ft2
.LBB13_44: # %for_begin4.preheader
# in Loop: Header=BB13_4 Depth=2
fsw ft1, -8(a3)
# ---- output 5: source offsets -16, -12, 40, 44 ----
flw ft2, -16(a1)
flt.s a4, ft2, ft0
fmv.s ft1, ft0
bnez a4, .LBB13_46
# %bb.45: # %for_begin4.preheader
# in Loop: Header=BB13_4 Depth=2
fmv.s ft1, ft2
.LBB13_46: # %for_begin4.preheader
# in Loop: Header=BB13_4 Depth=2
flw ft2, -12(a1)
flt.s a4, ft2, ft1
bnez a4, .LBB13_48
# %bb.47: # %for_begin4.preheader
# in Loop: Header=BB13_4 Depth=2
fmv.s ft1, ft2
.LBB13_48: # %for_begin4.preheader
# in Loop: Header=BB13_4 Depth=2
flw ft2, 40(a1)
flt.s a4, ft2, ft1
bnez a4, .LBB13_50
# %bb.49: # %for_begin4.preheader
# in Loop: Header=BB13_4 Depth=2
fmv.s ft1, ft2
.LBB13_50: # %for_begin4.preheader
# in Loop: Header=BB13_4 Depth=2
flw ft2, 44(a1)
flt.s a4, ft2, ft1
bnez a4, .LBB13_52
# %bb.51: # %for_begin4.preheader
# in Loop: Header=BB13_4 Depth=2
fmv.s ft1, ft2
.LBB13_52: # %for_begin4.preheader
# in Loop: Header=BB13_4 Depth=2
fsw ft1, -4(a3)
# ---- output 6: source offsets -8, -4, 48, 52 (stored at .LBB13_3) ----
flw ft2, -8(a1)
flt.s a4, ft2, ft0
fmv.s ft1, ft0
bnez a4, .LBB13_54
# %bb.53: # %for_begin4.preheader
# in Loop: Header=BB13_4 Depth=2
fmv.s ft1, ft2
.LBB13_54: # %for_begin4.preheader
# in Loop: Header=BB13_4 Depth=2
flw ft2, -4(a1)
flt.s a4, ft2, ft1
bnez a4, .LBB13_56
# %bb.55: # %for_begin4.preheader
# in Loop: Header=BB13_4 Depth=2
fmv.s ft1, ft2
.LBB13_56: # %for_begin4.preheader
# in Loop: Header=BB13_4 Depth=2
flw ft2, 48(a1)
flt.s a4, ft2, ft1
bnez a4, .LBB13_58
# %bb.57: # %for_begin4.preheader
# in Loop: Header=BB13_4 Depth=2
fmv.s ft1, ft2
.LBB13_58: # %for_begin4.preheader
# in Loop: Header=BB13_4 Depth=2
flw ft2, 52(a1)
flt.s a4, ft2, ft1
bnez a4, .LBB13_3
# %bb.59: # %for_begin4.preheader
# in Loop: Header=BB13_4 Depth=2
fmv.s ft1, ft2
j .LBB13_3
.LBB13_60: # %for_end
ret
.Lfunc_end13:
.size fuse_max_pool2d_1_compute_, .Lfunc_end13-fuse_max_pool2d_1_compute_
# -- End function
#-----------------------------------------------------------------------
# fuse_transpose -- argument-validating entry point for the fused
# transpose kernel.
#
# In:    a0 = pointer to the argument value array (two 8-byte slots read)
#        a1 = pointer to the argument type-code array (two 32-bit codes)
#        a2 = argument count (only the low 32 bits are examined)
# Out:   a0 = 0 after a successful call to fuse_transpose_compute_,
#             -1 after any failed check (the message is first handed to
#             the function pointer stored at __TVMAPISetLastError)
# Frame: 16 bytes; ra and s0 are saved and restored.
#
# Checked values: argument 0 shape words {1, 64, 7, 7} and, if a strides
# array is present, strides {3136, 49, 7, 1}; argument 1 shape words
# {1, 7, 7, 64} and optional strides {3136, 448, 64, 1}.
#
# NOTE(review): the field offsets used on the two handles (data @0,
# @8/@12 device, ndim @16, dtype code/bits/lanes @20/@21/@22, shape @24,
# strides @32, byte offset @40) look like the DLPack DLTensor layout --
# confirm against the header this module was generated for.
#
# Fix: the failure paths used to build the status as (1 << 32) - 1, i.e.
# 0x00000000FFFFFFFF.  Presumably the status is a 32-bit int; the RV64
# calling convention keeps such values sign-extended in registers, so the
# status is now materialised as a genuine -1 in one shared failure tail.
#-----------------------------------------------------------------------
    .globl fuse_transpose # -- Begin function fuse_transpose
    .p2align 2
    .type fuse_transpose,@function
fuse_transpose: # @fuse_transpose
    .cfi_startproc
# %bb.0: # %entry
    addi sp, sp, -16
    .cfi_def_cfa_offset 16
    sd ra, 8(sp)
    sd s0, 0(sp)
    .cfi_offset ra, -8
    .cfi_offset s0, -16
    # Zero-extend the argument count and require exactly two arguments.
    slli a2, a2, 32
    srli a2, a2, 32
    addi a3, zero, 2
    bne a2, a3, .LBB14_42
# %bb.1: # %assert_end
    lwu t0, 4(a1)               # t0 = type code of argument 1
    ld a2, 8(a0)                # a2 = argument 1 handle
    lwu t3, 0(a1)               # t3 = type code of argument 0
    ld a5, 0(a0)                # a5 = argument 0 handle
    ld t2, 24(a5)               # t2 = argument 0 shape pointer
    ld a1, 0(a5)                # a1 = argument 0 data pointer (kernel source)
    ld a0, 32(a5)               # a0 = argument 0 strides pointer (may be null)
    beqz a0, .LBB14_6
# %bb.2: # %if_then
    # Strides present on argument 0: expect 3136, 49, 7, 1.
    lui a3, 1
    addiw a3, a3, -960          # a3 = 3136
    lw s0, 0(a0)
    bne s0, a3, .LBB14_43
# %bb.3: # %if_then
    ld a3, 8(a0)
    slli a3, a3, 32
    srli a3, a3, 32
    addi s0, zero, 49
    bne a3, s0, .LBB14_43
# %bb.4: # %if_then
    ld a3, 16(a0)
    slli a3, a3, 32
    srli a3, a3, 32
    addi s0, zero, 7
    bne a3, s0, .LBB14_43
# %bb.5: # %if_then
    ld a0, 24(a0)
    slli a0, a0, 32
    srli a0, a0, 32
    addi a3, zero, 1
    bne a0, a3, .LBB14_43
.LBB14_6: # %if_end
    ld a7, 24(a2)               # a7 = argument 1 shape pointer
    ld a0, 0(a2)                # a0 = argument 1 data pointer (kernel destination)
    lwu a6, 12(a5)              # a6 = argument 0 field @12
    lwu t1, 8(a5)               # t1 = argument 0 field @8
    ld a3, 32(a2)               # a3 = argument 1 strides pointer (may be null)
    beqz a3, .LBB14_11
# %bb.7: # %if_then3
    # Strides present on argument 1: expect 3136, 448, 64, 1.
    lui s0, 1
    addiw s0, s0, -960          # s0 = 3136
    lw a4, 0(a3)
    bne a4, s0, .LBB14_44
# %bb.8: # %if_then3
    ld a4, 8(a3)
    slli a4, a4, 32
    srli a4, a4, 32
    addi s0, zero, 448
    bne a4, s0, .LBB14_44
# %bb.9: # %if_then3
    ld a4, 16(a3)
    slli a4, a4, 32
    srli a4, a4, 32
    addi s0, zero, 64
    bne a4, s0, .LBB14_44
# %bb.10: # %if_then3
    ld a3, 24(a3)
    slli a3, a3, 32
    srli a3, a3, 32
    addi a4, zero, 1
    bne a3, a4, .LBB14_44
.LBB14_11: # %if_end4
    # Type code of argument 0 must be one of {3, 4, 7, 13}:
    # range check first, then test against bit mask 0x2098.
    addi a3, zero, 13
    bltu a3, t3, .LBB14_37
# %bb.12: # %if_end4
    addi a3, zero, 1
    sll a3, a3, t3
    lui a4, 2
    addiw a4, a4, 152
    and a3, a3, a4
    beqz a3, .LBB14_37
# %bb.13: # %assert_end8
    # Same type-code test for argument 1.
    addi a3, zero, 13
    bltu a3, t0, .LBB14_38
# %bb.14: # %assert_end8
    addi a3, zero, 1
    sll a4, a3, t0
    lui s0, 2
    addiw s0, s0, 152
    and a4, a4, s0
    beqz a4, .LBB14_38
# %bb.15: # %assert_end10
    bne t1, a3, .LBB14_45       # argument 0 field @8 must equal 1
# %bb.16: # %assert_end12
    lw a3, 16(a5)               # argument 0 field @16 must equal 4
    addi a4, zero, 4
    bne a3, a4, .LBB14_46
# %bb.17: # %assert_end14
    lhu a3, 22(a5)              # halfword @22 must be 1
    addi s0, zero, 1
    bne a3, s0, .LBB14_47
# %bb.18: # %assert_end14
    lbu a3, 21(a5)              # byte @21 must be 32
    addi a4, zero, 32
    bne a3, a4, .LBB14_47
# %bb.19: # %assert_end14
    lbu a3, 20(a5)              # byte @20 must be 2
    addi a4, zero, 2
    bne a3, a4, .LBB14_47
# %bb.20: # %assert_end16
    # Argument 0 shape words must be 1, 64, 7, 7.
    lw a3, 0(t2)
    addi s0, zero, 1
    bne a3, s0, .LBB14_48
# %bb.21: # %assert_end18
    lw a3, 8(t2)
    addi a4, zero, 64
    bne a3, a4, .LBB14_49
# %bb.22: # %assert_end20
    lw a4, 16(t2)
    addi a3, zero, 7
    bne a4, a3, .LBB14_50
# %bb.23: # %assert_end22
    lw a4, 24(t2)
    bne a4, a3, .LBB14_51
# %bb.24: # %assert_end24
    ld a3, 40(a5)               # argument 0 field @40 must be 0
    bnez a3, .LBB14_52
# %bb.25: # %assert_end26
    # The same sequence of checks, now on argument 1.
    lw a3, 16(a2)
    addi a4, zero, 4
    bne a3, a4, .LBB14_53
# %bb.26: # %assert_end28
    lhu a3, 22(a2)
    addi s0, zero, 1
    bne a3, s0, .LBB14_54
# %bb.27: # %assert_end28
    lbu a3, 21(a2)
    addi a4, zero, 32
    bne a3, a4, .LBB14_54
# %bb.28: # %assert_end28
    lbu a3, 20(a2)
    addi a4, zero, 2
    bne a3, a4, .LBB14_54
# %bb.29: # %assert_end30
    # Argument 1 shape words must be 1, 7, 7, 64.
    lw a3, 0(a7)
    addi s0, zero, 1
    bne a3, s0, .LBB14_55
# %bb.30: # %assert_end32
    lw a4, 8(a7)
    addi a3, zero, 7
    bne a4, a3, .LBB14_56
# %bb.31: # %assert_end34
    lw a4, 16(a7)
    bne a4, a3, .LBB14_57
# %bb.32: # %assert_end36
    lw a3, 24(a7)
    addi a4, zero, 64
    bne a3, a4, .LBB14_58
# %bb.33: # %assert_end38
    ld a3, 40(a2)
    bnez a3, .LBB14_59
# %bb.34: # %assert_end40
    lw a3, 8(a2)                # argument 1 field @8 must equal 1
    addi s0, zero, 1
    bne a3, s0, .LBB14_60
# %bb.35: # %assert_end42
    lw a2, 12(a2)               # field @12 must match between both arguments
    sext.w a3, a6
    bne a3, a2, .LBB14_62
# %bb.36: # %assert_end44
    # All checks passed: a0 = destination data, a1 = source data.
    call fuse_transpose_compute_
    mv a0, zero
    j .LBB14_41
.LBB14_37: # %assert_fail7
    lui a0, %hi(__TVMAPISetLastError)
    ld a1, %lo(__TVMAPISetLastError)(a0)
    lui a0, %hi(.L.str.101)
    addi a0, a0, %lo(.L.str.101)
    j .LBB14_39
.LBB14_38: # %assert_fail9
    lui a0, %hi(__TVMAPISetLastError)
    ld a1, %lo(__TVMAPISetLastError)(a0)
    lui a0, %hi(.L.str.102)
    addi a0, a0, %lo(.L.str.102)
.LBB14_39: # %assert_fail
    # Shared failure tail: a1 = error reporter, a0 = message string.
    jalr a1
    addi a0, zero, -1           # sign-extended -1 status
.LBB14_41: # %assert_fail15
    ld s0, 0(sp)
    ld ra, 8(sp)
    .cfi_restore ra
    .cfi_restore s0
    addi sp, sp, 16
    .cfi_def_cfa_offset 0
    ret
.LBB14_42: # %assert_fail
    lui a0, %hi(__TVMAPISetLastError)
    ld a1, %lo(__TVMAPISetLastError)(a0)
    lui a0, %hi(.L.str.98)
    addi a0, a0, %lo(.L.str.98)
    j .LBB14_39
.LBB14_43: # %assert_fail1
    lui a0, %hi(__TVMAPISetLastError)
    ld a1, %lo(__TVMAPISetLastError)(a0)
    lui a0, %hi(.L.str.99)
    addi a0, a0, %lo(.L.str.99)
    j .LBB14_39
.LBB14_44: # %assert_fail5
    lui a0, %hi(__TVMAPISetLastError)
    ld a1, %lo(__TVMAPISetLastError)(a0)
    lui a0, %hi(.L.str.100)
    addi a0, a0, %lo(.L.str.100)
    j .LBB14_39
.LBB14_45: # %assert_fail11
    lui a0, %hi(__TVMAPISetLastError)
    ld a1, %lo(__TVMAPISetLastError)(a0)
    lui a0, %hi(.L.str.5)
    addi a0, a0, %lo(.L.str.5)
    j .LBB14_39
.LBB14_46: # %assert_fail13
    lui a0, %hi(__TVMAPISetLastError)
    ld a1, %lo(__TVMAPISetLastError)(a0)
    lui a0, %hi(.L.str.29)
    addi a0, a0, %lo(.L.str.29)
    j .LBB14_39
.LBB14_47: # %assert_fail15
    lui a0, %hi(__TVMAPISetLastError)
    ld a1, %lo(__TVMAPISetLastError)(a0)
    lui a0, %hi(.L.str.7)
    addi a0, a0, %lo(.L.str.7)
    j .LBB14_39
.LBB14_48: # %assert_fail17
    lui a0, %hi(__TVMAPISetLastError)
    ld a1, %lo(__TVMAPISetLastError)(a0)
    lui a0, %hi(.L.str.8)
    addi a0, a0, %lo(.L.str.8)
    j .LBB14_39
.LBB14_49: # %assert_fail19
    lui a0, %hi(__TVMAPISetLastError)
    ld a1, %lo(__TVMAPISetLastError)(a0)
    lui a0, %hi(.L.str.94)
    addi a0, a0, %lo(.L.str.94)
    j .LBB14_39
.LBB14_50: # %assert_fail21
    lui a0, %hi(__TVMAPISetLastError)
    ld a1, %lo(__TVMAPISetLastError)(a0)
    lui a0, %hi(.L.str.103)
    addi a0, a0, %lo(.L.str.103)
    j .LBB14_39
.LBB14_51: # %assert_fail23
    lui a0, %hi(__TVMAPISetLastError)
    ld a1, %lo(__TVMAPISetLastError)(a0)
    lui a0, %hi(.L.str.104)
    addi a0, a0, %lo(.L.str.104)
    j .LBB14_39
.LBB14_52: # %assert_fail25
    lui a0, %hi(__TVMAPISetLastError)
    ld a1, %lo(__TVMAPISetLastError)(a0)
    lui a0, %hi(.L.str.10)
    addi a0, a0, %lo(.L.str.10)
    j .LBB14_39
.LBB14_53: # %assert_fail27
    lui a0, %hi(__TVMAPISetLastError)
    ld a1, %lo(__TVMAPISetLastError)(a0)
    lui a0, %hi(.L.str.11)
    addi a0, a0, %lo(.L.str.11)
    j .LBB14_39
.LBB14_54: # %assert_fail29
    lui a0, %hi(__TVMAPISetLastError)
    ld a1, %lo(__TVMAPISetLastError)(a0)
    lui a0, %hi(.L.str.12)
    addi a0, a0, %lo(.L.str.12)
    j .LBB14_39
.LBB14_55: # %assert_fail31
    lui a0, %hi(__TVMAPISetLastError)
    ld a1, %lo(__TVMAPISetLastError)(a0)
    lui a0, %hi(.L.str.13)
    addi a0, a0, %lo(.L.str.13)
    j .LBB14_39
.LBB14_56: # %assert_fail33
    lui a0, %hi(__TVMAPISetLastError)
    ld a1, %lo(__TVMAPISetLastError)(a0)
    lui a0, %hi(.L.str.105)
    addi a0, a0, %lo(.L.str.105)
    j .LBB14_39
.LBB14_57: # %assert_fail35
    lui a0, %hi(__TVMAPISetLastError)
    ld a1, %lo(__TVMAPISetLastError)(a0)
    lui a0, %hi(.L.str.96)
    addi a0, a0, %lo(.L.str.96)
    j .LBB14_39
.LBB14_58: # %assert_fail37
    lui a0, %hi(__TVMAPISetLastError)
    ld a1, %lo(__TVMAPISetLastError)(a0)
    lui a0, %hi(.L.str.106)
    addi a0, a0, %lo(.L.str.106)
    j .LBB14_39
.LBB14_59: # %assert_fail39
    lui a0, %hi(__TVMAPISetLastError)
    ld a1, %lo(__TVMAPISetLastError)(a0)
    lui a0, %hi(.L.str.17)
    addi a0, a0, %lo(.L.str.17)
    j .LBB14_39
.LBB14_60: # %assert_fail41
    lui a0, %hi(__TVMAPISetLastError)
    ld a1, %lo(__TVMAPISetLastError)(a0)
    lui a0, %hi(.L.str.18)
    addi a0, a0, %lo(.L.str.18)
    j .LBB14_39
.LBB14_62: # %assert_fail43
    lui a0, %hi(__TVMAPISetLastError)
    ld a1, %lo(__TVMAPISetLastError)(a0)
    lui a0, %hi(.L.str.19)
    addi a0, a0, %lo(.L.str.19)
    j .LBB14_39
.Lfunc_end14:
    .size fuse_transpose, .Lfunc_end14-fuse_transpose
    .cfi_endproc
# -- End function
.globl fuse_transpose_compute_ # -- Begin function fuse_transpose_compute_
.p2align 2
.type fuse_transpose_compute_,@function
# -----------------------------------------------------------------------
# fuse_transpose_compute_(a0 = dst, a1 = src)
#
# Copies 7 * 7 * 64 32-bit floating-point words from src to dst while
# permuting the layout.  In word indices, for r in 0..6, c in 0..6,
# k in 0..63:
#
#     dst[(r*7 + c)*64 + k] = src[k*49 + r*7 + c]
#
# Elements are moved one at a time in increasing dst order.
#
# In:      a0 = destination base, a1 = source base
# Out:     nothing meaningful; a0 ends at dst + 12544 bytes and a1 at
#          src + 196 bytes
# Scratch: t0-t4, ft0 (all caller-saved); no stack is used
# -----------------------------------------------------------------------
fuse_transpose_compute_: # @fuse_transpose_compute_
    addi t0, zero, 7                # t0 = rows (r) still to do
.Lfuse_transpose_row:
    addi t1, zero, 7                # t1 = columns (c) still to do in this row
    mv t2, a1                       # t2 = &src[r*7 + c], starting at c = 0
.Lfuse_transpose_col:
    addi t3, zero, 64               # t3 = k iterations still to do
    mv t4, t2                       # t4 walks src with a 49-word stride
.Lfuse_transpose_elem:
    flw ft0, 0(t4)
    fsw ft0, 0(a0)
    addi t4, t4, 196                # next k: 49 words further into src
    addi a0, a0, 4                  # dst is written strictly sequentially
    addi t3, t3, -1
    bnez t3, .Lfuse_transpose_elem
    addi t2, t2, 4                  # next column: one word further in src
    addi t1, t1, -1
    bnez t1, .Lfuse_transpose_col
    addi a1, a1, 28                 # next row: 7 words further in src
    addi t0, t0, -1
    bnez t0, .Lfuse_transpose_row
    ret
.Lfunc_end15:
.size fuse_transpose_compute_, .Lfunc_end15-fuse_transpose_compute_
# -- End function
.globl fuse_reshape_1 # -- Begin function fuse_reshape_1
.p2align 2
.type fuse_reshape_1,@function
# -----------------------------------------------------------------------
# fuse_reshape_1(a0 = args, a1 = type_codes, a2 = num_args)
#
# Argument-checking front end for fuse_reshape_1_compute_.
#
# In:  a0 = array of 64-bit argument values; args[0] and args[1] are used
#           as pointers to tensor descriptors
#      a1 = array of 32-bit type codes, one per argument
#      a2 = argument count (only the low 32 bits are examined)
# Out: a0 = 0 on success, -1 if any check fails.  On failure the function
#           pointer stored at __TVMAPISetLastError is called first with the
#           address of the message string for the failed check.
#
# Descriptor fields are read at fixed byte offsets: 0 data pointer,
# 8 and 12 two 32-bit device fields, 16 dimension count, 20/21/22 element
# type code / bit width / lane count, 24 shape pointer, 32 strides pointer
# (may be null), 40 byte offset.
# NOTE(review): these offsets are consistent with DLPack's DLTensor;
# confirm against the code generator before relying on the field names.
#
# Checks, in order:
#   * num_args == 2
#   * args[0] strides, if present: 3136, 448, 64, 1
#   * args[1] strides, if present: 3136, 1
#   * each type code is one of 3, 4, 7, 13
#   * args[0]: device field @8 == 1, 4 dimensions, type 2 / 32 bits /
#     1 lane, shape 1 x 7 x 7 x 64, byte offset 0
#   * args[1]: 2 dimensions, same element type, shape 1 x 3136, byte
#     offset 0, device field @8 == 1, device field @12 equal to args[0]'s
#
# Callee-saved registers used: s0 (comparison constants), ra.
# -----------------------------------------------------------------------
# Failure stub body: a1 = handler loaded from __TVMAPISetLastError,
# a0 = address of \msg, then join the shared failure tail.
.macro RESHAPE1_FAIL msg
    lui a0, %hi(__TVMAPISetLastError)
    ld a1, %lo(__TVMAPISetLastError)(a0)
    lui a0, %hi(\msg)
    addi a0, a0, %lo(\msg)
    j .LBB16_35
.endm
fuse_reshape_1: # @fuse_reshape_1
    .cfi_startproc
    addi sp, sp, -16
    .cfi_def_cfa_offset 16
    sd ra, 8(sp)
    sd s0, 0(sp)
    .cfi_offset ra, -8
    .cfi_offset s0, -16
    # num_args: upper 32 bits of a2 are not trusted, so clear them first.
    slli a2, a2, 32
    srli a2, a2, 32
    addi a3, zero, 2
    bne a2, a3, .LBB16_38
    lwu t0, 4(a1)                   # t0 = type_codes[1]
    ld a2, 8(a0)                    # a2 = args[1] descriptor
    lwu t3, 0(a1)                   # t3 = type_codes[0]
    ld a4, 0(a0)                    # a4 = args[0] descriptor
    ld t2, 24(a4)                   # t2 = args[0] shape pointer
    ld a1, 0(a4)                    # a1 = args[0] data pointer (2nd compute arg)
    ld a0, 32(a4)                   # a0 = args[0] strides pointer
    beqz a0, .LBB16_6               # null strides: nothing to verify
    # args[0] strides must be 3136, 448, 64, 1 (low 32 bits compared).
    lui s0, 1
    addiw s0, s0, -960              # 4096 - 960 = 3136
    lw a3, 0(a0)
    bne a3, s0, .LBB16_39
    ld a3, 8(a0)
    slli a3, a3, 32
    srli a3, a3, 32
    addi s0, zero, 448
    bne a3, s0, .LBB16_39
    ld a3, 16(a0)
    slli a3, a3, 32
    srli a3, a3, 32
    addi s0, zero, 64
    bne a3, s0, .LBB16_39
    ld a0, 24(a0)
    slli a0, a0, 32
    srli a0, a0, 32
    addi a3, zero, 1
    bne a0, a3, .LBB16_39
.LBB16_6:
    ld a7, 24(a2)                   # a7 = args[1] shape pointer
    ld a0, 0(a2)                    # a0 = args[1] data pointer (1st compute arg)
    lwu a6, 12(a4)                  # a6 = args[0] device field @12
    lwu t1, 8(a4)                   # t1 = args[0] device field @8
    ld s0, 32(a2)                   # s0 = args[1] strides pointer
    beqz s0, .LBB16_9
    # args[1] strides must be 3136, 1.
    lui a3, 1
    addiw a3, a3, -960              # 3136
    lw a5, 0(s0)
    bne a5, a3, .LBB16_40
    ld a3, 8(s0)
    slli a3, a3, 32
    srli a3, a3, 32
    addi a5, zero, 1
    bne a3, a5, .LBB16_40
.LBB16_9:
    # Type-code test: code <= 13 and bit `code` set in 0x2098 (bits 3,4,7,13).
    addi a3, zero, 13
    bltu a3, t3, .LBB16_33
    addi a3, zero, 1
    sll a3, a3, t3
    lui a5, 2
    addiw a5, a5, 152               # 0x2098
    and a3, a3, a5
    beqz a3, .LBB16_33
    addi a3, zero, 13
    bltu a3, t0, .LBB16_34
    addi a5, zero, 1
    sll a3, a5, t0
    lui s0, 2
    addiw s0, s0, 152               # 0x2098
    and a3, a3, s0
    beqz a3, .LBB16_34
    # ---- args[0] descriptor ----
    bne t1, a5, .LBB16_41           # device field @8 must be 1 (a5 still holds 1)
    lw a3, 16(a4)
    addi a5, zero, 4
    bne a3, a5, .LBB16_42           # 4 dimensions
    lhu a3, 22(a4)
    addi s0, zero, 1
    bne a3, s0, .LBB16_43           # 1 lane
    lbu a3, 21(a4)
    addi a5, zero, 32
    bne a3, a5, .LBB16_43           # 32 bits
    lbu a3, 20(a4)
    addi a5, zero, 2
    bne a3, a5, .LBB16_43           # element type code 2
    # Shape entries are 8 bytes apart; only the low 32 bits are compared.
    lw a3, 0(t2)
    addi s0, zero, 1
    bne a3, s0, .LBB16_44           # shape[0] == 1
    lw a3, 8(t2)
    addi a5, zero, 7
    bne a3, a5, .LBB16_45           # shape[1] == 7
    lw a3, 16(t2)
    bne a3, a5, .LBB16_46           # shape[2] == 7
    lw a3, 24(t2)
    addi a5, zero, 64
    bne a3, a5, .LBB16_47           # shape[3] == 64
    ld a3, 40(a4)
    bnez a3, .LBB16_48              # byte offset must be 0
    # ---- args[1] descriptor ----
    lw a3, 16(a2)
    addi a4, zero, 2
    bne a3, a4, .LBB16_49           # 2 dimensions
    lhu a3, 22(a2)
    addi s0, zero, 1
    bne a3, s0, .LBB16_50           # 1 lane
    lbu a3, 21(a2)
    addi a4, zero, 32
    bne a3, a4, .LBB16_50           # 32 bits
    lbu a3, 20(a2)
    addi a4, zero, 2
    bne a3, a4, .LBB16_50           # element type code 2
    lw a3, 0(a7)
    addi s0, zero, 1
    bne a3, s0, .LBB16_51           # shape[0] == 1
    lui a3, 1
    addiw a3, a3, -960              # 3136
    lw a4, 8(a7)
    bne a4, a3, .LBB16_52           # shape[1] == 3136
    ld a3, 40(a2)
    bnez a3, .LBB16_53              # byte offset must be 0
    lw a3, 8(a2)
    addi s0, zero, 1
    bne a3, s0, .LBB16_54           # device field @8 must be 1
    lw a2, 12(a2)
    sext.w a3, a6
    bne a3, a2, .LBB16_56           # device field @12 must match args[0]'s
    # All checks passed: a0 = args[1] data, a1 = args[0] data.
    call fuse_reshape_1_compute_
    mv a0, zero
    j .LBB16_37
.LBB16_33: # type_codes[0] rejected
    RESHAPE1_FAIL .L.str.110
.LBB16_34: # type_codes[1] rejected
    RESHAPE1_FAIL .L.str.111
.LBB16_35: # shared failure tail: a1 = handler, a0 = message
    jalr a1
    # Return -1 sign-extended to 64 bits: the RV64 calling convention keeps
    # 32-bit integers sign-extended in registers, so 0x00000000FFFFFFFF
    # would not read as a negative int in the caller.
    addi a0, zero, -1
.LBB16_37: # common epilogue
    ld s0, 0(sp)
    ld ra, 8(sp)
    .cfi_restore ra
    .cfi_restore s0
    addi sp, sp, 16
    .cfi_def_cfa_offset 0
    ret
.LBB16_38: # num_args != 2
    RESHAPE1_FAIL .L.str.107
.LBB16_39: # args[0] strides mismatch
    RESHAPE1_FAIL .L.str.108
.LBB16_40: # args[1] strides mismatch
    RESHAPE1_FAIL .L.str.109
.LBB16_41: # args[0] device field @8 != 1
    RESHAPE1_FAIL .L.str.5
.LBB16_42: # args[0] dimension count != 4
    RESHAPE1_FAIL .L.str.29
.LBB16_43: # args[0] element type mismatch
    RESHAPE1_FAIL .L.str.7
.LBB16_44: # args[0] shape[0] != 1
    RESHAPE1_FAIL .L.str.8
.LBB16_45: # args[0] shape[1] != 7
    RESHAPE1_FAIL .L.str.112
.LBB16_46: # args[0] shape[2] != 7
    RESHAPE1_FAIL .L.str.103
.LBB16_47: # args[0] shape[3] != 64
    RESHAPE1_FAIL .L.str.113
.LBB16_48: # args[0] byte offset != 0
    RESHAPE1_FAIL .L.str.10
.LBB16_49: # args[1] dimension count != 2
    RESHAPE1_FAIL .L.str.114
.LBB16_50: # args[1] element type mismatch
    RESHAPE1_FAIL .L.str.12
.LBB16_51: # args[1] shape[0] != 1
    RESHAPE1_FAIL .L.str.13
.LBB16_52: # args[1] shape[1] != 3136
    RESHAPE1_FAIL .L.str.115
.LBB16_53: # args[1] byte offset != 0
    RESHAPE1_FAIL .L.str.17
.LBB16_54: # args[1] device field @8 != 1
    RESHAPE1_FAIL .L.str.18
.LBB16_56: # args[1] device field @12 differs from args[0]'s
    RESHAPE1_FAIL .L.str.19
.Lfunc_end16:
.size fuse_reshape_1, .Lfunc_end16-fuse_reshape_1
    .cfi_endproc
# -- End function
.globl fuse_reshape_1_compute_ # -- Begin function fuse_reshape_1_compute_
.p2align 2
.type fuse_reshape_1_compute_,@function
# -----------------------------------------------------------------------
# fuse_reshape_1_compute_(a0 = dst, a1 = src)
#
# Copies 12544 bytes (3 * 4096 + 256) from src to dst with memcpy.
# a0 and a1 are forwarded untouched as memcpy's first two arguments.
# The copy is the last thing the function does, so control transfers
# straight to memcpy and its return goes directly to our caller; no stack
# frame is needed.
# -----------------------------------------------------------------------
fuse_reshape_1_compute_: # @fuse_reshape_1_compute_
    li a2, 12544                    # byte count
    tail memcpy
.Lfunc_end17:
.size fuse_reshape_1_compute_, .Lfunc_end17-fuse_reshape_1_compute_
# -- End function
.globl fuse_matmul # -- Begin function fuse_matmul
.p2align 2
.type fuse_matmul,@function
# -----------------------------------------------------------------------
# fuse_matmul(a0 = args, a1 = type_codes, a2 = num_args)
#
# Argument-checking front end for fuse_matmul_compute_.
#
# In:  a0 = array of 64-bit argument values; args[0..2] are used as
#           pointers to tensor descriptors
#      a1 = array of 32-bit type codes, one per argument
#      a2 = argument count (only the low 32 bits are examined)
# Out: a0 = 0 on success, -1 if any check fails.  On failure the function
#           pointer stored at __TVMAPISetLastError is called first with the
#           address of the message string for the failed check.
#
# Descriptor fields are read at fixed byte offsets: 0 data pointer,
# 8 and 12 two 32-bit device fields, 16 dimension count, 20/21/22 element
# type code / bit width / lane count, 24 shape pointer, 32 strides pointer
# (may be null), 40 byte offset.
# NOTE(review): these offsets are consistent with DLPack's DLTensor;
# confirm against the code generator before relying on the field names.
#
# Checks, in order:
#   * num_args == 3
#   * strides, if present: args[0] 3136, 1; args[1] 100, 1; args[2] 100, 1
#   * each type code is one of 3, 4, 7, 13
#   * args[0]: device field @8 == 1, 2 dimensions, type 2 / 32 bits /
#     1 lane, shape 1 x 3136, byte offset 0
#   * args[1]: 2 dimensions, same element type, shape 3136 x 100, byte
#     offset 0, device field @8 == 1, device field @12 equal to args[0]'s
#   * args[2]: 2 dimensions, same element type, shape 1 x 100, byte
#     offset 0, device field @8 == 1, device field @12 equal to args[0]'s
#
# Callee-saved registers used: s0, s1 (comparison scratch), ra.
# -----------------------------------------------------------------------
# Failure stub body: a1 = handler loaded from __TVMAPISetLastError,
# a0 = address of \msg, then join the shared failure tail.
.macro MATMUL_FAIL msg
    lui a0, %hi(__TVMAPISetLastError)
    ld a1, %lo(__TVMAPISetLastError)(a0)
    lui a0, %hi(\msg)
    addi a0, a0, %lo(\msg)
    j .LBB18_46
.endm
fuse_matmul: # @fuse_matmul
    .cfi_startproc
    addi sp, sp, -32
    .cfi_def_cfa_offset 32
    sd ra, 24(sp)
    sd s0, 16(sp)
    sd s1, 8(sp)
    .cfi_offset ra, -8
    .cfi_offset s0, -16
    .cfi_offset s1, -24
    # num_args: upper 32 bits of a2 are not trusted, so clear them first.
    slli a2, a2, 32
    srli a2, a2, 32
    addi a3, zero, 3
    bne a2, a3, .LBB18_49
    lwu t2, 8(a1)                   # t2 = type_codes[2]
    ld t5, 16(a0)                   # t5 = args[2] descriptor
    lwu t3, 4(a1)                   # t3 = type_codes[1]
    ld a4, 8(a0)                    # a4 = args[1] descriptor
    lwu t6, 0(a1)                   # t6 = type_codes[0]
    ld a5, 0(a0)                    # a5 = args[0] descriptor
    ld t1, 24(a5)                   # t1 = args[0] shape pointer
    ld a1, 0(a5)                    # a1 = args[0] data pointer (2nd compute arg)
    ld a0, 32(a5)                   # a0 = args[0] strides pointer
    beqz a0, .LBB18_4               # null strides: nothing to verify
    # args[0] strides must be 3136, 1 (low 32 bits compared).
    lui a2, 1
    addiw a2, a2, -960              # 4096 - 960 = 3136
    lw s0, 0(a0)
    bne s0, a2, .LBB18_50
    ld a0, 8(a0)
    slli a0, a0, 32
    srli a0, a0, 32
    addi a2, zero, 1
    bne a0, a2, .LBB18_50
.LBB18_4:
    ld t0, 24(a4)                   # t0 = args[1] shape pointer
    ld a2, 0(a4)                    # a2 = args[1] data pointer (3rd compute arg)
    lwu a6, 12(a5)                  # a6 = args[0] device field @12
    lwu t4, 8(a5)                   # t4 = args[0] device field @8
    ld a0, 32(a4)                   # a0 = args[1] strides pointer
    beqz a0, .LBB18_7
    # args[1] strides must be 100, 1.
    lw s0, 0(a0)
    addi a3, zero, 100
    bne s0, a3, .LBB18_51
    ld a0, 8(a0)
    slli a0, a0, 32
    srli a0, a0, 32
    addi a3, zero, 1
    bne a0, a3, .LBB18_51
.LBB18_7:
    ld a7, 24(t5)                   # a7 = args[2] shape pointer
    ld a0, 0(t5)                    # a0 = args[2] data pointer (1st compute arg)
    ld s0, 32(t5)                   # s0 = args[2] strides pointer
    beqz s0, .LBB18_10
    # args[2] strides must be 100, 1.
    lw a3, 0(s0)
    addi s1, zero, 100
    bne a3, s1, .LBB18_52
    ld a3, 8(s0)
    slli a3, a3, 32
    srli a3, a3, 32
    addi s0, zero, 1
    bne a3, s0, .LBB18_52
.LBB18_10:
    # Type-code test: code <= 13 and bit `code` set in 0x2098 (bits 3,4,7,13).
    addi a3, zero, 13
    bltu a3, t6, .LBB18_43
    addi a3, zero, 1
    sll a3, a3, t6
    lui s1, 2
    addiw s1, s1, 152               # 0x2098
    and a3, a3, s1
    beqz a3, .LBB18_43
    addi a3, zero, 13
    bltu a3, t3, .LBB18_44
    addi a3, zero, 1
    sll a3, a3, t3
    lui s1, 2
    addiw s1, s1, 152               # 0x2098
    and a3, a3, s1
    beqz a3, .LBB18_44
    addi a3, zero, 13
    bltu a3, t2, .LBB18_45
    addi a3, zero, 1
    sll s1, a3, t2
    lui s0, 2
    addiw s0, s0, 152               # 0x2098
    and s1, s1, s0
    beqz s1, .LBB18_45
    # ---- args[0] descriptor ----
    bne t4, a3, .LBB18_53           # device field @8 must be 1 (a3 still holds 1)
    lw a3, 16(a5)
    addi s1, zero, 2
    bne a3, s1, .LBB18_54           # 2 dimensions
    lhu a3, 22(a5)
    addi s0, zero, 1
    bne a3, s0, .LBB18_55           # 1 lane
    lbu a3, 21(a5)
    addi s1, zero, 32
    bne a3, s1, .LBB18_55           # 32 bits
    lbu a3, 20(a5)
    addi s1, zero, 2
    bne a3, s1, .LBB18_55           # element type code 2
    # Shape entries are 8 bytes apart; only the low 32 bits are compared.
    lw a3, 0(t1)
    addi s0, zero, 1
    bne a3, s0, .LBB18_56           # shape[0] == 1
    lui a3, 1
    addiw a3, a3, -960              # 3136
    lw s1, 8(t1)
    bne s1, a3, .LBB18_57           # shape[1] == 3136
    ld a3, 40(a5)
    bnez a3, .LBB18_58              # byte offset must be 0
    # ---- args[1] descriptor ----
    lw a3, 16(a4)
    addi a5, zero, 2
    bne a3, a5, .LBB18_59           # 2 dimensions
    lhu a3, 22(a4)
    addi s0, zero, 1
    bne a3, s0, .LBB18_60           # 1 lane
    lbu a3, 21(a4)
    addi a5, zero, 32
    bne a3, a5, .LBB18_60           # 32 bits
    lbu a3, 20(a4)
    addi a5, zero, 2
    bne a3, a5, .LBB18_60           # element type code 2
    lui a3, 1
    addiw a3, a3, -960              # 3136
    lw a5, 0(t0)
    bne a5, a3, .LBB18_61           # shape[0] == 3136
    lw a3, 8(t0)
    addi a5, zero, 100
    bne a3, a5, .LBB18_62           # shape[1] == 100
    ld a3, 40(a4)
    bnez a3, .LBB18_63              # byte offset must be 0
    lw a3, 8(a4)
    addi s0, zero, 1
    bne a3, s0, .LBB18_64           # device field @8 must be 1
    lw a4, 12(a4)
    sext.w a3, a6                   # a3 = args[0] device field @12, kept for args[2]
    bne a3, a4, .LBB18_65           # device field @12 must match args[0]'s
    # ---- args[2] descriptor ----
    lw a4, 16(t5)
    addi a5, zero, 2
    bne a4, a5, .LBB18_66           # 2 dimensions
    lhu a4, 22(t5)
    addi s0, zero, 1
    bne a4, s0, .LBB18_67           # 1 lane
    lbu a4, 21(t5)
    addi a5, zero, 32
    bne a4, a5, .LBB18_67           # 32 bits
    lbu a4, 20(t5)
    addi a5, zero, 2
    bne a4, a5, .LBB18_67           # element type code 2
    lw a4, 0(a7)
    addi s0, zero, 1
    bne a4, s0, .LBB18_68           # shape[0] == 1
    lw a4, 8(a7)
    addi a5, zero, 100
    bne a4, a5, .LBB18_69           # shape[1] == 100
    ld a4, 40(t5)
    bnez a4, .LBB18_70              # byte offset must be 0
    lw a4, 8(t5)
    addi s0, zero, 1
    bne a4, s0, .LBB18_71           # device field @8 must be 1
    lw a4, 12(t5)
    bne a3, a4, .LBB18_73           # device field @12 must match args[0]'s
    # All checks passed: a0 = args[2] data, a1 = args[0] data,
    # a2 = args[1] data.
    call fuse_matmul_compute_
    mv a0, zero
    j .LBB18_48
.LBB18_43: # type_codes[0] rejected
    MATMUL_FAIL .L.str.120
.LBB18_44: # type_codes[1] rejected
    MATMUL_FAIL .L.str.121
.LBB18_45: # type_codes[2] rejected
    MATMUL_FAIL .L.str.122
.LBB18_46: # shared failure tail: a1 = handler, a0 = message
    jalr a1
    # Return -1 sign-extended to 64 bits: the RV64 calling convention keeps
    # 32-bit integers sign-extended in registers, so 0x00000000FFFFFFFF
    # would not read as a negative int in the caller.
    addi a0, zero, -1
.LBB18_48: # common epilogue
    ld s1, 8(sp)
    ld s0, 16(sp)
    ld ra, 24(sp)
    .cfi_restore ra
    .cfi_restore s0
    .cfi_restore s1
    addi sp, sp, 32
    .cfi_def_cfa_offset 0
    ret
.LBB18_49: # num_args != 3
    MATMUL_FAIL .L.str.116
.LBB18_50: # args[0] strides mismatch
    MATMUL_FAIL .L.str.117
.LBB18_51: # args[1] strides mismatch
    MATMUL_FAIL .L.str.118
.LBB18_52: # args[2] strides mismatch
    MATMUL_FAIL .L.str.119
.LBB18_53: # args[0] device field @8 != 1
    MATMUL_FAIL .L.str.5
.LBB18_54: # args[0] dimension count != 2
    MATMUL_FAIL .L.str.6
.LBB18_55: # args[0] element type mismatch
    MATMUL_FAIL .L.str.7
.LBB18_56: # args[0] shape[0] != 1
    MATMUL_FAIL .L.str.8
.LBB18_57: # args[0] shape[1] != 3136
    MATMUL_FAIL .L.str.123
.LBB18_58: # args[0] byte offset != 0
    MATMUL_FAIL .L.str.10
.LBB18_59: # args[1] dimension count != 2
    MATMUL_FAIL .L.str.114
.LBB18_60: # args[1] element type mismatch
    MATMUL_FAIL .L.str.12
.LBB18_61: # args[1] shape[0] != 3136
    MATMUL_FAIL .L.str.124
.LBB18_62: # args[1] shape[1] != 100
    MATMUL_FAIL .L.str.125
.LBB18_63: # args[1] byte offset != 0
    MATMUL_FAIL .L.str.17
.LBB18_64: # args[1] device field @8 != 1
    MATMUL_FAIL .L.str.18
.LBB18_65: # args[1] device field @12 differs from args[0]'s
    MATMUL_FAIL .L.str.19
.LBB18_66: # args[2] dimension count != 2
    MATMUL_FAIL .L.str.126
.LBB18_67: # args[2] element type mismatch
    MATMUL_FAIL .L.str.37
.LBB18_68: # args[2] shape[0] != 1
    MATMUL_FAIL .L.str.127
.LBB18_69: # args[2] shape[1] != 100
    MATMUL_FAIL .L.str.128
.LBB18_70: # args[2] byte offset != 0
    MATMUL_FAIL .L.str.39
.LBB18_71: # args[2] device field @8 != 1
    MATMUL_FAIL .L.str.40
.LBB18_73: # args[2] device field @12 differs from args[0]'s
    MATMUL_FAIL .L.str.41
.Lfunc_end18:
.size fuse_matmul, .Lfunc_end18-fuse_matmul
    .cfi_endproc
# -- End function
.section .sdata,"aw",@progbits
.p2align 2 # -- Begin function fuse_matmul_compute_
.LCPI19_0:
.word 0 # float 0
.text
.globl fuse_matmul_compute_
.p2align 2
.type fuse_matmul_compute_,@function
# -----------------------------------------------------------------------
# fuse_matmul_compute_(a0 = out, a1 = lhs, a2 = rhs)
#
# Vector kernel.  For each of 25 output tiles (16 bytes apart in out and
# in rhs) the tile is first overwritten with the splat of .LCPI19_0 (0.0),
# then for k = 0 .. 3135:
#
#     out_tile += splat(lhs[k]) * rhs_tile(k)
#
# where rhs_tile(k) lies 400 bytes after rhs_tile(k-1).  The running sum
# is reloaded from and stored back to out on every step.
#
# Vector configuration: every vsetvl requests 4 elements with a vtype
# word of 8.
# NOTE(review): under the 0.7.x draft vtype layout 8 selects 32-bit
# elements at LMUL=1, which matches the 16-byte tile stride; confirm
# against the target's vector spec revision.
#
# vl/vtype are configured on entry, before the zero splat and the first
# tile store.  Nothing in the visible caller issues a vsetvl, so without
# this the contents of v0 and the width of the initialising store would
# depend on whatever vector state happened to be live at the call.
#
# In:      a0 = output base, a1 = lhs base, a2 = rhs base
# Scratch: a2-a7, t0-t4, ft0, v0-v3; no stack is used
# -----------------------------------------------------------------------
fuse_matmul_compute_: # @fuse_matmul_compute_
    addi t1, zero, 8                # t1 = vtype request word (loop-invariant)
    addi t2, zero, 4                # t2 = requested element count (loop-invariant)
    vsetvl a4, t2, t1               # establish vl/vtype before any vector op
    # v0 = splat of the constant at .LCPI19_0; v0 is never written again
    # and seeds every output tile.
    lui a3, %hi(.LCPI19_0)
    addi a3, a3, %lo(.LCPI19_0)
    flw ft0, 0(a3)
    fmv.x.w a3, ft0
    vmv.v.x v0, a3
    # The slides shift the same scalar in four more times, ping-ponging
    # between v1 and v0 because vslide1up may not overlap source and
    # destination; the net result ends up in v0.
    vslide1up.vx v1, v0, a3
    vslide1up.vx v0, v1, a3
    vslide1up.vx v1, v0, a3
    vslide1up.vx v0, v1, a3
    lui a3, 1
    addiw a7, a3, -960              # a7 = 3136 inner-loop trip count
    addi a6, zero, 25               # a6 = number of output tiles
    mv t0, zero                     # t0 = output tile index
.LBB19_1: # per output tile
    slli a3, t0, 4
    add t3, a0, a3                  # t3 = &out[tile] (16 bytes per tile)
    vse.v v0, ( t3 )                # initialise the accumulator tile in memory
    mv t4, a1                       # t4 walks lhs one word at a time
    mv a5, a2                       # a5 walks this tile's rhs column, 400 B/step
    mv a3, a7                       # a3 = remaining inner iterations
.LBB19_2: # per k
    flw ft0, 0(t4)                  # ft0 = lhs[k]
    vsetvl a4, t2, t1
    vle.v v1, ( a5 )                # v1 = rhs tile for this k
    vsetvl a4, t2, t1               # same request again, as emitted by the code generator
    fmv.x.w a4, ft0
    vmv.v.x v2, a4                  # v2 = splat(lhs[k]), built like v0 above
    vslide1up.vx v3, v2, a4
    vslide1up.vx v2, v3, a4
    vslide1up.vx v3, v2, a4
    vslide1up.vx v2, v3, a4
    vfmul.vv v1, v2, v1
    vle.v v2, ( t3 )                # reload running sum
    vfadd.vv v1, v1, v2
    vse.v v1, ( t3 )                # store updated sum
    addi t4, t4, 4
    addi a5, a5, 400
    addi a3, a3, -1
    bnez a3, .LBB19_2
    addi a2, a2, 16                 # next tile starts 16 bytes further into rhs
    addi t0, t0, 1
    bne t0, a6, .LBB19_1
    ret
.Lfunc_end19:
.size fuse_matmul_compute_, .Lfunc_end19-fuse_matmul_compute_
# -- End function
.globl fuse_elemwise_add # -- Begin function fuse_elemwise_add
.p2align 2
.type fuse_elemwise_add,@function
# -----------------------------------------------------------------------
# fuse_elemwise_add(a0 = args, a1 = type_codes, a2 = num_args)
#
# Argument-checking front end for fuse_elemwise_add_compute_.
#
# In:  a0 = array of 64-bit argument values; args[0..2] are used as
#           pointers to tensor descriptors
#      a1 = array of 32-bit type codes, one per argument
#      a2 = argument count (only the low 32 bits are examined)
# Out: a0 = 0 on success, -1 if any check fails.  On failure the function
#           pointer stored at __TVMAPISetLastError is called first with the
#           address of the message string for the failed check.
#
# Descriptor fields are read at fixed byte offsets: 0 data pointer,
# 8 and 12 two 32-bit device fields, 16 dimension count, 20/21/22 element
# type code / bit width / lane count, 24 shape pointer, 32 strides pointer
# (may be null), 40 byte offset.
# NOTE(review): these offsets are consistent with DLPack's DLTensor;
# confirm against the code generator before relying on the field names.
#
# Checks, in order:
#   * num_args == 3
#   * for each argument, strides[0] == 1 when a strides pointer is present
#   * each type code is one of 3, 4, 7, 13
#   * args[0]: device field @8 == 1, 1 dimension, type 2 / 32 bits /
#     1 lane, shape[0] == 100, byte offset 0
#   * args[1] and args[2]: 1 dimension, same element type, shape[0] == 100,
#     byte offset 0, device field @8 == 1, device field @12 equal to
#     args[0]'s
#
# Callee-saved registers used: s0, s1 (comparison scratch), ra.
# -----------------------------------------------------------------------
# Failure stub body: a1 = handler loaded from __TVMAPISetLastError,
# a0 = address of \msg, then join the shared failure tail.
.macro ELEMWISE_ADD_FAIL msg
    lui a0, %hi(__TVMAPISetLastError)
    ld a1, %lo(__TVMAPISetLastError)(a0)
    lui a0, %hi(\msg)
    addi a0, a0, %lo(\msg)
    j .LBB20_40
.endm
fuse_elemwise_add: # @fuse_elemwise_add
    .cfi_startproc
    addi sp, sp, -32
    .cfi_def_cfa_offset 32
    sd ra, 24(sp)
    sd s0, 16(sp)
    sd s1, 8(sp)
    .cfi_offset ra, -8
    .cfi_offset s0, -16
    .cfi_offset s1, -24
    # num_args: upper 32 bits of a2 are not trusted, so clear them first.
    slli a2, a2, 32
    srli a2, a2, 32
    addi a3, zero, 3
    bne a2, a3, .LBB20_43
    lwu t2, 8(a1)                   # t2 = type_codes[2]
    ld t5, 16(a0)                   # t5 = args[2] descriptor
    lwu t3, 4(a1)                   # t3 = type_codes[1]
    ld a4, 8(a0)                    # a4 = args[1] descriptor
    lwu a3, 0(a1)                   # a3 = type_codes[0]
    ld a5, 0(a0)                    # a5 = args[0] descriptor
    ld t1, 24(a5)                   # t1 = args[0] shape pointer
    ld a1, 0(a5)                    # a1 = args[0] data pointer (2nd compute arg)
    ld a0, 32(a5)                   # a0 = args[0] strides pointer
    beqz a0, .LBB20_3               # null strides: nothing to verify
    lw a0, 0(a0)
    addi s0, zero, 1
    bne a0, s0, .LBB20_44           # args[0] strides[0] must be 1
.LBB20_3:
    ld t0, 24(a4)                   # t0 = args[1] shape pointer
    ld a2, 0(a4)                    # a2 = args[1] data pointer (3rd compute arg)
    lwu a7, 12(a5)                  # a7 = args[0] device field @12
    lwu t4, 8(a5)                   # t4 = args[0] device field @8
    ld a0, 32(a4)                   # a0 = args[1] strides pointer
    beqz a0, .LBB20_5
    lw a0, 0(a0)
    addi s0, zero, 1
    bne a0, s0, .LBB20_45           # args[1] strides[0] must be 1
.LBB20_5:
    ld a6, 24(t5)                   # a6 = args[2] shape pointer
    ld a0, 0(t5)                    # a0 = args[2] data pointer (1st compute arg)
    ld s0, 32(t5)                   # s0 = args[2] strides pointer
    beqz s0, .LBB20_7
    lw s0, 0(s0)
    addi s1, zero, 1
    bne s0, s1, .LBB20_46           # args[2] strides[0] must be 1
.LBB20_7:
    # Type-code test: code <= 13 and bit `code` set in 0x2098 (bits 3,4,7,13).
    addi s1, zero, 13
    bltu s1, a3, .LBB20_37
    addi s1, zero, 1
    sll a3, s1, a3
    lui s1, 2
    addiw s1, s1, 152               # 0x2098
    and a3, a3, s1
    beqz a3, .LBB20_37
    addi a3, zero, 13
    bltu a3, t3, .LBB20_38
    addi a3, zero, 1
    sll a3, a3, t3
    lui s1, 2
    addiw s1, s1, 152               # 0x2098
    and a3, a3, s1
    beqz a3, .LBB20_38
    addi a3, zero, 13
    bltu a3, t2, .LBB20_39
    addi a3, zero, 1
    sll s1, a3, t2
    lui s0, 2
    addiw s0, s0, 152               # 0x2098
    and s1, s1, s0
    beqz s1, .LBB20_39
    # ---- args[0] descriptor ----
    bne t4, a3, .LBB20_47           # device field @8 must be 1 (a3 still holds 1)
    lw a3, 16(a5)
    addi s0, zero, 1
    bne a3, s0, .LBB20_48           # 1 dimension
    lhu a3, 22(a5)
    bne a3, s0, .LBB20_49           # 1 lane
    lbu a3, 21(a5)
    addi s1, zero, 32
    bne a3, s1, .LBB20_49           # 32 bits
    lbu a3, 20(a5)
    addi s1, zero, 2
    bne a3, s1, .LBB20_49           # element type code 2
    lw a3, 0(t1)                    # low 32 bits of shape[0]
    addi s1, zero, 100
    bne a3, s1, .LBB20_50           # shape[0] == 100
    ld a3, 40(a5)
    bnez a3, .LBB20_51              # byte offset must be 0
    # ---- args[1] descriptor ----
    lw a3, 16(a4)
    addi s0, zero, 1
    bne a3, s0, .LBB20_52           # 1 dimension
    lhu a3, 22(a4)
    bne a3, s0, .LBB20_53           # 1 lane
    lbu a3, 21(a4)
    addi a5, zero, 32
    bne a3, a5, .LBB20_53           # 32 bits
    lbu a3, 20(a4)
    addi a5, zero, 2
    bne a3, a5, .LBB20_53           # element type code 2
    lw a3, 0(t0)
    addi a5, zero, 100
    bne a3, a5, .LBB20_54           # shape[0] == 100
    ld a3, 40(a4)
    bnez a3, .LBB20_55              # byte offset must be 0
    lw a3, 8(a4)
    addi s0, zero, 1
    bne a3, s0, .LBB20_56           # device field @8 must be 1
    lw a4, 12(a4)
    sext.w a3, a7                   # a3 = args[0] device field @12, kept for args[2]
    bne a3, a4, .LBB20_57           # device field @12 must match args[0]'s
    # ---- args[2] descriptor ----
    lw a4, 16(t5)
    addi s0, zero, 1
    bne a4, s0, .LBB20_58           # 1 dimension
    lhu a4, 22(t5)
    bne a4, s0, .LBB20_59           # 1 lane
    lbu a4, 21(t5)
    addi a5, zero, 32
    bne a4, a5, .LBB20_59           # 32 bits
    lbu a4, 20(t5)
    addi a5, zero, 2
    bne a4, a5, .LBB20_59           # element type code 2
    lw a4, 0(a6)
    addi a5, zero, 100
    bne a4, a5, .LBB20_60           # shape[0] == 100
    ld a4, 40(t5)
    bnez a4, .LBB20_61              # byte offset must be 0
    lw a4, 8(t5)
    addi s0, zero, 1
    bne a4, s0, .LBB20_62           # device field @8 must be 1
    lw a4, 12(t5)
    bne a3, a4, .LBB20_64           # device field @12 must match args[0]'s
    # All checks passed: a0 = args[2] data, a1 = args[0] data,
    # a2 = args[1] data.
    call fuse_elemwise_add_compute_
    mv a0, zero
    j .LBB20_42
.LBB20_37: # type_codes[0] rejected
    ELEMWISE_ADD_FAIL .L.str.130
.LBB20_38: # type_codes[1] rejected
    ELEMWISE_ADD_FAIL .L.str.131
.LBB20_39: # type_codes[2] rejected
    ELEMWISE_ADD_FAIL .L.str.132
.LBB20_40: # shared failure tail: a1 = handler, a0 = message
    jalr a1
    # Return -1 sign-extended to 64 bits: the RV64 calling convention keeps
    # 32-bit integers sign-extended in registers, so 0x00000000FFFFFFFF
    # would not read as a negative int in the caller.
    addi a0, zero, -1
.LBB20_42: # common epilogue
    ld s1, 8(sp)
    ld s0, 16(sp)
    ld ra, 24(sp)
    .cfi_restore ra
    .cfi_restore s0
    .cfi_restore s1
    addi sp, sp, 32
    .cfi_def_cfa_offset 0
    ret
.LBB20_43: # num_args != 3
    ELEMWISE_ADD_FAIL .L.str.129
.LBB20_44: # args[0] strides[0] != 1
    ELEMWISE_ADD_FAIL .L.str.52
.LBB20_45: # args[1] strides[0] != 1
    ELEMWISE_ADD_FAIL .L.str.53
.LBB20_46: # args[2] strides[0] != 1
    ELEMWISE_ADD_FAIL .L.str.23
.LBB20_47: # args[0] device field @8 != 1
    ELEMWISE_ADD_FAIL .L.str.5
.LBB20_48: # args[0] dimension count != 1
    ELEMWISE_ADD_FAIL .L.str.56
.LBB20_49: # args[0] element type mismatch
    ELEMWISE_ADD_FAIL .L.str.7
.LBB20_50: # args[0] shape[0] != 100
    ELEMWISE_ADD_FAIL .L.str.133
.LBB20_51: # args[0] byte offset != 0
    ELEMWISE_ADD_FAIL .L.str.10
.LBB20_52: # args[1] dimension count != 1
    ELEMWISE_ADD_FAIL .L.str.58
.LBB20_53: # args[1] element type mismatch
    ELEMWISE_ADD_FAIL .L.str.12
.LBB20_54: # args[1] shape[0] != 100
    ELEMWISE_ADD_FAIL .L.str.134
.LBB20_55: # args[1] byte offset != 0
    ELEMWISE_ADD_FAIL .L.str.17
.LBB20_56: # args[1] device field @8 != 1
    ELEMWISE_ADD_FAIL .L.str.18
.LBB20_57: # args[1] device field @12 differs from args[0]'s
    ELEMWISE_ADD_FAIL .L.str.19
.LBB20_58: # args[2] dimension count != 1
    ELEMWISE_ADD_FAIL .L.str.36
.LBB20_59: # args[2] element type mismatch
    ELEMWISE_ADD_FAIL .L.str.37
.LBB20_60: # args[2] shape[0] != 100
    ELEMWISE_ADD_FAIL .L.str.135
.LBB20_61: # args[2] byte offset != 0
    ELEMWISE_ADD_FAIL .L.str.39
.LBB20_62: # args[2] device field @8 != 1
    ELEMWISE_ADD_FAIL .L.str.40
.LBB20_64: # args[2] device field @12 differs from args[0]'s
    ELEMWISE_ADD_FAIL .L.str.41
.Lfunc_end20:
.size fuse_elemwise_add, .Lfunc_end20-fuse_elemwise_add
    .cfi_endproc
# -- End function
.globl fuse_elemwise_add_compute_ # -- Begin function fuse_elemwise_add_compute_
.p2align 2
.type fuse_elemwise_add_compute_,@function
# -----------------------------------------------------------------------
# fuse_elemwise_add_compute_(a0 = out, a1 = lhs, a2 = rhs)
#
# Vector element-wise add over 25 consecutive tiles spaced 16 bytes apart
# (byte offsets 0, 16, ..., 384):
#
#     out_tile[i] = rhs_tile[i] + lhs_tile[i]
#
# Each tile is loaded from both inputs, added and stored before the next
# tile is touched.
#
# Vector configuration: 4 elements requested with a vtype word of 8.
# NOTE(review): under the 0.7.x draft vtype layout 8 selects 32-bit
# elements at LMUL=1, which matches the 16-byte tile stride; confirm
# against the target's vector spec revision.
#
# In:      a0 = output base, a1 = first input, a2 = second input
# Scratch: a0-a2 (advanced past the data), t0-t3, v0, v1; no stack is used
# -----------------------------------------------------------------------
fuse_elemwise_add_compute_: # @fuse_elemwise_add_compute_
    addi t0, zero, 8                # t0 = vtype request word
    addi t1, zero, 4                # t1 = requested element count
    vsetvl t2, t1, t0               # configure once; nothing below changes vl/vtype
    addi t3, a0, 400                # t3 = out + 25 tiles * 16 bytes (loop bound)
.Lfuse_elemwise_add_tile:
    vle.v v0, ( a2 )
    vle.v v1, ( a1 )
    vfadd.vv v0, v0, v1
    vse.v v0, ( a0 )
    addi a2, a2, 16
    addi a1, a1, 16
    addi a0, a0, 16
    bne a0, t3, .Lfuse_elemwise_add_tile
    ret
.Lfunc_end21:
.size fuse_elemwise_add_compute_, .Lfunc_end21-fuse_elemwise_add_compute_
# -- End function
#-----------------------------------------------------------------------
# fuse_sigmoid(a0 = slots, a1 = codes, a2 = count) -> a0 = status
#
#   a0  array of 8-byte argument slots, each holding a record pointer
#   a1  array of 32-bit per-argument codes (presumably TVM type codes)
#   a2  argument count; only the low 32 bits are examined
#
# Validates the two arguments and, if every check passes, calls
# fuse_sigmoid_compute_ with a0 = data pointer of record 1 and
# a1 = data pointer of record 0, then returns 0.  On the first failed
# check it calls the function whose address is stored at
# __TVMAPISetLastError with a0 = a message string and returns -1.
#
# Checks (offsets are into the record a slot points to.
# NOTE(review): the layout matches what DLPack's DLTensor would give --
# data@0, device_type@8, device_id@12, ndim@16, dtype code/bits/lanes
# @20/@21/@22, shape@24, strides@32, byte_offset@40 -- confirm against
# the header before relying on these names):
#   * count == 2
#   * codes[0] and codes[1] are each one of 3, 4, 7, 13
#   * for each record: word@16 == 1, half@22 == 1, byte@21 == 32,
#     byte@20 == 2, low word of the first element behind ptr@24 == 100,
#     dword@40 == 0, and, when ptr@32 is non-null, low word of its first
#     element == 1
#   * word@8 == 1 in both records; word@12 is equal in both records
#
# Failure status: RV64 keeps 32-bit integers sign-extended in registers,
# so the status (presumably a C int) is materialised as a full-width -1
# rather than 0x00000000FFFFFFFF.
# Unwind info: the failure stubs sit after `ret` but still run inside
# the frame, so the epilogue's CFI changes are bracketed with
# .cfi_remember_state / .cfi_restore_state.
#-----------------------------------------------------------------------
.globl fuse_sigmoid # -- Begin function fuse_sigmoid
.p2align 2
.type fuse_sigmoid,@function
fuse_sigmoid: # @fuse_sigmoid
.cfi_startproc
# %bb.0: # %entry
addi sp, sp, -32
.cfi_def_cfa_offset 32
sd ra, 24(sp)
sd s0, 16(sp)
sd s1, 8(sp)
.cfi_offset ra, -8
.cfi_offset s0, -16
.cfi_offset s1, -24
slli a2, a2, 32 # zero-extend the 32-bit count
srli a2, a2, 32
addi a3, zero, 2
bne a2, a3, .LBB22_30
# %bb.1: # %assert_end
lwu a4, 4(a1) # a4 = codes[1]
ld a2, 8(a0) # a2 = record 1
lwu a3, 0(a1) # a3 = codes[0]
ld a5, 0(a0) # a5 = record 0
ld t0, 24(a5) # t0 = record 0 ptr@24
ld a1, 0(a5) # a1 = record 0 data pointer (2nd compute argument)
ld a0, 32(a5) # a0 = record 0 ptr@32 (optional)
beqz a0, .LBB22_3
# %bb.2: # %if_then
lw a0, 0(a0)
addi s0, zero, 1
bne a0, s0, .LBB22_31
.LBB22_3: # %if_end
ld a7, 24(a2) # a7 = record 1 ptr@24
ld a0, 0(a2) # a0 = record 1 data pointer (1st compute argument)
lwu a6, 12(a5) # a6 = record 0 word@12, compared with record 1 later
lwu t1, 8(a5) # t1 = record 0 word@8
ld s0, 32(a2) # s0 = record 1 ptr@32 (optional)
beqz s0, .LBB22_5
# %bb.4: # %if_then3
lw s0, 0(s0)
addi s1, zero, 1
bne s0, s1, .LBB22_32
.LBB22_5: # %if_end4
# codes[0] must be <= 13 and have its bit set in 0x2098 (bits 3, 4, 7, 13).
addi s1, zero, 13
bltu s1, a3, .LBB22_25
# %bb.6: # %if_end4
addi s1, zero, 1
sll a3, s1, a3
lui s1, 2
addiw s1, s1, 152
and a3, a3, s1
beqz a3, .LBB22_25
# %bb.7: # %assert_end8
# Same membership test for codes[1].
addi a3, zero, 13
bltu a3, a4, .LBB22_26
# %bb.8: # %assert_end8
addi a3, zero, 1
sll a4, a3, a4
lui s1, 2
addiw s1, s1, 152
and a4, a4, s1
beqz a4, .LBB22_26
# %bb.9: # %assert_end10
bne t1, a3, .LBB22_33 # a3 still holds 1 here
# %bb.10: # %assert_end12
lw a3, 16(a5)
addi s0, zero, 1
bne a3, s0, .LBB22_34
# %bb.11: # %assert_end14
lhu a3, 22(a5)
bne a3, s0, .LBB22_35
# %bb.12: # %assert_end14
lbu a3, 21(a5)
addi a4, zero, 32
bne a3, a4, .LBB22_35
# %bb.13: # %assert_end14
lbu a3, 20(a5)
addi a4, zero, 2
bne a3, a4, .LBB22_35
# %bb.14: # %assert_end16
lw a3, 0(t0)
addi a4, zero, 100
bne a3, a4, .LBB22_36
# %bb.15: # %assert_end18
ld a3, 40(a5)
bnez a3, .LBB22_37
# %bb.16: # %assert_end20
lw a3, 16(a2)
addi s0, zero, 1
bne a3, s0, .LBB22_38
# %bb.17: # %assert_end22
lhu a3, 22(a2)
bne a3, s0, .LBB22_39
# %bb.18: # %assert_end22
lbu a3, 21(a2)
addi a4, zero, 32
bne a3, a4, .LBB22_39
# %bb.19: # %assert_end22
lbu a3, 20(a2)
addi a4, zero, 2
bne a3, a4, .LBB22_39
# %bb.20: # %assert_end24
lw a3, 0(a7)
addi a4, zero, 100
bne a3, a4, .LBB22_40
# %bb.21: # %assert_end26
ld a3, 40(a2)
bnez a3, .LBB22_41
# %bb.22: # %assert_end28
lw a3, 8(a2)
addi s0, zero, 1
bne a3, s0, .LBB22_42
# %bb.23: # %assert_end30
lw a2, 12(a2)
sext.w a3, a6
bne a3, a2, .LBB22_44
# %bb.24: # %assert_end32
call fuse_sigmoid_compute_
mv a0, zero # success
j .LBB22_29
.LBB22_25: # %assert_fail7
lui a0, %hi(.L.str.137)
addi a0, a0, %lo(.L.str.137)
j .LBB22_27
.LBB22_26: # %assert_fail9
lui a0, %hi(.L.str.138)
addi a0, a0, %lo(.L.str.138)
.LBB22_27: # shared failure tail: a0 = message
lui a1, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a1)
jalr a1
addi a0, zero, -1 # sign-extended -1
.LBB22_29: # epilogue, a0 = status
ld s1, 8(sp)
ld s0, 16(sp)
ld ra, 24(sp)
.cfi_remember_state
.cfi_restore ra
.cfi_restore s0
.cfi_restore s1
addi sp, sp, 32
.cfi_def_cfa_offset 0
ret
.cfi_restore_state
# Failure stubs: each loads its message and joins the shared tail.
.LBB22_30: # %assert_fail
lui a0, %hi(.L.str.136)
addi a0, a0, %lo(.L.str.136)
j .LBB22_27
.LBB22_31: # %assert_fail1
lui a0, %hi(.L.str.52)
addi a0, a0, %lo(.L.str.52)
j .LBB22_27
.LBB22_32: # %assert_fail5
lui a0, %hi(.L.str.53)
addi a0, a0, %lo(.L.str.53)
j .LBB22_27
.LBB22_33: # %assert_fail11
lui a0, %hi(.L.str.5)
addi a0, a0, %lo(.L.str.5)
j .LBB22_27
.LBB22_34: # %assert_fail13
lui a0, %hi(.L.str.56)
addi a0, a0, %lo(.L.str.56)
j .LBB22_27
.LBB22_35: # %assert_fail15
lui a0, %hi(.L.str.7)
addi a0, a0, %lo(.L.str.7)
j .LBB22_27
.LBB22_36: # %assert_fail17
lui a0, %hi(.L.str.133)
addi a0, a0, %lo(.L.str.133)
j .LBB22_27
.LBB22_37: # %assert_fail19
lui a0, %hi(.L.str.10)
addi a0, a0, %lo(.L.str.10)
j .LBB22_27
.LBB22_38: # %assert_fail21
lui a0, %hi(.L.str.58)
addi a0, a0, %lo(.L.str.58)
j .LBB22_27
.LBB22_39: # %assert_fail23
lui a0, %hi(.L.str.12)
addi a0, a0, %lo(.L.str.12)
j .LBB22_27
.LBB22_40: # %assert_fail25
lui a0, %hi(.L.str.134)
addi a0, a0, %lo(.L.str.134)
j .LBB22_27
.LBB22_41: # %assert_fail27
lui a0, %hi(.L.str.17)
addi a0, a0, %lo(.L.str.17)
j .LBB22_27
.LBB22_42: # %assert_fail29
lui a0, %hi(.L.str.18)
addi a0, a0, %lo(.L.str.18)
j .LBB22_27
.LBB22_44: # %assert_fail31
lui a0, %hi(.L.str.19)
addi a0, a0, %lo(.L.str.19)
j .LBB22_27
.Lfunc_end22:
.size fuse_sigmoid, .Lfunc_end22-fuse_sigmoid
.cfi_endproc
# -- End function
#-----------------------------------------------------------------------
# fuse_sigmoid_compute_(a0 = dst, a1 = src)
#
# For each of the 100 consecutive 32-bit floats at src (400 bytes), in
# ascending address order, stores
#     dst[i] = 1.0f / (expf(0.0f - src[i]) + 1.0f)
#
# expf receives and returns its float in a0 (integer-register float
# passing), so no FP register is assumed to survive the call; both
# constants are rebuilt from integer bit patterns on every iteration.
#
# Frame: 32 bytes holding ra, s0, s1, s2.
# Clobbers: a0, ft0, ft1, plus whatever expf clobbers.
#-----------------------------------------------------------------------
.text
.globl fuse_sigmoid_compute_ # -- Begin function fuse_sigmoid_compute_
.p2align 2
.type fuse_sigmoid_compute_,@function
fuse_sigmoid_compute_: # @fuse_sigmoid_compute_
# %bb.0: # %entry
addi sp, sp, -32
sd ra, 24(sp)
sd s0, 16(sp)
sd s1, 8(sp)
sd s2, 0(sp)
mv s0, a1 # s0 = read cursor
mv s1, a0 # s1 = write cursor
addi s2, a1, 400 # s2 = one past the last input element
.LBB23_1: # %for_body
# =>This Inner Loop Header: Depth=1
flw ft0, 0(s0)
fmv.w.x ft1, zero # ft1 = 0.0f
fsub.s ft0, ft1, ft0 # ft0 = 0.0f - x
fmv.x.w a0, ft0
call expf
fmv.w.x ft0, a0 # ft0 = expf(0.0f - x)
lui a0, 260096 # 0x3F800000, the bit pattern of 1.0f
fmv.w.x ft1, a0
fadd.s ft0, ft0, ft1
fdiv.s ft0, ft1, ft0 # ft0 = 1.0f / (expf(0.0f - x) + 1.0f)
fsw ft0, 0(s1)
addi s0, s0, 4
addi s1, s1, 4
bne s0, s2, .LBB23_1
# %bb.2: # %for_end
ld s2, 0(sp)
ld s1, 8(sp)
ld s0, 16(sp)
ld ra, 24(sp)
addi sp, sp, 32
ret
.Lfunc_end23:
.size fuse_sigmoid_compute_, .Lfunc_end23-fuse_sigmoid_compute_
# -- End function
#-----------------------------------------------------------------------
# fuse_matmul_1(a0 = slots, a1 = codes, a2 = count) -> a0 = status
#
#   a0  array of 8-byte argument slots, each holding a record pointer
#   a1  array of 32-bit per-argument codes (presumably TVM type codes)
#   a2  argument count; only the low 32 bits are examined
#
# Validates the three arguments and, if every check passes, calls
# fuse_matmul_1_compute_ with a0 = data pointer of record 2,
# a1 = data pointer of record 0 and a2 = data pointer of record 1, then
# returns 0.  On the first failed check it calls the function whose
# address is stored at __TVMAPISetLastError with a0 = a message string
# and returns -1.
#
# Checks (offsets are into the record a slot points to.
# NOTE(review): the layout matches what DLPack's DLTensor would give --
# data@0, device_type@8, device_id@12, ndim@16, dtype code/bits/lanes
# @20/@21/@22, shape@24, strides@32, byte_offset@40 -- confirm against
# the header before relying on these names):
#   * count == 3
#   * codes[0..2] are each one of 3, 4, 7, 13
#   * for each record: word@16 == 2, half@22 == 1, byte@21 == 32,
#     byte@20 == 2, dword@40 == 0
#   * low words of the two 8-byte elements behind ptr@24:
#       record 0: 1, 100    record 1: 100, 10    record 2: 1, 10
#   * when ptr@32 is non-null, low words of its two 8-byte elements:
#       record 0: 100, 1    record 1: 10, 1      record 2: 10, 1
#   * word@8 == 1 in all records; word@12 is equal in all records
#
# Failure status: RV64 keeps 32-bit integers sign-extended in registers,
# so the status (presumably a C int) is materialised as a full-width -1
# rather than 0x00000000FFFFFFFF.
# Unwind info: the failure stubs sit after `ret` but still run inside
# the frame, so the epilogue's CFI changes are bracketed with
# .cfi_remember_state / .cfi_restore_state.
#-----------------------------------------------------------------------
.globl fuse_matmul_1 # -- Begin function fuse_matmul_1
.p2align 2
.type fuse_matmul_1,@function
fuse_matmul_1: # @fuse_matmul_1
.cfi_startproc
# %bb.0: # %entry
addi sp, sp, -32
.cfi_def_cfa_offset 32
sd ra, 24(sp)
sd s0, 16(sp)
sd s1, 8(sp)
.cfi_offset ra, -8
.cfi_offset s0, -16
.cfi_offset s1, -24
slli a2, a2, 32 # zero-extend the 32-bit count
srli a2, a2, 32
addi a3, zero, 3
bne a2, a3, .LBB24_49
# %bb.1: # %assert_end
lwu t2, 8(a1) # t2 = codes[2]
ld t5, 16(a0) # t5 = record 2
lwu t3, 4(a1) # t3 = codes[1]
ld a4, 8(a0) # a4 = record 1
lwu t6, 0(a1) # t6 = codes[0]
ld a5, 0(a0) # a5 = record 0
ld t1, 24(a5) # t1 = record 0 ptr@24
ld a1, 0(a5) # a1 = record 0 data pointer (2nd compute argument)
ld a0, 32(a5) # a0 = record 0 ptr@32 (optional)
beqz a0, .LBB24_4
# %bb.2: # %if_then
lw a2, 0(a0)
addi s0, zero, 100
bne a2, s0, .LBB24_50
# %bb.3: # %if_then
ld a0, 8(a0)
slli a0, a0, 32
srli a0, a0, 32
addi a2, zero, 1
bne a0, a2, .LBB24_50
.LBB24_4: # %if_end
ld t0, 24(a4) # t0 = record 1 ptr@24
ld a2, 0(a4) # a2 = record 1 data pointer (3rd compute argument)
lwu a6, 12(a5) # a6 = record 0 word@12, compared with the others later
lwu t4, 8(a5) # t4 = record 0 word@8
ld a0, 32(a4) # a0 = record 1 ptr@32 (optional)
beqz a0, .LBB24_7
# %bb.5: # %if_then3
lw s0, 0(a0)
addi a3, zero, 10
bne s0, a3, .LBB24_51
# %bb.6: # %if_then3
ld a0, 8(a0)
slli a0, a0, 32
srli a0, a0, 32
addi a3, zero, 1
bne a0, a3, .LBB24_51
.LBB24_7: # %if_end4
ld a7, 24(t5) # a7 = record 2 ptr@24
ld a0, 0(t5) # a0 = record 2 data pointer (1st compute argument)
ld s0, 32(t5) # s0 = record 2 ptr@32 (optional)
beqz s0, .LBB24_10
# %bb.8: # %if_then7
lw a3, 0(s0)
addi s1, zero, 10
bne a3, s1, .LBB24_52
# %bb.9: # %if_then7
ld a3, 8(s0)
slli a3, a3, 32
srli a3, a3, 32
addi s0, zero, 1
bne a3, s0, .LBB24_52
.LBB24_10: # %if_end8
# Each code must be <= 13 and have its bit set in 0x2098 (bits 3, 4, 7, 13).
addi a3, zero, 13
bltu a3, t6, .LBB24_43
# %bb.11: # %if_end8
addi a3, zero, 1
sll a3, a3, t6
lui s1, 2
addiw s1, s1, 152
and a3, a3, s1
beqz a3, .LBB24_43
# %bb.12: # %assert_end12
addi a3, zero, 13
bltu a3, t3, .LBB24_44
# %bb.13: # %assert_end12
addi a3, zero, 1
sll a3, a3, t3
lui s1, 2
addiw s1, s1, 152
and a3, a3, s1
beqz a3, .LBB24_44
# %bb.14: # %assert_end14
addi a3, zero, 13
bltu a3, t2, .LBB24_45
# %bb.15: # %assert_end14
addi a3, zero, 1
sll s1, a3, t2
lui s0, 2
addiw s0, s0, 152
and s1, s1, s0
beqz s1, .LBB24_45
# %bb.16: # %assert_end16
bne t4, a3, .LBB24_53 # a3 still holds 1 here
# %bb.17: # %assert_end18
lw a3, 16(a5)
addi s1, zero, 2
bne a3, s1, .LBB24_54
# %bb.18: # %assert_end20
lhu a3, 22(a5)
addi s0, zero, 1
bne a3, s0, .LBB24_55
# %bb.19: # %assert_end20
lbu a3, 21(a5)
addi s1, zero, 32
bne a3, s1, .LBB24_55
# %bb.20: # %assert_end20
lbu a3, 20(a5)
addi s1, zero, 2
bne a3, s1, .LBB24_55
# %bb.21: # %assert_end22
lw a3, 0(t1)
addi s0, zero, 1
bne a3, s0, .LBB24_56
# %bb.22: # %assert_end24
lw a3, 8(t1)
addi s1, zero, 100
bne a3, s1, .LBB24_57
# %bb.23: # %assert_end26
ld a3, 40(a5)
bnez a3, .LBB24_58
# %bb.24: # %assert_end28
lw a3, 16(a4)
addi a5, zero, 2
bne a3, a5, .LBB24_59
# %bb.25: # %assert_end30
lhu a3, 22(a4)
addi s0, zero, 1
bne a3, s0, .LBB24_60
# %bb.26: # %assert_end30
lbu a3, 21(a4)
addi a5, zero, 32
bne a3, a5, .LBB24_60
# %bb.27: # %assert_end30
lbu a3, 20(a4)
addi a5, zero, 2
bne a3, a5, .LBB24_60
# %bb.28: # %assert_end32
lw a3, 0(t0)
addi a5, zero, 100
bne a3, a5, .LBB24_61
# %bb.29: # %assert_end34
lw a3, 8(t0)
addi a5, zero, 10
bne a3, a5, .LBB24_62
# %bb.30: # %assert_end36
ld a3, 40(a4)
bnez a3, .LBB24_63
# %bb.31: # %assert_end38
lw a3, 8(a4)
addi s0, zero, 1
bne a3, s0, .LBB24_64
# %bb.32: # %assert_end40
lw a4, 12(a4)
sext.w a3, a6 # a3 = record 0 word@12, reused for record 2 below
bne a3, a4, .LBB24_65
# %bb.33: # %assert_end42
lw a4, 16(t5)
addi a5, zero, 2
bne a4, a5, .LBB24_66
# %bb.34: # %assert_end44
lhu a4, 22(t5)
addi s0, zero, 1
bne a4, s0, .LBB24_67
# %bb.35: # %assert_end44
lbu a4, 21(t5)
addi a5, zero, 32
bne a4, a5, .LBB24_67
# %bb.36: # %assert_end44
lbu a4, 20(t5)
addi a5, zero, 2
bne a4, a5, .LBB24_67
# %bb.37: # %assert_end46
lw a4, 0(a7)
addi s0, zero, 1
bne a4, s0, .LBB24_68
# %bb.38: # %assert_end48
lw a4, 8(a7)
addi a5, zero, 10
bne a4, a5, .LBB24_69
# %bb.39: # %assert_end50
ld a4, 40(t5)
bnez a4, .LBB24_70
# %bb.40: # %assert_end52
lw a4, 8(t5)
addi s0, zero, 1
bne a4, s0, .LBB24_71
# %bb.41: # %assert_end54
lw a4, 12(t5)
bne a3, a4, .LBB24_73
# %bb.42: # %assert_end56
call fuse_matmul_1_compute_
mv a0, zero # success
j .LBB24_48
.LBB24_43: # %assert_fail11
lui a0, %hi(.L.str.143)
addi a0, a0, %lo(.L.str.143)
j .LBB24_46
.LBB24_44: # %assert_fail13
lui a0, %hi(.L.str.144)
addi a0, a0, %lo(.L.str.144)
j .LBB24_46
.LBB24_45: # %assert_fail15
lui a0, %hi(.L.str.145)
addi a0, a0, %lo(.L.str.145)
.LBB24_46: # shared failure tail: a0 = message
lui a1, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a1)
jalr a1
addi a0, zero, -1 # sign-extended -1
.LBB24_48: # epilogue, a0 = status
ld s1, 8(sp)
ld s0, 16(sp)
ld ra, 24(sp)
.cfi_remember_state
.cfi_restore ra
.cfi_restore s0
.cfi_restore s1
addi sp, sp, 32
.cfi_def_cfa_offset 0
ret
.cfi_restore_state
# Failure stubs: each loads its message and joins the shared tail.
.LBB24_49: # %assert_fail
lui a0, %hi(.L.str.139)
addi a0, a0, %lo(.L.str.139)
j .LBB24_46
.LBB24_50: # %assert_fail1
lui a0, %hi(.L.str.140)
addi a0, a0, %lo(.L.str.140)
j .LBB24_46
.LBB24_51: # %assert_fail5
lui a0, %hi(.L.str.141)
addi a0, a0, %lo(.L.str.141)
j .LBB24_46
.LBB24_52: # %assert_fail9
lui a0, %hi(.L.str.142)
addi a0, a0, %lo(.L.str.142)
j .LBB24_46
.LBB24_53: # %assert_fail17
lui a0, %hi(.L.str.5)
addi a0, a0, %lo(.L.str.5)
j .LBB24_46
.LBB24_54: # %assert_fail19
lui a0, %hi(.L.str.6)
addi a0, a0, %lo(.L.str.6)
j .LBB24_46
.LBB24_55: # %assert_fail21
lui a0, %hi(.L.str.7)
addi a0, a0, %lo(.L.str.7)
j .LBB24_46
.LBB24_56: # %assert_fail23
lui a0, %hi(.L.str.8)
addi a0, a0, %lo(.L.str.8)
j .LBB24_46
.LBB24_57: # %assert_fail25
lui a0, %hi(.L.str.146)
addi a0, a0, %lo(.L.str.146)
j .LBB24_46
.LBB24_58: # %assert_fail27
lui a0, %hi(.L.str.10)
addi a0, a0, %lo(.L.str.10)
j .LBB24_46
.LBB24_59: # %assert_fail29
lui a0, %hi(.L.str.114)
addi a0, a0, %lo(.L.str.114)
j .LBB24_46
.LBB24_60: # %assert_fail31
lui a0, %hi(.L.str.12)
addi a0, a0, %lo(.L.str.12)
j .LBB24_46
.LBB24_61: # %assert_fail33
lui a0, %hi(.L.str.134)
addi a0, a0, %lo(.L.str.134)
j .LBB24_46
.LBB24_62: # %assert_fail35
lui a0, %hi(.L.str.147)
addi a0, a0, %lo(.L.str.147)
j .LBB24_46
.LBB24_63: # %assert_fail37
lui a0, %hi(.L.str.17)
addi a0, a0, %lo(.L.str.17)
j .LBB24_46
.LBB24_64: # %assert_fail39
lui a0, %hi(.L.str.18)
addi a0, a0, %lo(.L.str.18)
j .LBB24_46
.LBB24_65: # %assert_fail41
lui a0, %hi(.L.str.19)
addi a0, a0, %lo(.L.str.19)
j .LBB24_46
.LBB24_66: # %assert_fail43
lui a0, %hi(.L.str.126)
addi a0, a0, %lo(.L.str.126)
j .LBB24_46
.LBB24_67: # %assert_fail45
lui a0, %hi(.L.str.37)
addi a0, a0, %lo(.L.str.37)
j .LBB24_46
.LBB24_68: # %assert_fail47
lui a0, %hi(.L.str.127)
addi a0, a0, %lo(.L.str.127)
j .LBB24_46
.LBB24_69: # %assert_fail49
lui a0, %hi(.L.str.148)
addi a0, a0, %lo(.L.str.148)
j .LBB24_46
.LBB24_70: # %assert_fail51
lui a0, %hi(.L.str.39)
addi a0, a0, %lo(.L.str.39)
j .LBB24_46
.LBB24_71: # %assert_fail53
lui a0, %hi(.L.str.40)
addi a0, a0, %lo(.L.str.40)
j .LBB24_46
.LBB24_73: # %assert_fail55
lui a0, %hi(.L.str.41)
addi a0, a0, %lo(.L.str.41)
j .LBB24_46
.Lfunc_end24:
.size fuse_matmul_1, .Lfunc_end24-fuse_matmul_1
.cfi_endproc
# -- End function
#-----------------------------------------------------------------------
# fuse_matmul_1_compute_(a0 = out, a1 = vec, a2 = mat)
#
# For j = 0..9, in that order:
#     out[j] = 0                      (integer zero store, done first)
#     acc    = 0.0f
#     for k = 0..99:  acc = vec[k] * mat[k*10 + j] + acc
#     out[j] = acc
# All elements are 32-bit floats; successive mat operands for a given j
# are 40 bytes apart and vec is walked 4 bytes at a time.
#
# Leaf routine, no stack use.  a0 and a1 are left unchanged.
# Clobbers: a2-a7, ft0-ft2.
#-----------------------------------------------------------------------
.text
.globl fuse_matmul_1_compute_ # -- Begin function fuse_matmul_1_compute_
.p2align 2
.type fuse_matmul_1_compute_,@function
fuse_matmul_1_compute_: # @fuse_matmul_1_compute_
# %bb.0: # %entry
mv a5, a0 # a5 = &out[j]
addi a6, a0, 40 # a6 = &out[10], outer-loop bound
addi a7, a1, 400 # a7 = &vec[100], inner-loop bound
.LBB25_1: # one output element per pass
sw zero, 0(a5)
fmv.w.x ft0, zero # acc = 0.0f
mv a3, a1 # a3 = &vec[k]
mv a4, a2 # a4 = &mat[k*10 + j]
.LBB25_2: # dot-product step
flw ft1, 0(a3)
flw ft2, 0(a4)
fmul.s ft1, ft1, ft2
fadd.s ft0, ft1, ft0
addi a4, a4, 40
addi a3, a3, 4
bne a3, a7, .LBB25_2
# inner loop done: commit acc and advance to the next output element
fsw ft0, 0(a5)
addi a5, a5, 4
addi a2, a2, 4 # next starting offset into mat
bne a5, a6, .LBB25_1
ret
.Lfunc_end25:
.size fuse_matmul_1_compute_, .Lfunc_end25-fuse_matmul_1_compute_
# -- End function
#-----------------------------------------------------------------------
# fuse_elemwise_add_1(a0 = slots, a1 = codes, a2 = count) -> a0 = status
#
#   a0  array of 8-byte argument slots, each holding a record pointer
#   a1  array of 32-bit per-argument codes (presumably TVM type codes)
#   a2  argument count; only the low 32 bits are examined
#
# Validates the three arguments and, if every check passes, calls
# fuse_elemwise_add_1_compute_ with a0 = data pointer of record 2,
# a1 = data pointer of record 0 and a2 = data pointer of record 1, then
# returns 0.  On the first failed check it calls the function whose
# address is stored at __TVMAPISetLastError with a0 = a message string
# and returns -1.
#
# Checks (offsets are into the record a slot points to.
# NOTE(review): the layout matches what DLPack's DLTensor would give --
# data@0, device_type@8, device_id@12, ndim@16, dtype code/bits/lanes
# @20/@21/@22, shape@24, strides@32, byte_offset@40 -- confirm against
# the header before relying on these names):
#   * count == 3
#   * codes[0..2] are each one of 3, 4, 7, 13
#   * for each record: word@16 == 1, half@22 == 1, byte@21 == 32,
#     byte@20 == 2, low word of the first element behind ptr@24 == 10,
#     dword@40 == 0, and, when ptr@32 is non-null, low word of its first
#     element == 1
#   * word@8 == 1 in all records; word@12 is equal in all records
#
# Failure status: RV64 keeps 32-bit integers sign-extended in registers,
# so the status (presumably a C int) is materialised as a full-width -1
# rather than 0x00000000FFFFFFFF.
# Unwind info: the failure stubs sit after `ret` but still run inside
# the frame, so the epilogue's CFI changes are bracketed with
# .cfi_remember_state / .cfi_restore_state.
#-----------------------------------------------------------------------
.globl fuse_elemwise_add_1 # -- Begin function fuse_elemwise_add_1
.p2align 2
.type fuse_elemwise_add_1,@function
fuse_elemwise_add_1: # @fuse_elemwise_add_1
.cfi_startproc
# %bb.0: # %entry
addi sp, sp, -32
.cfi_def_cfa_offset 32
sd ra, 24(sp)
sd s0, 16(sp)
sd s1, 8(sp)
.cfi_offset ra, -8
.cfi_offset s0, -16
.cfi_offset s1, -24
slli a2, a2, 32 # zero-extend the 32-bit count
srli a2, a2, 32
addi a3, zero, 3
bne a2, a3, .LBB26_43
# %bb.1: # %assert_end
lwu t2, 8(a1) # t2 = codes[2]
ld t5, 16(a0) # t5 = record 2
lwu t3, 4(a1) # t3 = codes[1]
ld a4, 8(a0) # a4 = record 1
lwu a3, 0(a1) # a3 = codes[0]
ld a5, 0(a0) # a5 = record 0
ld t1, 24(a5) # t1 = record 0 ptr@24
ld a1, 0(a5) # a1 = record 0 data pointer (2nd compute argument)
ld a0, 32(a5) # a0 = record 0 ptr@32 (optional)
beqz a0, .LBB26_3
# %bb.2: # %if_then
lw a0, 0(a0)
addi s0, zero, 1
bne a0, s0, .LBB26_44
.LBB26_3: # %if_end
ld t0, 24(a4) # t0 = record 1 ptr@24
ld a2, 0(a4) # a2 = record 1 data pointer (3rd compute argument)
lwu a7, 12(a5) # a7 = record 0 word@12, compared with the others later
lwu t4, 8(a5) # t4 = record 0 word@8
ld a0, 32(a4) # a0 = record 1 ptr@32 (optional)
beqz a0, .LBB26_5
# %bb.4: # %if_then3
lw a0, 0(a0)
addi s0, zero, 1
bne a0, s0, .LBB26_45
.LBB26_5: # %if_end4
ld a6, 24(t5) # a6 = record 2 ptr@24
ld a0, 0(t5) # a0 = record 2 data pointer (1st compute argument)
ld s0, 32(t5) # s0 = record 2 ptr@32 (optional)
beqz s0, .LBB26_7
# %bb.6: # %if_then7
lw s0, 0(s0)
addi s1, zero, 1
bne s0, s1, .LBB26_46
.LBB26_7: # %if_end8
# Each code must be <= 13 and have its bit set in 0x2098 (bits 3, 4, 7, 13).
addi s1, zero, 13
bltu s1, a3, .LBB26_37
# %bb.8: # %if_end8
addi s1, zero, 1
sll a3, s1, a3
lui s1, 2
addiw s1, s1, 152
and a3, a3, s1
beqz a3, .LBB26_37
# %bb.9: # %assert_end12
addi a3, zero, 13
bltu a3, t3, .LBB26_38
# %bb.10: # %assert_end12
addi a3, zero, 1
sll a3, a3, t3
lui s1, 2
addiw s1, s1, 152
and a3, a3, s1
beqz a3, .LBB26_38
# %bb.11: # %assert_end14
addi a3, zero, 13
bltu a3, t2, .LBB26_39
# %bb.12: # %assert_end14
addi a3, zero, 1
sll s1, a3, t2
lui s0, 2
addiw s0, s0, 152
and s1, s1, s0
beqz s1, .LBB26_39
# %bb.13: # %assert_end16
bne t4, a3, .LBB26_47 # a3 still holds 1 here
# %bb.14: # %assert_end18
lw a3, 16(a5)
addi s0, zero, 1
bne a3, s0, .LBB26_48
# %bb.15: # %assert_end20
lhu a3, 22(a5)
bne a3, s0, .LBB26_49
# %bb.16: # %assert_end20
lbu a3, 21(a5)
addi s1, zero, 32
bne a3, s1, .LBB26_49
# %bb.17: # %assert_end20
lbu a3, 20(a5)
addi s1, zero, 2
bne a3, s1, .LBB26_49
# %bb.18: # %assert_end22
lw a3, 0(t1)
addi s1, zero, 10
bne a3, s1, .LBB26_50
# %bb.19: # %assert_end24
ld a3, 40(a5)
bnez a3, .LBB26_51
# %bb.20: # %assert_end26
lw a3, 16(a4)
addi s0, zero, 1
bne a3, s0, .LBB26_52
# %bb.21: # %assert_end28
lhu a3, 22(a4)
bne a3, s0, .LBB26_53
# %bb.22: # %assert_end28
lbu a3, 21(a4)
addi a5, zero, 32
bne a3, a5, .LBB26_53
# %bb.23: # %assert_end28
lbu a3, 20(a4)
addi a5, zero, 2
bne a3, a5, .LBB26_53
# %bb.24: # %assert_end30
lw a3, 0(t0)
addi a5, zero, 10
bne a3, a5, .LBB26_54
# %bb.25: # %assert_end32
ld a3, 40(a4)
bnez a3, .LBB26_55
# %bb.26: # %assert_end34
lw a3, 8(a4)
addi s0, zero, 1
bne a3, s0, .LBB26_56
# %bb.27: # %assert_end36
lw a4, 12(a4)
sext.w a3, a7 # a3 = record 0 word@12, reused for record 2 below
bne a3, a4, .LBB26_57
# %bb.28: # %assert_end38
lw a4, 16(t5)
addi s0, zero, 1
bne a4, s0, .LBB26_58
# %bb.29: # %assert_end40
lhu a4, 22(t5)
bne a4, s0, .LBB26_59
# %bb.30: # %assert_end40
lbu a4, 21(t5)
addi a5, zero, 32
bne a4, a5, .LBB26_59
# %bb.31: # %assert_end40
lbu a4, 20(t5)
addi a5, zero, 2
bne a4, a5, .LBB26_59
# %bb.32: # %assert_end42
lw a4, 0(a6)
addi a5, zero, 10
bne a4, a5, .LBB26_60
# %bb.33: # %assert_end44
ld a4, 40(t5)
bnez a4, .LBB26_61
# %bb.34: # %assert_end46
lw a4, 8(t5)
addi s0, zero, 1
bne a4, s0, .LBB26_62
# %bb.35: # %assert_end48
lw a4, 12(t5)
bne a3, a4, .LBB26_64
# %bb.36: # %assert_end50
call fuse_elemwise_add_1_compute_
mv a0, zero # success
j .LBB26_42
.LBB26_37: # %assert_fail11
lui a0, %hi(.L.str.150)
addi a0, a0, %lo(.L.str.150)
j .LBB26_40
.LBB26_38: # %assert_fail13
lui a0, %hi(.L.str.151)
addi a0, a0, %lo(.L.str.151)
j .LBB26_40
.LBB26_39: # %assert_fail15
lui a0, %hi(.L.str.152)
addi a0, a0, %lo(.L.str.152)
.LBB26_40: # shared failure tail: a0 = message
lui a1, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a1)
jalr a1
addi a0, zero, -1 # sign-extended -1
.LBB26_42: # epilogue, a0 = status
ld s1, 8(sp)
ld s0, 16(sp)
ld ra, 24(sp)
.cfi_remember_state
.cfi_restore ra
.cfi_restore s0
.cfi_restore s1
addi sp, sp, 32
.cfi_def_cfa_offset 0
ret
.cfi_restore_state
# Failure stubs: each loads its message and joins the shared tail.
.LBB26_43: # %assert_fail
lui a0, %hi(.L.str.149)
addi a0, a0, %lo(.L.str.149)
j .LBB26_40
.LBB26_44: # %assert_fail1
lui a0, %hi(.L.str.52)
addi a0, a0, %lo(.L.str.52)
j .LBB26_40
.LBB26_45: # %assert_fail5
lui a0, %hi(.L.str.53)
addi a0, a0, %lo(.L.str.53)
j .LBB26_40
.LBB26_46: # %assert_fail9
lui a0, %hi(.L.str.23)
addi a0, a0, %lo(.L.str.23)
j .LBB26_40
.LBB26_47: # %assert_fail17
lui a0, %hi(.L.str.5)
addi a0, a0, %lo(.L.str.5)
j .LBB26_40
.LBB26_48: # %assert_fail19
lui a0, %hi(.L.str.56)
addi a0, a0, %lo(.L.str.56)
j .LBB26_40
.LBB26_49: # %assert_fail21
lui a0, %hi(.L.str.7)
addi a0, a0, %lo(.L.str.7)
j .LBB26_40
.LBB26_50: # %assert_fail23
lui a0, %hi(.L.str.153)
addi a0, a0, %lo(.L.str.153)
j .LBB26_40
.LBB26_51: # %assert_fail25
lui a0, %hi(.L.str.10)
addi a0, a0, %lo(.L.str.10)
j .LBB26_40
.LBB26_52: # %assert_fail27
lui a0, %hi(.L.str.58)
addi a0, a0, %lo(.L.str.58)
j .LBB26_40
.LBB26_53: # %assert_fail29
lui a0, %hi(.L.str.12)
addi a0, a0, %lo(.L.str.12)
j .LBB26_40
.LBB26_54: # %assert_fail31
lui a0, %hi(.L.str.154)
addi a0, a0, %lo(.L.str.154)
j .LBB26_40
.LBB26_55: # %assert_fail33
lui a0, %hi(.L.str.17)
addi a0, a0, %lo(.L.str.17)
j .LBB26_40
.LBB26_56: # %assert_fail35
lui a0, %hi(.L.str.18)
addi a0, a0, %lo(.L.str.18)
j .LBB26_40
.LBB26_57: # %assert_fail37
lui a0, %hi(.L.str.19)
addi a0, a0, %lo(.L.str.19)
j .LBB26_40
.LBB26_58: # %assert_fail39
lui a0, %hi(.L.str.36)
addi a0, a0, %lo(.L.str.36)
j .LBB26_40
.LBB26_59: # %assert_fail41
lui a0, %hi(.L.str.37)
addi a0, a0, %lo(.L.str.37)
j .LBB26_40
.LBB26_60: # %assert_fail43
lui a0, %hi(.L.str.155)
addi a0, a0, %lo(.L.str.155)
j .LBB26_40
.LBB26_61: # %assert_fail45
lui a0, %hi(.L.str.39)
addi a0, a0, %lo(.L.str.39)
j .LBB26_40
.LBB26_62: # %assert_fail47
lui a0, %hi(.L.str.40)
addi a0, a0, %lo(.L.str.40)
j .LBB26_40
.LBB26_64: # %assert_fail49
lui a0, %hi(.L.str.41)
addi a0, a0, %lo(.L.str.41)
j .LBB26_40
.Lfunc_end26:
.size fuse_elemwise_add_1, .Lfunc_end26-fuse_elemwise_add_1
.cfi_endproc
# -- End function
#-----------------------------------------------------------------------
# fuse_elemwise_add_1_compute_(a0 = dst, a1 = lhs, a2 = rhs)
#
# For i = 0..9, in ascending order, loads the 32-bit floats lhs[i] and
# rhs[i] and stores dst[i] = rhs[i] + lhs[i].
#
# Leaf routine, no stack use.  a0, a1 and a2 are left unchanged.
# Clobbers: a3-a6, ft0, ft1.
#-----------------------------------------------------------------------
.globl fuse_elemwise_add_1_compute_ # -- Begin function fuse_elemwise_add_1_compute_
.p2align 2
.type fuse_elemwise_add_1_compute_,@function
fuse_elemwise_add_1_compute_: # @fuse_elemwise_add_1_compute_
# %bb.0: # %entry
mv a3, a0 # a3 = &dst[i]
mv a4, a1 # a4 = &lhs[i]
mv a5, a2 # a5 = &rhs[i]
addi a6, a0, 40 # a6 = &dst[10], loop bound
.LBB27_1: # one element per pass
flw ft0, 0(a4)
flw ft1, 0(a5)
fadd.s ft0, ft1, ft0
fsw ft0, 0(a3)
addi a4, a4, 4
addi a5, a5, 4
addi a3, a3, 4
bne a3, a6, .LBB27_1
ret
.Lfunc_end27:
.size fuse_elemwise_add_1_compute_, .Lfunc_end27-fuse_elemwise_add_1_compute_
# -- End function
.globl fuse_softmax # -- Begin function fuse_softmax
.p2align 2
.type fuse_softmax,@function
fuse_softmax: # @fuse_softmax
.cfi_startproc
# %bb.0: # %entry
addi sp, sp, -16
.cfi_def_cfa_offset 16
sd ra, 8(sp)
sd s0, 0(sp)
.cfi_offset ra, -8
.cfi_offset s0, -16
slli a2, a2, 32
srli a2, a2, 32
addi a3, zero, 2
bne a2, a3, .LBB28_34
# %bb.1: # %assert_end
lwu t2, 4(a1)
ld a2, 8(a0)
lwu t3, 0(a1)
ld a5, 0(a0)
ld t0, 24(a5)
ld a0, 0(a5)
ld a1, 32(a5)
beqz a1, .LBB28_4
# %bb.2: # %if_then
lw s0, 0(a1)
addi a4, zero, 10
bne s0, a4, .LBB28_35
# %bb.3: # %if_then
ld a1, 8(a1)
slli a1, a1, 32
srli a1, a1, 32
addi a4, zero, 1
bne a1, a4, .LBB28_35
.LBB28_4: # %if_end
ld a7, 24(a2)
ld a1, 0(a2)
lwu a6, 12(a5)
lwu t1, 8(a5)
ld s0, 32(a2)
beqz s0, .LBB28_7
# %bb.5: # %if_then3
lw a4, 0(s0)
addi a3, zero, 10
bne a4, a3, .LBB28_36
# %bb.6: # %if_then3
ld a3, 8(s0)
slli a3, a3, 32
srli a3, a3, 32
addi a4, zero, 1
bne a3, a4, .LBB28_36
.LBB28_7: # %if_end4
addi a3, zero, 13
bltu a3, t3, .LBB28_29
# %bb.8: # %if_end4
addi a3, zero, 1
sll a3, a3, t3
lui a4, 2
addiw a4, a4, 152
and a3, a3, a4
beqz a3, .LBB28_29
# %bb.9: # %assert_end8
addi a3, zero, 13
bltu a3, t2, .LBB28_30
# %bb.10: # %assert_end8
addi a3, zero, 1
sll a4, a3, t2
lui s0, 2
addiw s0, s0, 152
and a4, a4, s0
beqz a4, .LBB28_30
# %bb.11: # %assert_end10
bne t1, a3, .LBB28_37
# %bb.12: # %assert_end12
lw a3, 16(a5)
addi a4, zero, 2
bne a3, a4, .LBB28_38
# %bb.13: # %assert_end14
lhu a3, 22(a5)
addi s0, zero, 1
bne a3, s0, .LBB28_39
# %bb.14: # %assert_end14
lbu a3, 21(a5)
addi a4, zero, 32
bne a3, a4, .LBB28_39
# %bb.15: # %assert_end14
lbu a3, 20(a5)
addi a4, zero, 2
bne a3, a4, .LBB28_39
# %bb.16: # %assert_end16
lw a3, 0(t0)
addi s0, zero, 1
bne a3, s0, .LBB28_40
# %bb.17: # %assert_end18
lw a3, 8(t0)
addi a4, zero, 10
bne a3, a4, .LBB28_41
# %bb.18: # %assert_end20
ld a3, 40(a5)
bnez a3, .LBB28_42
# %bb.19: # %assert_end22
lw a3, 16(a2)
addi a4, zero, 2
bne a3, a4, .LBB28_43
# %bb.20: # %assert_end24
lhu a3, 22(a2)
addi s0, zero, 1
bne a3, s0, .LBB28_44
# %bb.21: # %assert_end24
lbu a3, 21(a2)
addi a4, zero, 32
bne a3, a4, .LBB28_44
# %bb.22: # %assert_end24
lbu a3, 20(a2)
addi a4, zero, 2
bne a3, a4, .LBB28_44
# %bb.23: # %assert_end26
lw a3, 0(a7)
addi s0, zero, 1
bne a3, s0, .LBB28_45
# %bb.24: # %assert_end28
lw a3, 8(a7)
addi a4, zero, 10
bne a3, a4, .LBB28_46
# %bb.25: # %assert_end30
ld a3, 40(a2)
bnez a3, .LBB28_47
# %bb.26: # %assert_end32
lw a3, 8(a2)
addi s0, zero, 1
bne a3, s0, .LBB28_48
# %bb.27: # %assert_end34
lw a2, 12(a2)
sext.w a3, a6
bne a3, a2, .LBB28_50
# %bb.28: # %assert_end36
call fuse_softmax_compute_
mv a0, zero
j .LBB28_33
.LBB28_29: # %assert_fail7
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.158)
addi a0, a0, %lo(.L.str.158)
j .LBB28_31
.LBB28_30: # %assert_fail9
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.159)
addi a0, a0, %lo(.L.str.159)
.LBB28_31: # %assert_fail
jalr a1
addi a0, zero, 1
slli a0, a0, 32
.LBB28_32: # %assert_fail15
addi a0, a0, -1
.LBB28_33: # %assert_fail15
ld s0, 0(sp)
ld ra, 8(sp)
.cfi_restore ra
.cfi_restore s0
addi sp, sp, 16
.cfi_def_cfa_offset 0
ret
.LBB28_34: # %assert_fail
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.156)
addi a0, a0, %lo(.L.str.156)
j .LBB28_31
.LBB28_35: # %assert_fail1
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.157)
addi a0, a0, %lo(.L.str.157)
j .LBB28_31
.LBB28_36: # %assert_fail5
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.141)
addi a0, a0, %lo(.L.str.141)
j .LBB28_31
.LBB28_37: # %assert_fail11
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.5)
addi a0, a0, %lo(.L.str.5)
j .LBB28_31
.LBB28_38: # %assert_fail13
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.6)
addi a0, a0, %lo(.L.str.6)
j .LBB28_31
.LBB28_39: # %assert_fail15
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.7)
addi a0, a0, %lo(.L.str.7)
j .LBB28_49
.LBB28_40: # %assert_fail17
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.8)
addi a0, a0, %lo(.L.str.8)
j .LBB28_49
.LBB28_41: # %assert_fail19
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.160)
addi a0, a0, %lo(.L.str.160)
j .LBB28_31
.LBB28_42: # %assert_fail21
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.10)
addi a0, a0, %lo(.L.str.10)
j .LBB28_31
.LBB28_43: # %assert_fail23
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.114)
addi a0, a0, %lo(.L.str.114)
j .LBB28_31
.LBB28_44: # %assert_fail25
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.12)
addi a0, a0, %lo(.L.str.12)
j .LBB28_49
.LBB28_45: # %assert_fail27
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.13)
addi a0, a0, %lo(.L.str.13)
j .LBB28_49
.LBB28_46: # %assert_fail29
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.147)
addi a0, a0, %lo(.L.str.147)
j .LBB28_31
.LBB28_47: # %assert_fail31
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.17)
addi a0, a0, %lo(.L.str.17)
j .LBB28_31
.LBB28_48: # %assert_fail33
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.18)
addi a0, a0, %lo(.L.str.18)
.LBB28_49: # %assert_fail15
jalr a1
slli a0, s0, 32
j .LBB28_32
.LBB28_50: # %assert_fail35
lui a0, %hi(__TVMAPISetLastError)
ld a1, %lo(__TVMAPISetLastError)(a0)
lui a0, %hi(.L.str.19)
addi a0, a0, %lo(.L.str.19)
j .LBB28_31
.Lfunc_end28:
.size fuse_softmax, .Lfunc_end28-fuse_softmax
.cfi_endproc
# -- End function
# -----------------------------------------------------------------------
# fuse_softmax_compute_ -- 10-element single-precision softmax.
#
#   m      = largest of in[0..9] and the starting value .LCPI29_0
#   e[i]   = expf(in[i] - m)                      for i = 0..9
#   out[i] = e[i] / (0.0 + e[0] + e[1] + ... + e[9])
#
# In:    a0 = address of the 10 input floats  (read at offsets 0..36)
#        a1 = address of the 10 output floats (written at offsets 0..36)
# Out:   a0 is not set before ret; the caller visible in this file
#        (fuse_softmax) overwrites a0 with zero right after the call.
# Calls: expf, once per element. The float argument is handed over as a
#        bit pattern in a0 (fmv.x.w) and the result is taken back from a0
#        (fmv.w.x).
#
# Frame (128 bytes):
#   0(sp)        in[9]
#   4(sp)        in[8]
#   8(sp)        in[7]
#   12(sp)       in[6], later the partial sum e[0..5]
#   16(sp)       in[5], later e[5]
#   20(sp)       in[4], later e[4]
#   24(sp)       in[3], later e[3]
#   28(sp)       in[2], later e[2]
#   32(sp)       in[1], later e[1]
#   36(sp)       m,     later e[0]
#   40..112(sp)  saved s9..s0
#   120(sp)      saved ra
#
# Saved registers while live:
#   s0 = output pointer
#   s2 = e[0], s3 = e[1], s4 = e[2], s5 = e[3], s6 = e[4],
#   s8 = e[5], s7 = e[6], s9 = e[7], s1 = e[8]   (float bit patterns)
# -----------------------------------------------------------------------
.section .sdata,"aw",@progbits
.p2align 2 # -- Begin function fuse_softmax_compute_
# Starting value of the running maximum.
.LCPI29_0:
.word 4286578687 # float -3.40282347E+38
# Starting value of the running sum.
.LCPI29_1:
.word 0 # float 0
.text
.globl fuse_softmax_compute_
.p2align 2
.type fuse_softmax_compute_,@function
fuse_softmax_compute_: # @fuse_softmax_compute_
# %bb.0: # %entry
# Prologue: reserve the frame and save ra and s0-s9, all of which are
# overwritten below.
addi sp, sp, -128
sd ra, 120(sp)
sd s0, 112(sp)
sd s1, 104(sp)
sd s2, 96(sp)
sd s3, 88(sp)
sd s4, 80(sp)
sd s5, 72(sp)
sd s6, 64(sp)
sd s7, 56(sp)
sd s8, 48(sp)
sd s9, 40(sp)
# Keep the output pointer in s0; a1 is reused as a scratch register next.
mv s0, a1
# ft1 = running maximum, seeded from .LCPI29_0.
lui a1, %hi(.LCPI29_0)
addi a1, a1, %lo(.LCPI29_0)
flw ft1, 0(a1)
# Maximum scan. Each step loads in[i] and keeps ft1 only when
# in[i] < ft1; otherwise ft1 is replaced by in[i].
# ft0 = in[0]
flw ft0, 0(a0)
flt.s a1, ft0, ft1
bnez a1, .LBB29_2
# %bb.1: # %entry
fmv.s ft1, ft0
.LBB29_2: # %entry
# ft2 = in[1]
flw ft2, 4(a0)
flt.s a1, ft2, ft1
bnez a1, .LBB29_4
# %bb.3: # %entry
fmv.s ft1, ft2
.LBB29_4: # %entry
# ft3 = in[2]
flw ft3, 8(a0)
flt.s a1, ft3, ft1
bnez a1, .LBB29_6
# %bb.5: # %entry
fmv.s ft1, ft3
.LBB29_6: # %entry
# ft4 = in[3]
flw ft4, 12(a0)
flt.s a1, ft4, ft1
bnez a1, .LBB29_8
# %bb.7: # %entry
fmv.s ft1, ft4
.LBB29_8: # %entry
# ft5 = in[4]
flw ft5, 16(a0)
flt.s a1, ft5, ft1
bnez a1, .LBB29_10
# %bb.9: # %entry
fmv.s ft1, ft5
.LBB29_10: # %entry
# ft6 = in[5]
flw ft6, 20(a0)
flt.s a1, ft6, ft1
bnez a1, .LBB29_12
# %bb.11: # %entry
fmv.s ft1, ft6
.LBB29_12: # %entry
# ft7 = in[6]
flw ft7, 24(a0)
flt.s a1, ft7, ft1
bnez a1, .LBB29_14
# %bb.13: # %entry
fmv.s ft1, ft7
.LBB29_14: # %entry
# fa0 = in[7]
flw fa0, 28(a0)
flt.s a1, fa0, ft1
bnez a1, .LBB29_16
# %bb.15: # %entry
fmv.s ft1, fa0
.LBB29_16: # %entry
# fa1 = in[8]
flw fa1, 32(a0)
flt.s a1, fa1, ft1
bnez a1, .LBB29_18
# %bb.17: # %entry
fmv.s ft1, fa1
.LBB29_18: # %entry
# Spill in[8]..in[1] to the frame so they can be reloaded after the expf
# calls. in[0] stays in ft0 because it is consumed before the first call.
fsw fa1, 4(sp)
fsw fa0, 8(sp)
fsw ft7, 12(sp)
fsw ft6, 16(sp)
fsw ft5, 20(sp)
fsw ft4, 24(sp)
fsw ft3, 28(sp)
fsw ft2, 32(sp)
# ft2 = in[9], the last candidate for the maximum. This is the final read
# through a0, which then becomes the comparison scratch register.
flw ft2, 36(a0)
flt.s a0, ft2, ft1
bnez a0, .LBB29_20
# %bb.19: # %entry
fmv.s ft1, ft2
.LBB29_20: # %entry
# ft1 now holds m. Save it, then start the exponentials.
fsw ft1, 36(sp)
# e[0] = expf(in[0] - m) -> s2
fsub.s ft0, ft0, ft1
fmv.x.w a0, ft0
# in[9] is spilled as well; it is only needed for the last expf call.
fsw ft2, 0(sp)
call expf
mv s2, a0
# e[1] = expf(in[1] - m) -> s3
flw ft0, 32(sp)
flw ft1, 36(sp)
fsub.s ft0, ft0, ft1
fmv.x.w a0, ft0
call expf
mv s3, a0
# e[2] = expf(in[2] - m) -> s4
flw ft0, 28(sp)
flw ft1, 36(sp)
fsub.s ft0, ft0, ft1
fmv.x.w a0, ft0
call expf
mv s4, a0
# e[3] = expf(in[3] - m) -> s5
flw ft0, 24(sp)
flw ft1, 36(sp)
fsub.s ft0, ft0, ft1
fmv.x.w a0, ft0
call expf
mv s5, a0
# e[4] = expf(in[4] - m) -> s6
flw ft0, 20(sp)
flw ft1, 36(sp)
fsub.s ft0, ft0, ft1
fmv.x.w a0, ft0
call expf
mv s6, a0
# e[5] = expf(in[5] - m) -> s8 (note: s8, not s7)
flw ft0, 16(sp)
flw ft1, 36(sp)
fsub.s ft0, ft0, ft1
fmv.x.w a0, ft0
call expf
mv s8, a0
# e[6] = expf(in[6] - m) -> s7
flw ft0, 12(sp)
flw ft1, 36(sp)
fsub.s ft0, ft0, ft1
fmv.x.w a0, ft0
call expf
mv s7, a0
# e[7] = expf(in[7] - m) -> s9
flw ft0, 8(sp)
flw ft1, 36(sp)
fsub.s ft0, ft0, ft1
fmv.x.w a0, ft0
call expf
mv s9, a0
# e[8] = expf(in[8] - m) -> s1
flw ft0, 4(sp)
flw ft1, 36(sp)
fsub.s ft0, ft0, ft1
fmv.x.w a0, ft0
call expf
mv s1, a0
# ft0 = in[9] - m, the argument of the last expf call. The call itself is
# issued further down, after the partial sum has been formed.
flw ft0, 36(sp)
flw ft1, 0(sp)
fsub.s ft0, ft1, ft0
# ft1 = running sum, seeded from .LCPI29_1.
lui a0, %hi(.LCPI29_1)
addi a0, a0, %lo(.LCPI29_1)
flw ft1, 0(a0)
# Add e[0]..e[3] to the sum. Each value is also stored to the frame,
# reusing the slot of an input (or of m) that is no longer needed, so it
# can be reloaded for the divisions after the last call.
fmv.w.x ft2, s2
fsw ft2, 36(sp)
fadd.s ft1, ft2, ft1
fmv.w.x ft2, s3
fsw ft2, 32(sp)
fadd.s ft1, ft1, ft2
fmv.w.x ft2, s4
fsw ft2, 28(sp)
fadd.s ft1, ft1, ft2
fmv.w.x ft2, s5
fsw ft2, 24(sp)
fadd.s ft1, ft1, ft2
# Move the pending expf argument into a0 before ft0 is reused for the sum.
fmv.x.w a0, ft0
# Add e[4] and e[5]; from here on the sum lives in ft0.
fmv.w.x ft0, s6
fsw ft0, 20(sp)
fadd.s ft0, ft1, ft0
fmv.w.x ft1, s8
fsw ft1, 16(sp)
fadd.s ft0, ft0, ft1
# Park the partial sum e[0..5] in the frame across the call.
fsw ft0, 12(sp)
# e[9] = expf(in[9] - m)
call expf
# ft0 = e[9], ft1 = e[8], ft2 = e[7], ft3 = e[6]
fmv.w.x ft0, a0
fmv.w.x ft1, s1
fmv.w.x ft2, s9
fmv.w.x ft3, s7
# ft4 = partial sum + e[6] + e[7] + e[8] + e[9] = full denominator.
flw ft4, 12(sp)
fadd.s ft4, ft4, ft3
fadd.s ft4, ft4, ft2
fadd.s ft4, ft4, ft1
fadd.s ft4, ft4, ft0
# Normalise and store, from out[9] down to out[0].
# out[9] = e[9] / sum
fdiv.s ft0, ft0, ft4
fsw ft0, 36(s0)
# out[8] = e[8] / sum
fdiv.s ft0, ft1, ft4
fsw ft0, 32(s0)
# out[7] = e[7] / sum
fdiv.s ft0, ft2, ft4
fsw ft0, 28(s0)
# out[6] = e[6] / sum
fdiv.s ft0, ft3, ft4
fsw ft0, 24(s0)
# out[5] = e[5] / sum
flw ft0, 16(sp)
fdiv.s ft0, ft0, ft4
fsw ft0, 20(s0)
# out[4] = e[4] / sum
flw ft0, 20(sp)
fdiv.s ft0, ft0, ft4
fsw ft0, 16(s0)
# out[3] = e[3] / sum
flw ft0, 24(sp)
fdiv.s ft0, ft0, ft4
fsw ft0, 12(s0)
# out[2] = e[2] / sum
flw ft0, 28(sp)
fdiv.s ft0, ft0, ft4
fsw ft0, 8(s0)
# out[1] = e[1] / sum
flw ft0, 32(sp)
fdiv.s ft0, ft0, ft4
fsw ft0, 4(s0)
# out[0] = e[0] / sum
flw ft0, 36(sp)
fdiv.s ft0, ft0, ft4
fsw ft0, 0(s0)
# Epilogue: restore s9..s0 and ra, release the frame, return.
ld s9, 40(sp)
ld s8, 48(sp)
ld s7, 56(sp)
ld s6, 64(sp)
ld s5, 72(sp)
ld s4, 80(sp)
ld s3, 88(sp)
ld s2, 96(sp)
ld s1, 104(sp)
ld s0, 112(sp)
ld ra, 120(sp)
addi sp, sp, 128
ret
.Lfunc_end29:
.size fuse_softmax_compute_, .Lfunc_end29-fuse_softmax_compute_
# -- End function
# __TVMAPISetLastError: weak, 8-byte aligned, 8-byte object in .sbss whose
# initial content is zero. The assert_fail paths of fuse_softmax load the
# 64-bit value stored here and jump to it with jalr, with a0 pointing at
# the assertion message, so the slot is used as a function pointer.
# NOTE(review): presumably the runtime stores the real handler address here
# before any operator runs, since a jalr through the initial zero value
# would jump to address 0. Confirm against the module loader.
.type __TVMAPISetLastError,@object # @__TVMAPISetLastError
.section .sbss,"aw",@nobits
.weak __TVMAPISetLastError
.p2align 3
__TVMAPISetLastError:
.quad 0
.size __TVMAPISetLastError, 8
.type .L.str,@object # @.str
.section .rodata,"a",@progbits
.L.str:
.asciz "Assert fail: (num_args == 2), fuse_reshape: num_args should be 2"
.size .L.str, 65
.type .L.str.1,@object # @.str.1
.L.str.1:
.asciz "Assert fail: ((1 == int32(arg0.strides[1])) && (784 == int32(arg0.strides[0]))), arg0.strides: expected to be compact array"
.size .L.str.1, 124
.type .L.str.2,@object # @.str.2
.L.str.2:
.asciz "Assert fail: ((((1 == int32(arg1.strides[3])) && (28 == int32(arg1.strides[2]))) && (784 == int32(arg1.strides[1]))) && (784 == int32(arg1.strides[0]))), arg1.strides: expected to be compact array"
.size .L.str.2, 197
.type .L.str.3,@object # @.str.3
.L.str.3:
.asciz "Assert fail: ((((arg0.code == 3) || (arg0.code == 13)) || (arg0.code == 7)) || (arg0.code == 4)), fuse_reshape: Expect arg[0] to be pointer"
.size .L.str.3, 140
.type .L.str.4,@object # @.str.4
.L.str.4:
.asciz "Assert fail: ((((arg1.code == 3) || (arg1.code == 13)) || (arg1.code == 7)) || (arg1.code == 4)), fuse_reshape: Expect arg[1] to be pointer"
.size .L.str.4, 140
.type .L.str.5,@object # @.str.5
.L.str.5:
.asciz "Assert fail: (dev_type == 1), device_type need to be 1"
.size .L.str.5, 55
.type .L.str.6,@object # @.str.6
.L.str.6:
.asciz "Assert fail: (2 == tvm_struct_get(arg0, 0, 4)), arg0.ndim is expected to equal 2"
.size .L.str.6, 81
.type .L.str.7,@object # @.str.7
.L.str.7:
.asciz "Assert fail: (((tvm_struct_get(arg0, 0, 5) == (uint8)2) && (tvm_struct_get(arg0, 0, 6) == (uint8)32)) && (tvm_struct_get(arg0, 0, 7) == (uint16)1)), arg0.dtype is expected to be float32"
.size .L.str.7, 186
.type .L.str.8,@object # @.str.8
.L.str.8:
.asciz "Assert fail: (int32(arg0.shape[0]) == 1), Argument arg0.shape[0] has an unsatisfied constraint"
.size .L.str.8, 95
.type .L.str.9,@object # @.str.9
.L.str.9:
.asciz "Assert fail: (int32(arg0.shape[1]) == 784), Argument arg0.shape[1] has an unsatisfied constraint"
.size .L.str.9, 97
.type .L.str.10,@object # @.str.10
.L.str.10:
.asciz "Assert fail: (tvm_struct_get(arg0, 0, 8) == (uint64)0), Argument arg0.byte_offset has an unsatisfied constraint"
.size .L.str.10, 112
.type .L.str.11,@object # @.str.11
.L.str.11:
.asciz "Assert fail: (4 == tvm_struct_get(arg1, 0, 4)), arg1.ndim is expected to equal 4"
.size .L.str.11, 81
.type .L.str.12,@object # @.str.12
.L.str.12:
.asciz "Assert fail: (((tvm_struct_get(arg1, 0, 5) == (uint8)2) && (tvm_struct_get(arg1, 0, 6) == (uint8)32)) && (tvm_struct_get(arg1, 0, 7) == (uint16)1)), arg1.dtype is expected to be float32"
.size .L.str.12, 186
.type .L.str.13,@object # @.str.13
.L.str.13:
.asciz "Assert fail: (int32(arg1.shape[0]) == 1), Argument arg1.shape[0] has an unsatisfied constraint"
.size .L.str.13, 95
.type .L.str.14,@object # @.str.14
.L.str.14:
.asciz "Assert fail: (int32(arg1.shape[1]) == 1), Argument arg1.shape[1] has an unsatisfied constraint"
.size .L.str.14, 95
.type .L.str.15,@object # @.str.15
.L.str.15:
.asciz "Assert fail: (int32(arg1.shape[2]) == 28), Argument arg1.shape[2] has an unsatisfied constraint"
.size .L.str.15, 96
.type .L.str.16,@object # @.str.16
.L.str.16:
.asciz "Assert fail: (int32(arg1.shape[3]) == 28), Argument arg1.shape[3] has an unsatisfied constraint"
.size .L.str.16, 96
.type .L.str.17,@object # @.str.17
.L.str.17:
.asciz "Assert fail: (tvm_struct_get(arg1, 0, 8) == (uint64)0), Argument arg1.byte_offset has an unsatisfied constraint"
.size .L.str.17, 112
.type .L.str.18,@object # @.str.18
.L.str.18:
.asciz "Assert fail: (1 == tvm_struct_get(arg1, 0, 10)), Argument arg1.device_type has an unsatisfied constraint"
.size .L.str.18, 105
.type .L.str.19,@object # @.str.19
.L.str.19:
.asciz "Assert fail: (dev_id == tvm_struct_get(arg1, 0, 9)), Argument arg1.device_id has an unsatisfied constraint"
.size .L.str.19, 107
.type .L.str.20,@object # @.str.20
.L.str.20:
.asciz "Assert fail: (num_args == 4), fuse_conv2d: num_args should be 4"
.size .L.str.20, 64
.type .L.str.21,@object # @.str.21
.L.str.21:
.asciz "Assert fail: ((((1 == int32(arg0.strides[3])) && (28 == int32(arg0.strides[2]))) && (784 == int32(arg0.strides[1]))) && (784 == int32(arg0.strides[0]))), arg0.strides: expected to be compact array"
.size .L.str.21, 197
.type .L.str.22,@object # @.str.22
.L.str.22:
.asciz "Assert fail: ((((1 == int32(arg1.strides[3])) && (5 == int32(arg1.strides[2]))) && (25 == int32(arg1.strides[1]))) && (25 == int32(arg1.strides[0]))), arg1.strides: expected to be compact array"
.size .L.str.22, 194
.type .L.str.23,@object # @.str.23
.L.str.23:
.asciz "Assert fail: (1 == int32(arg2.strides[0])), arg2.strides: expected to be compact array"
.size .L.str.23, 87
.type .L.str.24,@object # @.str.24
.L.str.24:
.asciz "Assert fail: ((((1 == int32(arg3.strides[3])) && (28 == int32(arg3.strides[2]))) && (784 == int32(arg3.strides[1]))) && (25088 == int32(arg3.strides[0]))), arg3.strides: expected to be compact array"
.size .L.str.24, 199
.type .L.str.25,@object # @.str.25
.L.str.25:
.asciz "Assert fail: ((((arg0.code == 3) || (arg0.code == 13)) || (arg0.code == 7)) || (arg0.code == 4)), fuse_conv2d: Expect arg[0] to be pointer"
.size .L.str.25, 139
.type .L.str.26,@object # @.str.26
.L.str.26:
.asciz "Assert fail: ((((arg1.code == 3) || (arg1.code == 13)) || (arg1.code == 7)) || (arg1.code == 4)), fuse_conv2d: Expect arg[1] to be pointer"
.size .L.str.26, 139
.type .L.str.27,@object # @.str.27
.L.str.27:
.asciz "Assert fail: ((((arg2.code == 3) || (arg2.code == 13)) || (arg2.code == 7)) || (arg2.code == 4)), fuse_conv2d: Expect arg[2] to be pointer"
.size .L.str.27, 139
.type .L.str.28,@object # @.str.28
.L.str.28:
.asciz "Assert fail: ((((arg3.code == 3) || (arg3.code == 13)) || (arg3.code == 7)) || (arg3.code == 4)), fuse_conv2d: Expect arg[3] to be pointer"
.size .L.str.28, 139
.type .L.str.29,@object # @.str.29
.L.str.29:
.asciz "Assert fail: (4 == tvm_struct_get(arg0, 0, 4)), arg0.ndim is expected to equal 4"
.size .L.str.29, 81
.type .L.str.30,@object # @.str.30
.L.str.30:
.asciz "Assert fail: (int32(arg0.shape[1]) == 1), Argument arg0.shape[1] has an unsatisfied constraint"
.size .L.str.30, 95
.type .L.str.31,@object # @.str.31
.L.str.31:
.asciz "Assert fail: (int32(arg0.shape[2]) == 28), Argument arg0.shape[2] has an unsatisfied constraint"
.size .L.str.31, 96
.type .L.str.32,@object # @.str.32
.L.str.32:
.asciz "Assert fail: (int32(arg0.shape[3]) == 28), Argument arg0.shape[3] has an unsatisfied constraint"
.size .L.str.32, 96
.type .L.str.33,@object # @.str.33
.L.str.33:
.asciz "Assert fail: (int32(arg1.shape[0]) == 32), Argument arg1.shape[0] has an unsatisfied constraint"
.size .L.str.33, 96
.type .L.str.34,@object # @.str.34
.L.str.34:
.asciz "Assert fail: (int32(arg1.shape[2]) == 5), Argument arg1.shape[2] has an unsatisfied constraint"
.size .L.str.34, 95
.type .L.str.35,@object # @.str.35
.L.str.35:
.asciz "Assert fail: (int32(arg1.shape[3]) == 5), Argument arg1.shape[3] has an unsatisfied constraint"
.size .L.str.35, 95
.type .L.str.36,@object # @.str.36
.L.str.36:
.asciz "Assert fail: (1 == tvm_struct_get(arg2, 0, 4)), arg2.ndim is expected to equal 1"
.size .L.str.36, 81
.type .L.str.37,@object # @.str.37
.L.str.37:
.asciz "Assert fail: (((tvm_struct_get(arg2, 0, 5) == (uint8)2) && (tvm_struct_get(arg2, 0, 6) == (uint8)32)) && (tvm_struct_get(arg2, 0, 7) == (uint16)1)), arg2.dtype is expected to be float32"
.size .L.str.37, 186
.type .L.str.38,@object # @.str.38
.L.str.38:
.asciz "Assert fail: (int32(arg2.shape[0]) == 32), Argument arg2.shape[0] has an unsatisfied constraint"
.size .L.str.38, 96
.type .L.str.39,@object # @.str.39
.L.str.39:
.asciz "Assert fail: (tvm_struct_get(arg2, 0, 8) == (uint64)0), Argument arg2.byte_offset has an unsatisfied constraint"
.size .L.str.39, 112
.type .L.str.40,@object # @.str.40
.L.str.40:
.asciz "Assert fail: (1 == tvm_struct_get(arg2, 0, 10)), Argument arg2.device_type has an unsatisfied constraint"
.size .L.str.40, 105
.type .L.str.41,@object # @.str.41
.L.str.41:
.asciz "Assert fail: (dev_id == tvm_struct_get(arg2, 0, 9)), Argument arg2.device_id has an unsatisfied constraint"
.size .L.str.41, 107
.type .L.str.42,@object # @.str.42
.L.str.42:
.asciz "Assert fail: (4 == tvm_struct_get(arg3, 0, 4)), arg3.ndim is expected to equal 4"
.size .L.str.42, 81
.type .L.str.43,@object # @.str.43
.L.str.43:
.asciz "Assert fail: (((tvm_struct_get(arg3, 0, 5) == (uint8)2) && (tvm_struct_get(arg3, 0, 6) == (uint8)32)) && (tvm_struct_get(arg3, 0, 7) == (uint16)1)), arg3.dtype is expected to be float32"
.size .L.str.43, 186
.type .L.str.44,@object # @.str.44
.L.str.44:
.asciz "Assert fail: (int32(arg3.shape[0]) == 1), Argument arg3.shape[0] has an unsatisfied constraint"
.size .L.str.44, 95
.type .L.str.45,@object # @.str.45
.L.str.45:
.asciz "Assert fail: (int32(arg3.shape[1]) == 32), Argument arg3.shape[1] has an unsatisfied constraint"
.size .L.str.45, 96
.type .L.str.46,@object # @.str.46
.L.str.46:
.asciz "Assert fail: (int32(arg3.shape[2]) == 28), Argument arg3.shape[2] has an unsatisfied constraint"
.size .L.str.46, 96
.type .L.str.47,@object # @.str.47
.L.str.47:
.asciz "Assert fail: (int32(arg3.shape[3]) == 28), Argument arg3.shape[3] has an unsatisfied constraint"
.size .L.str.47, 96
.type .L.str.48,@object # @.str.48
.L.str.48:
.asciz "Assert fail: (tvm_struct_get(arg3, 0, 8) == (uint64)0), Argument arg3.byte_offset has an unsatisfied constraint"
.size .L.str.48, 112
.type .L.str.49,@object # @.str.49
.L.str.49:
.asciz "Assert fail: (1 == tvm_struct_get(arg3, 0, 10)), Argument arg3.device_type has an unsatisfied constraint"
.size .L.str.49, 105
.type .L.str.50,@object # @.str.50
.L.str.50:
.asciz "Assert fail: (dev_id == tvm_struct_get(arg3, 0, 9)), Argument arg3.device_id has an unsatisfied constraint"
.size .L.str.50, 107
# __TVMBackendAllocWorkspace: weak, 8-byte aligned, 8-byte object in .sbss
# whose initial content is zero.
# NOTE(review): no user of this symbol is visible in this part of the file.
# It is declared the same way as __TVMAPISetLastError, so it presumably
# holds a function pointer filled in by the runtime. Confirm.
.type __TVMBackendAllocWorkspace,@object # @__TVMBackendAllocWorkspace
.section .sbss,"aw",@nobits
.weak __TVMBackendAllocWorkspace
.p2align 3
__TVMBackendAllocWorkspace:
.quad 0
.size __TVMBackendAllocWorkspace, 8
# __TVMBackendFreeWorkspace: weak, 8-byte aligned, 8-byte object with
# initial content zero. It is emitted into the section selected by the
# preceding .section directive (.sbss).
# NOTE(review): no user of this symbol is visible in this part of the file.
# It presumably holds a function pointer filled in by the runtime. Confirm.
.type __TVMBackendFreeWorkspace,@object # @__TVMBackendFreeWorkspace
.weak __TVMBackendFreeWorkspace
.p2align 3
__TVMBackendFreeWorkspace:
.quad 0
.size __TVMBackendFreeWorkspace, 8
.type .L.str.51,@object # @.str.51
.section .rodata,"a",@progbits
.L.str.51:
.asciz "Assert fail: (num_args == 2), fuse_relu: num_args should be 2"
.size .L.str.51, 62
.type .L.str.52,@object # @.str.52
.L.str.52:
.asciz "Assert fail: (1 == int32(arg0.strides[0])), arg0.strides: expected to be compact array"
.size .L.str.52, 87
.type .L.str.53,@object # @.str.53
.L.str.53:
.asciz "Assert fail: (1 == int32(arg1.strides[0])), arg1.strides: expected to be compact array"
.size .L.str.53, 87
.type .L.str.54,@object # @.str.54
.L.str.54:
.asciz "Assert fail: ((((arg0.code == 3) || (arg0.code == 13)) || (arg0.code == 7)) || (arg0.code == 4)), fuse_relu: Expect arg[0] to be pointer"
.size .L.str.54, 137
.type .L.str.55,@object # @.str.55
.L.str.55:
.asciz "Assert fail: ((((arg1.code == 3) || (arg1.code == 13)) || (arg1.code == 7)) || (arg1.code == 4)), fuse_relu: Expect arg[1] to be pointer"
.size .L.str.55, 137
.type .L.str.56,@object # @.str.56
.L.str.56:
.asciz "Assert fail: (1 == tvm_struct_get(arg0, 0, 4)), arg0.ndim is expected to equal 1"
.size .L.str.56, 81
.type .L.str.57,@object # @.str.57
.L.str.57:
.asciz "Assert fail: (int32(arg0.shape[0]) == 25088), Argument arg0.shape[0] has an unsatisfied constraint"
.size .L.str.57, 99
.type .L.str.58,@object # @.str.58
.L.str.58:
.asciz "Assert fail: (1 == tvm_struct_get(arg1, 0, 4)), arg1.ndim is expected to equal 1"
.size .L.str.58, 81
.type .L.str.59,@object # @.str.59
.L.str.59:
.asciz "Assert fail: (int32(arg1.shape[0]) == 25088), Argument arg1.shape[0] has an unsatisfied constraint"
.size .L.str.59, 99
.type .L.str.60,@object # @.str.60
.L.str.60:
.asciz "Assert fail: (num_args == 2), fuse_max_pool2d: num_args should be 2"
.size .L.str.60, 68
.type .L.str.61,@object # @.str.61
.L.str.61:
.asciz "Assert fail: ((((1 == int32(arg0.strides[3])) && (28 == int32(arg0.strides[2]))) && (784 == int32(arg0.strides[1]))) && (25088 == int32(arg0.strides[0]))), arg0.strides: expected to be compact array"
.size .L.str.61, 199
.type .L.str.62,@object # @.str.62
.L.str.62:
.asciz "Assert fail: ((((1 == int32(arg1.strides[3])) && (14 == int32(arg1.strides[2]))) && (196 == int32(arg1.strides[1]))) && (6272 == int32(arg1.strides[0]))), arg1.strides: expected to be compact array"
.size .L.str.62, 198
.type .L.str.63,@object # @.str.63
.L.str.63:
.asciz "Assert fail: ((((arg0.code == 3) || (arg0.code == 13)) || (arg0.code == 7)) || (arg0.code == 4)), fuse_max_pool2d: Expect arg[0] to be pointer"
.size .L.str.63, 143
.type .L.str.64,@object # @.str.64
.L.str.64:
.asciz "Assert fail: ((((arg1.code == 3) || (arg1.code == 13)) || (arg1.code == 7)) || (arg1.code == 4)), fuse_max_pool2d: Expect arg[1] to be pointer"
.size .L.str.64, 143
.type .L.str.65,@object # @.str.65
.L.str.65:
.asciz "Assert fail: (int32(arg0.shape[1]) == 32), Argument arg0.shape[1] has an unsatisfied constraint"
.size .L.str.65, 96
.type .L.str.66,@object # @.str.66
.L.str.66:
.asciz "Assert fail: (int32(arg1.shape[1]) == 32), Argument arg1.shape[1] has an unsatisfied constraint"
.size .L.str.66, 96
.type .L.str.67,@object # @.str.67
.L.str.67:
.asciz "Assert fail: (int32(arg1.shape[2]) == 14), Argument arg1.shape[2] has an unsatisfied constraint"
.size .L.str.67, 96
.type .L.str.68,@object # @.str.68
.L.str.68:
.asciz "Assert fail: (int32(arg1.shape[3]) == 14), Argument arg1.shape[3] has an unsatisfied constraint"
.size .L.str.68, 96
.type .L.str.69,@object # @.str.69
.L.str.69:
.asciz "Assert fail: (num_args == 4), fuse_conv2d_1: num_args should be 4"
.size .L.str.69, 66
.type .L.str.70,@object # @.str.70
.L.str.70:
.asciz "Assert fail: ((((1 == int32(arg0.strides[3])) && (14 == int32(arg0.strides[2]))) && (196 == int32(arg0.strides[1]))) && (6272 == int32(arg0.strides[0]))), arg0.strides: expected to be compact array"
.size .L.str.70, 198
.type .L.str.71,@object # @.str.71
.L.str.71:
.asciz "Assert fail: ((((1 == int32(arg1.strides[3])) && (5 == int32(arg1.strides[2]))) && (25 == int32(arg1.strides[1]))) && (800 == int32(arg1.strides[0]))), arg1.strides: expected to be compact array"
.size .L.str.71, 195
.type .L.str.72,@object # @.str.72
.L.str.72:
.asciz "Assert fail: ((((1 == int32(arg3.strides[3])) && (14 == int32(arg3.strides[2]))) && (196 == int32(arg3.strides[1]))) && (12544 == int32(arg3.strides[0]))), arg3.strides: expected to be compact array"
.size .L.str.72, 199
.type .L.str.73,@object # @.str.73
.L.str.73:
.asciz "Assert fail: ((((arg0.code == 3) || (arg0.code == 13)) || (arg0.code == 7)) || (arg0.code == 4)), fuse_conv2d_1: Expect arg[0] to be pointer"
.size .L.str.73, 141
.type .L.str.74,@object # @.str.74
.L.str.74:
.asciz "Assert fail: ((((arg1.code == 3) || (arg1.code == 13)) || (arg1.code == 7)) || (arg1.code == 4)), fuse_conv2d_1: Expect arg[1] to be pointer"
.size .L.str.74, 141
.type .L.str.75,@object # @.str.75
.L.str.75:
.asciz "Assert fail: ((((arg2.code == 3) || (arg2.code == 13)) || (arg2.code == 7)) || (arg2.code == 4)), fuse_conv2d_1: Expect arg[2] to be pointer"
.size .L.str.75, 141
.type .L.str.76,@object # @.str.76
.L.str.76:
.asciz "Assert fail: ((((arg3.code == 3) || (arg3.code == 13)) || (arg3.code == 7)) || (arg3.code == 4)), fuse_conv2d_1: Expect arg[3] to be pointer"
.size .L.str.76, 141
.type .L.str.77,@object # @.str.77
.L.str.77:
.asciz "Assert fail: (int32(arg0.shape[2]) == 14), Argument arg0.shape[2] has an unsatisfied constraint"
.size .L.str.77, 96
.type .L.str.78,@object # @.str.78
.L.str.78:
.asciz "Assert fail: (int32(arg0.shape[3]) == 14), Argument arg0.shape[3] has an unsatisfied constraint"
.size .L.str.78, 96
.type .L.str.79,@object # @.str.79
.L.str.79:
.asciz "Assert fail: (int32(arg1.shape[0]) == 64), Argument arg1.shape[0] has an unsatisfied constraint"
.size .L.str.79, 96
.type .L.str.80,@object # @.str.80
.L.str.80:
.asciz "Assert fail: (int32(arg2.shape[0]) == 64), Argument arg2.shape[0] has an unsatisfied constraint"
.size .L.str.80, 96
.type .L.str.81,@object # @.str.81
.L.str.81:
.asciz "Assert fail: (int32(arg3.shape[1]) == 64), Argument arg3.shape[1] has an unsatisfied constraint"
.size .L.str.81, 96
.type .L.str.82,@object # @.str.82
.L.str.82:
.asciz "Assert fail: (int32(arg3.shape[2]) == 14), Argument arg3.shape[2] has an unsatisfied constraint"
.size .L.str.82, 96
.type .L.str.83,@object # @.str.83
.L.str.83:
.asciz "Assert fail: (int32(arg3.shape[3]) == 14), Argument arg3.shape[3] has an unsatisfied constraint"
.size .L.str.83, 96
.type .L.str.84,@object # @.str.84
.L.str.84:
.asciz "Assert fail: (num_args == 2), fuse_relu_1: num_args should be 2"
.size .L.str.84, 64
.type .L.str.85,@object # @.str.85
.L.str.85:
.asciz "Assert fail: ((((arg0.code == 3) || (arg0.code == 13)) || (arg0.code == 7)) || (arg0.code == 4)), fuse_relu_1: Expect arg[0] to be pointer"
.size .L.str.85, 139
.type .L.str.86,@object # @.str.86
.L.str.86:
.asciz "Assert fail: ((((arg1.code == 3) || (arg1.code == 13)) || (arg1.code == 7)) || (arg1.code == 4)), fuse_relu_1: Expect arg[1] to be pointer"
.size .L.str.86, 139
.type .L.str.87,@object # @.str.87
.L.str.87:
.asciz "Assert fail: (int32(arg0.shape[0]) == 12544), Argument arg0.shape[0] has an unsatisfied constraint"
.size .L.str.87, 99
.type .L.str.88,@object # @.str.88
.L.str.88:
.asciz "Assert fail: (int32(arg1.shape[0]) == 12544), Argument arg1.shape[0] has an unsatisfied constraint"
.size .L.str.88, 99
.type .L.str.89,@object # @.str.89
.L.str.89:
.asciz "Assert fail: (num_args == 2), fuse_max_pool2d_1: num_args should be 2"
.size .L.str.89, 70
.type .L.str.90,@object # @.str.90
.L.str.90:
.asciz "Assert fail: ((((1 == int32(arg0.strides[3])) && (14 == int32(arg0.strides[2]))) && (196 == int32(arg0.strides[1]))) && (12544 == int32(arg0.strides[0]))), arg0.strides: expected to be compact array"
.size .L.str.90, 199
.type .L.str.91,@object # @.str.91
.L.str.91:
.asciz "Assert fail: ((((1 == int32(arg1.strides[3])) && (7 == int32(arg1.strides[2]))) && (49 == int32(arg1.strides[1]))) && (3136 == int32(arg1.strides[0]))), arg1.strides: expected to be compact array"
.size .L.str.91, 196
.type .L.str.92,@object # @.str.92
.L.str.92:
.asciz "Assert fail: ((((arg0.code == 3) || (arg0.code == 13)) || (arg0.code == 7)) || (arg0.code == 4)), fuse_max_pool2d_1: Expect arg[0] to be pointer"
.size .L.str.92, 145
.type .L.str.93,@object # @.str.93
.L.str.93:
.asciz "Assert fail: ((((arg1.code == 3) || (arg1.code == 13)) || (arg1.code == 7)) || (arg1.code == 4)), fuse_max_pool2d_1: Expect arg[1] to be pointer"
.size .L.str.93, 145
.type .L.str.94,@object # @.str.94
.L.str.94:
.asciz "Assert fail: (int32(arg0.shape[1]) == 64), Argument arg0.shape[1] has an unsatisfied constraint"
.size .L.str.94, 96
.type .L.str.95,@object # @.str.95
.L.str.95:
.asciz "Assert fail: (int32(arg1.shape[1]) == 64), Argument arg1.shape[1] has an unsatisfied constraint"
.size .L.str.95, 96
.type .L.str.96,@object # @.str.96
.L.str.96:
.asciz "Assert fail: (int32(arg1.shape[2]) == 7), Argument arg1.shape[2] has an unsatisfied constraint"
.size .L.str.96, 95
.type .L.str.97,@object # @.str.97
.L.str.97:
.asciz "Assert fail: (int32(arg1.shape[3]) == 7), Argument arg1.shape[3] has an unsatisfied constraint"
.size .L.str.97, 95
.type .L.str.98,@object # @.str.98
.L.str.98:
.asciz "Assert fail: (num_args == 2), fuse_transpose: num_args should be 2"
.size .L.str.98, 67
.type .L.str.99,@object # @.str.99
.L.str.99:
.asciz "Assert fail: ((((1 == int32(arg0.strides[3])) && (7 == int32(arg0.strides[2]))) && (49 == int32(arg0.strides[1]))) && (3136 == int32(arg0.strides[0]))), arg0.strides: expected to be compact array"
.size .L.str.99, 196
.type .L.str.100,@object # @.str.100
.L.str.100:
.asciz "Assert fail: ((((1 == int32(arg1.strides[3])) && (64 == int32(arg1.strides[2]))) && (448 == int32(arg1.strides[1]))) && (3136 == int32(arg1.strides[0]))), arg1.strides: expected to be compact array"
.size .L.str.100, 198
.type .L.str.101,@object # @.str.101
.L.str.101:
.asciz "Assert fail: ((((arg0.code == 3) || (arg0.code == 13)) || (arg0.code == 7)) || (arg0.code == 4)), fuse_transpose: Expect arg[0] to be pointer"
.size .L.str.101, 142
.type .L.str.102,@object # @.str.102
.L.str.102:
.asciz "Assert fail: ((((arg1.code == 3) || (arg1.code == 13)) || (arg1.code == 7)) || (arg1.code == 4)), fuse_transpose: Expect arg[1] to be pointer"
.size .L.str.102, 142
.type .L.str.103,@object # @.str.103
.L.str.103:
.asciz "Assert fail: (int32(arg0.shape[2]) == 7), Argument arg0.shape[2] has an unsatisfied constraint"
.size .L.str.103, 95
.type .L.str.104,@object # @.str.104
.L.str.104:
.asciz "Assert fail: (int32(arg0.shape[3]) == 7), Argument arg0.shape[3] has an unsatisfied constraint"
.size .L.str.104, 95
.type .L.str.105,@object # @.str.105
.L.str.105:
.asciz "Assert fail: (int32(arg1.shape[1]) == 7), Argument arg1.shape[1] has an unsatisfied constraint"
.size .L.str.105, 95
.type .L.str.106,@object # @.str.106
.L.str.106:
.asciz "Assert fail: (int32(arg1.shape[3]) == 64), Argument arg1.shape[3] has an unsatisfied constraint"
.size .L.str.106, 96
.type .L.str.107,@object # @.str.107
.L.str.107:
.asciz "Assert fail: (num_args == 2), fuse_reshape_1: num_args should be 2"
.size .L.str.107, 67
.type .L.str.108,@object # @.str.108
.L.str.108:
.asciz "Assert fail: ((((1 == int32(arg0.strides[3])) && (64 == int32(arg0.strides[2]))) && (448 == int32(arg0.strides[1]))) && (3136 == int32(arg0.strides[0]))), arg0.strides: expected to be compact array"
.size .L.str.108, 198
.type .L.str.109,@object # @.str.109
.L.str.109:
.asciz "Assert fail: ((1 == int32(arg1.strides[1])) && (3136 == int32(arg1.strides[0]))), arg1.strides: expected to be compact array"
.size .L.str.109, 125
.type .L.str.110,@object # @.str.110
.L.str.110:
.asciz "Assert fail: ((((arg0.code == 3) || (arg0.code == 13)) || (arg0.code == 7)) || (arg0.code == 4)), fuse_reshape_1: Expect arg[0] to be pointer"
.size .L.str.110, 142
.type .L.str.111,@object # @.str.111
.L.str.111:
.asciz "Assert fail: ((((arg1.code == 3) || (arg1.code == 13)) || (arg1.code == 7)) || (arg1.code == 4)), fuse_reshape_1: Expect arg[1] to be pointer"
.size .L.str.111, 142
.type .L.str.112,@object # @.str.112
.L.str.112:
.asciz "Assert fail: (int32(arg0.shape[1]) == 7), Argument arg0.shape[1] has an unsatisfied constraint"
.size .L.str.112, 95
.type .L.str.113,@object # @.str.113
.L.str.113:
.asciz "Assert fail: (int32(arg0.shape[3]) == 64), Argument arg0.shape[3] has an unsatisfied constraint"
.size .L.str.113, 96
.type .L.str.114,@object # @.str.114
.L.str.114:
.asciz "Assert fail: (2 == tvm_struct_get(arg1, 0, 4)), arg1.ndim is expected to equal 2"
.size .L.str.114, 81
.type .L.str.115,@object # @.str.115
.L.str.115:
.asciz "Assert fail: (int32(arg1.shape[1]) == 3136), Argument arg1.shape[1] has an unsatisfied constraint"
.size .L.str.115, 98
.type .L.str.116,@object # @.str.116
.L.str.116:
.asciz "Assert fail: (num_args == 3), fuse_matmul: num_args should be 3"
.size .L.str.116, 64
.type .L.str.117,@object # @.str.117
.L.str.117:
.asciz "Assert fail: ((1 == int32(arg0.strides[1])) && (3136 == int32(arg0.strides[0]))), arg0.strides: expected to be compact array"
.size .L.str.117, 125
.type .L.str.118,@object # @.str.118
.L.str.118:
.asciz "Assert fail: ((1 == int32(arg1.strides[1])) && (100 == int32(arg1.strides[0]))), arg1.strides: expected to be compact array"
.size .L.str.118, 124
.type .L.str.119,@object # @.str.119
.L.str.119:
.asciz "Assert fail: ((1 == int32(arg2.strides[1])) && (100 == int32(arg2.strides[0]))), arg2.strides: expected to be compact array"
.size .L.str.119, 124
.type .L.str.120,@object # @.str.120
.L.str.120:
.asciz "Assert fail: ((((arg0.code == 3) || (arg0.code == 13)) || (arg0.code == 7)) || (arg0.code == 4)), fuse_matmul: Expect arg[0] to be pointer"
.size .L.str.120, 139
.type .L.str.121,@object # @.str.121
.L.str.121:
.asciz "Assert fail: ((((arg1.code == 3) || (arg1.code == 13)) || (arg1.code == 7)) || (arg1.code == 4)), fuse_matmul: Expect arg[1] to be pointer"
.size .L.str.121, 139
.type .L.str.122,@object # @.str.122
.L.str.122:
.asciz "Assert fail: ((((arg2.code == 3) || (arg2.code == 13)) || (arg2.code == 7)) || (arg2.code == 4)), fuse_matmul: Expect arg[2] to be pointer"
.size .L.str.122, 139
.type .L.str.123,@object # @.str.123
.L.str.123:
.asciz "Assert fail: (int32(arg0.shape[1]) == 3136), Argument arg0.shape[1] has an unsatisfied constraint"
.size .L.str.123, 98
.type .L.str.124,@object # @.str.124
.L.str.124:
.asciz "Assert fail: (int32(arg1.shape[0]) == 3136), Argument arg1.shape[0] has an unsatisfied constraint"
.size .L.str.124, 98
.type .L.str.125,@object # @.str.125
.L.str.125:
.asciz "Assert fail: (int32(arg1.shape[1]) == 100), Argument arg1.shape[1] has an unsatisfied constraint"
.size .L.str.125, 97
.type .L.str.126,@object # @.str.126
.L.str.126:
.asciz "Assert fail: (2 == tvm_struct_get(arg2, 0, 4)), arg2.ndim is expected to equal 2"
.size .L.str.126, 81
.type .L.str.127,@object # @.str.127
.L.str.127:
.asciz "Assert fail: (int32(arg2.shape[0]) == 1), Argument arg2.shape[0] has an unsatisfied constraint"
.size .L.str.127, 95
.type .L.str.128,@object # @.str.128
.L.str.128:
.asciz "Assert fail: (int32(arg2.shape[1]) == 100), Argument arg2.shape[1] has an unsatisfied constraint"
.size .L.str.128, 97
# Assertion messages for fuse_elemwise_add's argument checks:
#   .L.str.129        num_args must be 3
#   .L.str.130..132   argN.code must be one of 3, 13, 7 or 4 (N = 0, 1, 2)
# Each object is a NUL-terminated string; .size is the message length plus
# the terminating NUL (69 + 1 and 144 + 1 respectively).
.type .L.str.129,@object # @.str.129
.L.str.129:
.asciz "Assert fail: (num_args == 3), fuse_elemwise_add: num_args should be 3"
.size .L.str.129, 70
.type .L.str.130,@object # @.str.130
.L.str.130:
.asciz "Assert fail: ((((arg0.code == 3) || (arg0.code == 13)) || (arg0.code == 7)) || (arg0.code == 4)), fuse_elemwise_add: Expect arg[0] to be pointer"
.size .L.str.130, 145
.type .L.str.131,@object # @.str.131
.L.str.131:
.asciz "Assert fail: ((((arg1.code == 3) || (arg1.code == 13)) || (arg1.code == 7)) || (arg1.code == 4)), fuse_elemwise_add: Expect arg[1] to be pointer"
.size .L.str.131, 145
.type .L.str.132,@object # @.str.132
.L.str.132:
.asciz "Assert fail: ((((arg2.code == 3) || (arg2.code == 13)) || (arg2.code == 7)) || (arg2.code == 4)), fuse_elemwise_add: Expect arg[2] to be pointer"
.size .L.str.132, 145
# Shape-constraint assertion messages requiring shape[0] == 100 for arg0,
# arg1 and arg2 respectively. The message text names no function.
# NOTE(review): presumably used by fuse_elemwise_add (and possibly shared
# with other functions that check the same shapes) -- confirm at the sites
# that reference these labels.
# Each .size of 97 is the 96 message characters plus the terminating NUL.
.type .L.str.133,@object # @.str.133
.L.str.133:
.asciz "Assert fail: (int32(arg0.shape[0]) == 100), Argument arg0.shape[0] has an unsatisfied constraint"
.size .L.str.133, 97
.type .L.str.134,@object # @.str.134
.L.str.134:
.asciz "Assert fail: (int32(arg1.shape[0]) == 100), Argument arg1.shape[0] has an unsatisfied constraint"
.size .L.str.134, 97
.type .L.str.135,@object # @.str.135
.L.str.135:
.asciz "Assert fail: (int32(arg2.shape[0]) == 100), Argument arg2.shape[0] has an unsatisfied constraint"
.size .L.str.135, 97
# Assertion messages for fuse_sigmoid's argument checks:
#   .L.str.136        num_args must be 2
#   .L.str.137..138   argN.code must be one of 3, 13, 7 or 4 (N = 0, 1)
# Each object is a NUL-terminated string; .size is the message length plus
# the terminating NUL (64 + 1 and 139 + 1 respectively).
.type .L.str.136,@object # @.str.136
.L.str.136:
.asciz "Assert fail: (num_args == 2), fuse_sigmoid: num_args should be 2"
.size .L.str.136, 65
.type .L.str.137,@object # @.str.137
.L.str.137:
.asciz "Assert fail: ((((arg0.code == 3) || (arg0.code == 13)) || (arg0.code == 7)) || (arg0.code == 4)), fuse_sigmoid: Expect arg[0] to be pointer"
.size .L.str.137, 140
.type .L.str.138,@object # @.str.138
.L.str.138:
.asciz "Assert fail: ((((arg1.code == 3) || (arg1.code == 13)) || (arg1.code == 7)) || (arg1.code == 4)), fuse_sigmoid: Expect arg[1] to be pointer"
.size .L.str.138, 140
# Assertion message for fuse_matmul_1's argument-count check (num_args must
# be 3). NUL-terminated; .size is the 65 message characters plus the NUL.
.type .L.str.139,@object # @.str.139
.L.str.139:
.asciz "Assert fail: (num_args == 3), fuse_matmul_1: num_args should be 3"
.size .L.str.139, 66
# Compact-stride assertion messages. Each requires strides[1] == 1 and a
# fixed strides[0]:
#   .L.str.140  arg0: strides[0] == 100
#   .L.str.141  arg1: strides[0] == 10
#   .L.str.142  arg2: strides[0] == 10
# The message text names no function.
# NOTE(review): presumably used by fuse_matmul_1, judging by the neighbouring
# strings -- confirm at the sites that reference these labels.
# Each .size is the message length plus one byte for the NUL from .asciz.
.type .L.str.140,@object # @.str.140
.L.str.140:
.asciz "Assert fail: ((1 == int32(arg0.strides[1])) && (100 == int32(arg0.strides[0]))), arg0.strides: expected to be compact array"
.size .L.str.140, 124
.type .L.str.141,@object # @.str.141
.L.str.141:
.asciz "Assert fail: ((1 == int32(arg1.strides[1])) && (10 == int32(arg1.strides[0]))), arg1.strides: expected to be compact array"
.size .L.str.141, 123
.type .L.str.142,@object # @.str.142
.L.str.142:
.asciz "Assert fail: ((1 == int32(arg2.strides[1])) && (10 == int32(arg2.strides[0]))), arg2.strides: expected to be compact array"
.size .L.str.142, 123
# Assertion messages for fuse_matmul_1's argument type-code checks, one
# string per argument (arg0, arg1, arg2). Each message states that argN.code
# must be one of 3, 13, 7 or 4. NUL-terminated; the .size of 141 is the 140
# message characters plus the terminating NUL.
.type .L.str.143,@object # @.str.143
.L.str.143:
.asciz "Assert fail: ((((arg0.code == 3) || (arg0.code == 13)) || (arg0.code == 7)) || (arg0.code == 4)), fuse_matmul_1: Expect arg[0] to be pointer"
.size .L.str.143, 141
.type .L.str.144,@object # @.str.144
.L.str.144:
.asciz "Assert fail: ((((arg1.code == 3) || (arg1.code == 13)) || (arg1.code == 7)) || (arg1.code == 4)), fuse_matmul_1: Expect arg[1] to be pointer"
.size .L.str.144, 141
.type .L.str.145,@object # @.str.145
.L.str.145:
.asciz "Assert fail: ((((arg2.code == 3) || (arg2.code == 13)) || (arg2.code == 7)) || (arg2.code == 4)), fuse_matmul_1: Expect arg[2] to be pointer"
.size .L.str.145, 141
# Shape-constraint assertion messages on dimension 1:
#   .L.str.146  arg0.shape[1] == 100
#   .L.str.147  arg1.shape[1] == 10
#   .L.str.148  arg2.shape[1] == 10
# The message text names no function.
# NOTE(review): presumably used by fuse_matmul_1, judging by the neighbouring
# strings -- confirm at the sites that reference these labels.
# Each .size is the message length plus one byte for the NUL from .asciz.
.type .L.str.146,@object # @.str.146
.L.str.146:
.asciz "Assert fail: (int32(arg0.shape[1]) == 100), Argument arg0.shape[1] has an unsatisfied constraint"
.size .L.str.146, 97
.type .L.str.147,@object # @.str.147
.L.str.147:
.asciz "Assert fail: (int32(arg1.shape[1]) == 10), Argument arg1.shape[1] has an unsatisfied constraint"
.size .L.str.147, 96
.type .L.str.148,@object # @.str.148
.L.str.148:
.asciz "Assert fail: (int32(arg2.shape[1]) == 10), Argument arg2.shape[1] has an unsatisfied constraint"
.size .L.str.148, 96
# Assertion messages for fuse_elemwise_add_1's argument checks:
#   .L.str.149        num_args must be 3
#   .L.str.150..152   argN.code must be one of 3, 13, 7 or 4 (N = 0, 1, 2)
# Each object is a NUL-terminated string; .size is the message length plus
# the terminating NUL (71 + 1 and 146 + 1 respectively).
.type .L.str.149,@object # @.str.149
.L.str.149:
.asciz "Assert fail: (num_args == 3), fuse_elemwise_add_1: num_args should be 3"
.size .L.str.149, 72
.type .L.str.150,@object # @.str.150
.L.str.150:
.asciz "Assert fail: ((((arg0.code == 3) || (arg0.code == 13)) || (arg0.code == 7)) || (arg0.code == 4)), fuse_elemwise_add_1: Expect arg[0] to be pointer"
.size .L.str.150, 147
.type .L.str.151,@object # @.str.151
.L.str.151:
.asciz "Assert fail: ((((arg1.code == 3) || (arg1.code == 13)) || (arg1.code == 7)) || (arg1.code == 4)), fuse_elemwise_add_1: Expect arg[1] to be pointer"
.size .L.str.151, 147
.type .L.str.152,@object # @.str.152
.L.str.152:
.asciz "Assert fail: ((((arg2.code == 3) || (arg2.code == 13)) || (arg2.code == 7)) || (arg2.code == 4)), fuse_elemwise_add_1: Expect arg[2] to be pointer"
.size .L.str.152, 147
# Shape-constraint assertion messages requiring shape[0] == 10 for arg0,
# arg1 and arg2 respectively. The message text names no function.
# NOTE(review): presumably used by fuse_elemwise_add_1, judging by the
# neighbouring strings -- confirm at the sites that reference these labels.
# Each .size of 96 is the 95 message characters plus the terminating NUL.
.type .L.str.153,@object # @.str.153
.L.str.153:
.asciz "Assert fail: (int32(arg0.shape[0]) == 10), Argument arg0.shape[0] has an unsatisfied constraint"
.size .L.str.153, 96
.type .L.str.154,@object # @.str.154
.L.str.154:
.asciz "Assert fail: (int32(arg1.shape[0]) == 10), Argument arg1.shape[0] has an unsatisfied constraint"
.size .L.str.154, 96
.type .L.str.155,@object # @.str.155
.L.str.155:
.asciz "Assert fail: (int32(arg2.shape[0]) == 10), Argument arg2.shape[0] has an unsatisfied constraint"
.size .L.str.155, 96
# Assertion message for fuse_softmax's argument-count check (num_args must
# be 2). NUL-terminated; .size is the 64 message characters plus the NUL.
.type .L.str.156,@object # @.str.156
.L.str.156:
.asciz "Assert fail: (num_args == 2), fuse_softmax: num_args should be 2"
.size .L.str.156, 65
# Compact-stride assertion message for arg0: strides[1] == 1 and
# strides[0] == 10. The message text names no function.
# NOTE(review): presumably used by fuse_softmax, judging by the neighbouring
# strings -- confirm at the sites that reference this label.
# .size is the 122 message characters plus the terminating NUL.
.type .L.str.157,@object # @.str.157
.L.str.157:
.asciz "Assert fail: ((1 == int32(arg0.strides[1])) && (10 == int32(arg0.strides[0]))), arg0.strides: expected to be compact array"
.size .L.str.157, 123
# Assertion messages for fuse_softmax's argument type-code checks, one string
# per argument (arg0, arg1). Each message states that argN.code must be one
# of 3, 13, 7 or 4. NUL-terminated; the .size of 140 is the 139 message
# characters plus the terminating NUL.
.type .L.str.158,@object # @.str.158
.L.str.158:
.asciz "Assert fail: ((((arg0.code == 3) || (arg0.code == 13)) || (arg0.code == 7)) || (arg0.code == 4)), fuse_softmax: Expect arg[0] to be pointer"
.size .L.str.158, 140
.type .L.str.159,@object # @.str.159
.L.str.159:
.asciz "Assert fail: ((((arg1.code == 3) || (arg1.code == 13)) || (arg1.code == 7)) || (arg1.code == 4)), fuse_softmax: Expect arg[1] to be pointer"
.size .L.str.159, 140
# Shape-constraint assertion message: arg0.shape[1] == 10. The message text
# names no function.
# NOTE(review): presumably used by fuse_softmax, judging by the neighbouring
# strings -- confirm at the sites that reference this label.
# .size is the 95 message characters plus the terminating NUL.
.type .L.str.160,@object # @.str.160
.L.str.160:
.asciz "Assert fail: (int32(arg0.shape[1]) == 10), Argument arg0.shape[1] has an unsatisfied constraint"
.size .L.str.160, 96
# __tvm_main__: weak data object holding the NUL-terminated string
# "fuse_reshape" (12 characters + NUL = 13 bytes), which is the name of the
# first function defined in this file.
# NOTE(review): presumably read by the TVM runtime to find the module's entry
# function -- confirm against the TVM runtime documentation.
.type __tvm_main__,@object # @__tvm_main__
.weak __tvm_main__
__tvm_main__:
.asciz "fuse_reshape"
.size __tvm_main__, 13
# Switch to an empty .note.GNU-stack section with no flags. By GNU toolchain
# convention this marks the object as not needing an executable stack.
.section ".note.GNU-stack","",@progbits
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment