Last active
August 21, 2019 06:55
-
-
Save BeMg/342c3a3b4cdd561492a199295cb68080 to your computer and use it in GitHub Desktop.
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
| .text | |
| .file "fuse_reshape" | |
# -----------------------------------------------------------------------------
# fuse_reshape: validates its arguments, then calls fuse_reshape_compute_.
#
# In:   a0 = pointer to an array of 8-byte argument slots (slots 0 and 1 are read)
#       a1 = pointer to an array of 32-bit type codes (entries 0 and 1 are read)
#       a2 = argument count (only the low 32 bits are compared; must equal 2)
# Out:  a0 = 0 after fuse_reshape_compute_ returns;
#       a0 = 0x00000000FFFFFFFF (low 32 bits all ones) when any check fails, after
#       calling the function pointer stored at __TVMAPISetLastError with the
#       address of one of the .L.str* message strings in a0.
# Frame: 16 bytes; saves ra and s0 (s0 is used as a scratch constant register).
#
# NOTE(review): the offsets read from each argument object (0, 8, 12, 16, 20-22,
# 24, 32, 40) look like the DLPack DLTensor layout (data, ctx, ndim, dtype,
# shape, strides, byte_offset) -- confirm against the DLPack header in use.
# -----------------------------------------------------------------------------
| .globl fuse_reshape # -- Begin function fuse_reshape | |
| .p2align 2 | |
| .type fuse_reshape,@function | |
| fuse_reshape: # @fuse_reshape | |
| .cfi_startproc | |
| # %bb.0: # %entry | |
| addi sp, sp, -16 | |
| .cfi_def_cfa_offset 16 | |
| sd ra, 8(sp) | |
| sd s0, 0(sp) | |
| .cfi_offset ra, -8 | |
| .cfi_offset s0, -16 | |
# Zero-extend the low 32 bits of the argument count and require it to be 2.
| slli a2, a2, 32 | |
| srli a2, a2, 32 | |
| addi a3, zero, 2 | |
| bne a2, a3, .LBB0_38 | |
| # %bb.1: # %assert_end | |
# t3/t2 = type codes 0/1; a5/a2 = argument slots 0/1 (used as object pointers).
# From argument 0: a7 = field at offset 24, a1 = field at offset 0 (later passed
# to the compute call), a0 = field at offset 32 (may be null).
| lwu t2, 4(a1) | |
| ld a2, 8(a0) | |
| lwu t3, 0(a1) | |
| ld a5, 0(a0) | |
| ld a7, 24(a5) | |
| ld a1, 0(a5) | |
| ld a0, 32(a5) | |
| beqz a0, .LBB0_4 | |
| # %bb.2: # %if_then | |
# Offset-32 array of argument 0 is present: its first two 8-byte entries must be
# 784 (32-bit compare) and 1 (low 32 bits). Presumably compact strides -- confirm.
| lw a3, 0(a0) | |
| addi s0, zero, 784 | |
| bne a3, s0, .LBB0_39 | |
| # %bb.3: # %if_then | |
| ld a0, 8(a0) | |
| slli a0, a0, 32 | |
| srli a0, a0, 32 | |
| addi a3, zero, 1 | |
| bne a0, a3, .LBB0_39 | |
| .LBB0_4: # %if_end | |
# From argument 1: t0 = field at offset 24, a0 = field at offset 0 (first
# argument of the compute call), a3 = field at offset 32 (may be null).
# From argument 0: a6 = 32-bit field at offset 12, t1 = 32-bit field at offset 8.
| ld t0, 24(a2) | |
| ld a0, 0(a2) | |
| lwu a6, 12(a5) | |
| lwu t1, 8(a5) | |
| ld a3, 32(a2) | |
| beqz a3, .LBB0_9 | |
| # %bb.5: # %if_then3 | |
# Offset-32 array of argument 1 is present: entries must be 784, 784, 28, 1.
| lw a4, 0(a3) | |
| addi s0, zero, 784 | |
| bne a4, s0, .LBB0_40 | |
| # %bb.6: # %if_then3 | |
| ld a4, 8(a3) | |
| slli a4, a4, 32 | |
| srli a4, a4, 32 | |
| bne a4, s0, .LBB0_40 | |
| # %bb.7: # %if_then3 | |
| ld a4, 16(a3) | |
| slli a4, a4, 32 | |
| srli a4, a4, 32 | |
| addi s0, zero, 28 | |
| bne a4, s0, .LBB0_40 | |
| # %bb.8: # %if_then3 | |
| ld a3, 24(a3) | |
| slli a3, a3, 32 | |
| srli a3, a3, 32 | |
| addi a4, zero, 1 | |
| bne a3, a4, .LBB0_40 | |
| .LBB0_9: # %if_end4 | |
# Type code 0 must be <= 13 and have its bit set in the mask
# (2 << 12) + 152 = 0x2098, i.e. it must be one of 3, 4, 7 or 13.
| addi a3, zero, 13 | |
| bltu a3, t3, .LBB0_33 | |
| # %bb.10: # %if_end4 | |
| addi a3, zero, 1 | |
| sll a3, a3, t3 | |
| lui a4, 2 | |
| addiw a4, a4, 152 | |
| and a3, a3, a4 | |
| beqz a3, .LBB0_33 | |
| # %bb.11: # %assert_end8 | |
# Same membership test for type code 1.
| addi a3, zero, 13 | |
| bltu a3, t2, .LBB0_34 | |
| # %bb.12: # %assert_end8 | |
| addi a3, zero, 1 | |
| sll a4, a3, t2 | |
| lui s0, 2 | |
| addiw s0, s0, 152 | |
| and a4, a4, s0 | |
| beqz a4, .LBB0_34 | |
| # %bb.13: # %assert_end10 | |
# Argument 0: 32-bit field at offset 8 must equal 1 (a3 still holds 1).
| bne t1, a3, .LBB0_41 | |
| # %bb.14: # %assert_end12 | |
# Argument 0: 32-bit field at offset 16 must equal 2.
| lw a3, 16(a5) | |
| addi a4, zero, 2 | |
| bne a3, a4, .LBB0_42 | |
| # %bb.15: # %assert_end14 | |
# Argument 0: halfword at 22 == 1, byte at 21 == 32, byte at 20 == 2.
# s0 = 1 is also what the shared failure tail .LBB0_55 turns into the return value.
| lhu a3, 22(a5) | |
| addi s0, zero, 1 | |
| bne a3, s0, .LBB0_43 | |
| # %bb.16: # %assert_end14 | |
| lbu a3, 21(a5) | |
| addi a4, zero, 32 | |
| bne a3, a4, .LBB0_43 | |
| # %bb.17: # %assert_end14 | |
| lbu a3, 20(a5) | |
| addi a4, zero, 2 | |
| bne a3, a4, .LBB0_43 | |
| # %bb.18: # %assert_end16 | |
# Argument 0: offset-24 array entries (low 32 bits of each 8-byte slot) must be 1, 784.
| lw a3, 0(a7) | |
| addi s0, zero, 1 | |
| bne a3, s0, .LBB0_44 | |
| # %bb.19: # %assert_end18 | |
| lw a3, 8(a7) | |
| addi a4, zero, 784 | |
| bne a3, a4, .LBB0_45 | |
| # %bb.20: # %assert_end20 | |
# Argument 0: 8-byte field at offset 40 must be zero.
| ld a3, 40(a5) | |
| bnez a3, .LBB0_46 | |
| # %bb.21: # %assert_end22 | |
# Argument 1: 32-bit field at offset 16 must equal 4.
| lw a3, 16(a2) | |
| addi a4, zero, 4 | |
| bne a3, a4, .LBB0_47 | |
| # %bb.22: # %assert_end24 | |
# Argument 1: halfword at 22 == 1, byte at 21 == 32, byte at 20 == 2.
| lhu a3, 22(a2) | |
| addi s0, zero, 1 | |
| bne a3, s0, .LBB0_48 | |
| # %bb.23: # %assert_end24 | |
| lbu a3, 21(a2) | |
| addi a4, zero, 32 | |
| bne a3, a4, .LBB0_48 | |
| # %bb.24: # %assert_end24 | |
| lbu a3, 20(a2) | |
| addi a4, zero, 2 | |
| bne a3, a4, .LBB0_48 | |
| # %bb.25: # %assert_end26 | |
# Argument 1: offset-24 array entries must be 1, 1, 28, 28.
| lw a3, 0(t0) | |
| addi s0, zero, 1 | |
| bne a3, s0, .LBB0_49 | |
| # %bb.26: # %assert_end28 | |
| lw a3, 8(t0) | |
| bne a3, s0, .LBB0_50 | |
| # %bb.27: # %assert_end30 | |
| lw a4, 16(t0) | |
| addi a3, zero, 28 | |
| bne a4, a3, .LBB0_51 | |
| # %bb.28: # %assert_end32 | |
| lw a4, 24(t0) | |
| bne a4, a3, .LBB0_52 | |
| # %bb.29: # %assert_end34 | |
# Argument 1: 8-byte field at offset 40 must be zero.
| ld a3, 40(a2) | |
| bnez a3, .LBB0_53 | |
| # %bb.30: # %assert_end36 | |
# Argument 1: 32-bit field at offset 8 must equal 1.
| lw a3, 8(a2) | |
| addi s0, zero, 1 | |
| bne a3, s0, .LBB0_54 | |
| # %bb.31: # %assert_end38 | |
# Argument 1's 32-bit field at offset 12 must match argument 0's (held in a6).
| lw a2, 12(a2) | |
| sext.w a3, a6 | |
| bne a3, a2, .LBB0_56 | |
| # %bb.32: # %assert_end40 | |
# All checks passed: a0 = offset-0 field of argument 1, a1 = offset-0 field of
# argument 0. Return 0 afterwards.
| call fuse_reshape_compute_ | |
| mv a0, zero | |
| j .LBB0_37 | |
# Failure blocks. Each one loads the function pointer stored at
# __TVMAPISetLastError into a1 and the address of its message string into a0,
# then joins one of two shared tails (.LBB0_35 or .LBB0_55).
| .LBB0_33: # %assert_fail7 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.3) | |
| addi a0, a0, %lo(.L.str.3) | |
| j .LBB0_35 | |
| .LBB0_34: # %assert_fail9 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.4) | |
| addi a0, a0, %lo(.L.str.4) | |
# Shared tail: report the error, then build a0 = (1 << 32) - 1.
| .LBB0_35: # %assert_fail | |
| jalr a1 | |
| addi a0, zero, 1 | |
| slli a0, a0, 32 | |
| .LBB0_36: # %assert_fail15 | |
| addi a0, a0, -1 | |
# Common epilogue for both the success and the failure paths.
| .LBB0_37: # %assert_fail15 | |
| ld s0, 0(sp) | |
| ld ra, 8(sp) | |
| .cfi_restore ra | |
| .cfi_restore s0 | |
| addi sp, sp, 16 | |
| .cfi_def_cfa_offset 0 | |
| ret | |
| .LBB0_38: # %assert_fail | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str) | |
| addi a0, a0, %lo(.L.str) | |
| j .LBB0_35 | |
| .LBB0_39: # %assert_fail1 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.1) | |
| addi a0, a0, %lo(.L.str.1) | |
| j .LBB0_35 | |
| .LBB0_40: # %assert_fail5 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.2) | |
| addi a0, a0, %lo(.L.str.2) | |
| j .LBB0_35 | |
| .LBB0_41: # %assert_fail11 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.5) | |
| addi a0, a0, %lo(.L.str.5) | |
| j .LBB0_35 | |
| .LBB0_42: # %assert_fail13 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.6) | |
| addi a0, a0, %lo(.L.str.6) | |
| j .LBB0_35 | |
| .LBB0_43: # %assert_fail15 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.7) | |
| addi a0, a0, %lo(.L.str.7) | |
| j .LBB0_55 | |
| .LBB0_44: # %assert_fail17 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.8) | |
| addi a0, a0, %lo(.L.str.8) | |
| j .LBB0_55 | |
| .LBB0_45: # %assert_fail19 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.9) | |
| addi a0, a0, %lo(.L.str.9) | |
| j .LBB0_35 | |
| .LBB0_46: # %assert_fail21 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.10) | |
| addi a0, a0, %lo(.L.str.10) | |
| j .LBB0_35 | |
| .LBB0_47: # %assert_fail23 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.11) | |
| addi a0, a0, %lo(.L.str.11) | |
| j .LBB0_35 | |
| .LBB0_48: # %assert_fail25 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.12) | |
| addi a0, a0, %lo(.L.str.12) | |
| j .LBB0_55 | |
| .LBB0_49: # %assert_fail27 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.13) | |
| addi a0, a0, %lo(.L.str.13) | |
| j .LBB0_55 | |
| .LBB0_50: # %assert_fail29 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.14) | |
| addi a0, a0, %lo(.L.str.14) | |
| j .LBB0_35 | |
| .LBB0_51: # %assert_fail31 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.15) | |
| addi a0, a0, %lo(.L.str.15) | |
| j .LBB0_35 | |
| .LBB0_52: # %assert_fail33 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.16) | |
| addi a0, a0, %lo(.L.str.16) | |
| j .LBB0_35 | |
| .LBB0_53: # %assert_fail35 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.17) | |
| addi a0, a0, %lo(.L.str.17) | |
| j .LBB0_35 | |
| .LBB0_54: # %assert_fail37 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.18) | |
| addi a0, a0, %lo(.L.str.18) | |
# Alternate shared tail: s0 survives the call (callee-saved) and holds 1 on
# every branch that reaches here, so a0 = (s0 << 32) - 1 gives the same value
# as the .LBB0_35 tail.
| .LBB0_55: # %assert_fail15 | |
| jalr a1 | |
| slli a0, s0, 32 | |
| j .LBB0_36 | |
| .LBB0_56: # %assert_fail39 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.19) | |
| addi a0, a0, %lo(.L.str.19) | |
| j .LBB0_35 | |
| .Lfunc_end0: | |
| .size fuse_reshape, .Lfunc_end0-fuse_reshape | |
| .cfi_endproc | |
| # -- End function | |
# -----------------------------------------------------------------------------
# fuse_reshape_compute_: copy 3136 contiguous bytes from a1 to a0.
#
# In:    a0 = destination pointer
#        a1 = source pointer
# Out:   whatever memcpy leaves in a0 (the in-file caller, fuse_reshape, discards
#        it and overwrites a0 with zero).
# Clobb: caller-saved registers only (via memcpy and the `tail` pseudo-instruction).
# Stack: none; the function tail-calls memcpy, so no frame is needed.
#
# The previous body issued 28 separate memcpy calls of 112 bytes at offsets
# 0, 112, ..., 3024 applied identically to both pointers. Those chunks are
# back-to-back, so one 3136-byte (28 * 112) copy writes the same bytes.
# NOTE(review): this assumes the two buffers do not overlap (memcpy's usual
# precondition) -- confirm no caller passes aliasing buffers.
# -----------------------------------------------------------------------------
| .globl fuse_reshape_compute_ # -- Begin function fuse_reshape_compute_ | |
| .p2align 2 | |
| .type fuse_reshape_compute_,@function | |
| fuse_reshape_compute_: # @fuse_reshape_compute_ | |
| # %bb.0: # %entry | |
| lui a2, 1 # a2 = 4096 | |
| addiw a2, a2, -960 # a2 = 3136 = 28 * 112 bytes (too large for one addi) | |
| tail memcpy # memcpy(a0, a1, 3136); returns directly to our caller | |
| .Lfunc_end1: | |
| .size fuse_reshape_compute_, .Lfunc_end1-fuse_reshape_compute_ | |
| # -- End function | |
# -----------------------------------------------------------------------------
# fuse_conv2d: validates its four arguments, then calls fuse_conv2d_compute_.
#
# In:   a0 = pointer to an array of 8-byte argument slots (slots 0..3 are read)
#       a1 = pointer to an array of 32-bit type codes (entries 0..3 are read)
#       a2 = argument count (only the low 32 bits are compared; must equal 4)
# Out:  a0 = 0 after fuse_conv2d_compute_ returns;
#       a0 = 0x00000000FFFFFFFF (low 32 bits all ones) when any check fails, after
#       calling the function pointer stored at __TVMAPISetLastError with the
#       address of one of the .L.str* message strings in a0.
# Frame: 64 bytes; saves ra and s0-s5.
#
# NOTE(review): the offsets read from each argument object (0, 8, 12, 16, 20-22,
# 24, 32, 40) look like the DLPack DLTensor layout (data, ctx, ndim, dtype,
# shape, strides, byte_offset) -- confirm against the DLPack header in use.
# -----------------------------------------------------------------------------
| .globl fuse_conv2d # -- Begin function fuse_conv2d | |
| .p2align 2 | |
| .type fuse_conv2d,@function | |
| fuse_conv2d: # @fuse_conv2d | |
| .cfi_startproc | |
| # %bb.0: # %entry | |
| addi sp, sp, -64 | |
| .cfi_def_cfa_offset 64 | |
| sd ra, 56(sp) | |
| sd s0, 48(sp) | |
| sd s1, 40(sp) | |
| sd s2, 32(sp) | |
| sd s3, 24(sp) | |
| sd s4, 16(sp) | |
| sd s5, 8(sp) | |
| .cfi_offset ra, -8 | |
| .cfi_offset s0, -16 | |
| .cfi_offset s1, -24 | |
| .cfi_offset s2, -32 | |
| .cfi_offset s3, -40 | |
| .cfi_offset s4, -48 | |
| .cfi_offset s5, -56 | |
# Zero-extend the low 32 bits of the argument count and require it to be 4.
| slli a2, a2, 32 | |
| srli a2, a2, 32 | |
| addi a3, zero, 4 | |
| bne a2, a3, .LBB2_74 | |
| # %bb.1: # %assert_end | |
# Type codes 0..3 -> s4, s3, t6, t5. Argument slots 0..3 -> s5, t3, a7, a6.
# From argument 0: t4 = field at offset 24, a0 = field at offset 0 (first
# argument of the compute call), a1 = field at offset 32 (may be null).
| lwu t5, 12(a1) | |
| ld a6, 24(a0) | |
| lwu t6, 8(a1) | |
| ld a7, 16(a0) | |
| lwu s3, 4(a1) | |
| ld t3, 8(a0) | |
| lwu s4, 0(a1) | |
| ld s5, 0(a0) | |
| ld t4, 24(s5) | |
| ld a0, 0(s5) | |
| ld a1, 32(s5) | |
| beqz a1, .LBB2_6 | |
| # %bb.2: # %if_then | |
# Offset-32 array of argument 0 is present: entries must be 784, 784, 28, 1.
# Presumably compact strides -- confirm.
| lw a3, 0(a1) | |
| addi a2, zero, 784 | |
| bne a3, a2, .LBB2_75 | |
| # %bb.3: # %if_then | |
| ld a3, 8(a1) | |
| slli a3, a3, 32 | |
| srli a3, a3, 32 | |
| bne a3, a2, .LBB2_75 | |
| # %bb.4: # %if_then | |
| ld a2, 16(a1) | |
| slli a2, a2, 32 | |
| srli a2, a2, 32 | |
| addi a3, zero, 28 | |
| bne a2, a3, .LBB2_75 | |
| # %bb.5: # %if_then | |
| ld a1, 24(a1) | |
| slli a1, a1, 32 | |
| srli a1, a1, 32 | |
| addi a2, zero, 1 | |
| bne a1, a2, .LBB2_75 | |
| .LBB2_6: # %if_end | |
# From argument 1: t2 = field at offset 24, a1 = field at offset 0 (second
# argument of the compute call), a2 = field at offset 32 (may be null).
# From argument 0: a4 = 32-bit field at offset 12, s2 = 32-bit field at offset 8.
| ld t2, 24(t3) | |
| ld a1, 0(t3) | |
| lwu a4, 12(s5) | |
| lwu s2, 8(s5) | |
| ld a2, 32(t3) | |
| beqz a2, .LBB2_11 | |
| # %bb.7: # %if_then3 | |
# Offset-32 array of argument 1 is present: entries must be 25, 25, 5, 1.
| lw s0, 0(a2) | |
| addi a3, zero, 25 | |
| bne s0, a3, .LBB2_76 | |
| # %bb.8: # %if_then3 | |
| ld s0, 8(a2) | |
| slli s0, s0, 32 | |
| srli s0, s0, 32 | |
| bne s0, a3, .LBB2_76 | |
| # %bb.9: # %if_then3 | |
| ld a3, 16(a2) | |
| slli a3, a3, 32 | |
| srli a3, a3, 32 | |
| addi s0, zero, 5 | |
| bne a3, s0, .LBB2_76 | |
| # %bb.10: # %if_then3 | |
| ld a2, 24(a2) | |
| slli a2, a2, 32 | |
| srli a2, a2, 32 | |
| addi a3, zero, 1 | |
| bne a2, a3, .LBB2_76 | |
| .LBB2_11: # %if_end4 | |
# From argument 2: t1 = field at offset 24, a3 = field at offset 0 (fourth
# argument of the compute call), a2 = field at offset 32 (may be null).
| ld t1, 24(a7) | |
| ld a3, 0(a7) | |
| ld a2, 32(a7) | |
| beqz a2, .LBB2_13 | |
| # %bb.12: # %if_then7 | |
# Offset-32 array of argument 2 is present: its first entry must be 1.
# s0 = 1 is also what the shared failure tail .LBB2_110 turns into the return value.
| lw a2, 0(a2) | |
| addi s0, zero, 1 | |
| bne a2, s0, .LBB2_77 | |
| .LBB2_13: # %if_end8 | |
# From argument 3: t0 = field at offset 24, a2 = field at offset 0 (third
# argument of the compute call), s0 = field at offset 32 (may be null).
| ld t0, 24(a6) | |
| ld a2, 0(a6) | |
| ld s0, 32(a6) | |
| beqz s0, .LBB2_18 | |
| # %bb.14: # %if_then11 | |
# Offset-32 array of argument 3 is present: entries must be
# (6 << 12) + 512 = 25088, 784, 28, 1.
| lui s1, 6 | |
| addiw s1, s1, 512 | |
| lw a5, 0(s0) | |
| bne a5, s1, .LBB2_78 | |
| # %bb.15: # %if_then11 | |
| ld a5, 8(s0) | |
| slli a5, a5, 32 | |
| srli a5, a5, 32 | |
| addi s1, zero, 784 | |
| bne a5, s1, .LBB2_78 | |
| # %bb.16: # %if_then11 | |
| ld a5, 16(s0) | |
| slli a5, a5, 32 | |
| srli a5, a5, 32 | |
| addi s1, zero, 28 | |
| bne a5, s1, .LBB2_78 | |
| # %bb.17: # %if_then11 | |
| ld a5, 24(s0) | |
| slli a5, a5, 32 | |
| srli a5, a5, 32 | |
| addi s0, zero, 1 | |
| bne a5, s0, .LBB2_78 | |
| .LBB2_18: # %if_end12 | |
# Each of the four type codes must be <= 13 and have its bit set in the mask
# (2 << 12) + 152 = 0x2098, i.e. it must be one of 3, 4, 7 or 13.
| addi a5, zero, 13 | |
| bltu a5, s4, .LBB2_67 | |
| # %bb.19: # %if_end12 | |
| addi a5, zero, 1 | |
| sll a5, a5, s4 | |
| lui s0, 2 | |
| addiw s0, s0, 152 | |
| and a5, a5, s0 | |
| beqz a5, .LBB2_67 | |
| # %bb.20: # %assert_end16 | |
| addi a5, zero, 13 | |
| bltu a5, s3, .LBB2_68 | |
| # %bb.21: # %assert_end16 | |
| addi a5, zero, 1 | |
| sll a5, a5, s3 | |
| lui s0, 2 | |
| addiw s0, s0, 152 | |
| and a5, a5, s0 | |
| beqz a5, .LBB2_68 | |
| # %bb.22: # %assert_end18 | |
| addi a5, zero, 13 | |
| bltu a5, t6, .LBB2_69 | |
| # %bb.23: # %assert_end18 | |
| addi a5, zero, 1 | |
| sll a5, a5, t6 | |
| lui s1, 2 | |
| addiw s1, s1, 152 | |
| and a5, a5, s1 | |
| beqz a5, .LBB2_69 | |
| # %bb.24: # %assert_end20 | |
| addi a5, zero, 13 | |
| bltu a5, t5, .LBB2_70 | |
| # %bb.25: # %assert_end20 | |
| addi s1, zero, 1 | |
| sll a5, s1, t5 | |
| lui s0, 2 | |
| addiw s0, s0, 152 | |
| and a5, a5, s0 | |
| beqz a5, .LBB2_70 | |
| # %bb.26: # %assert_end22 | |
# Argument 0: 32-bit field at offset 8 must equal 1 (s1 still holds 1).
| bne s2, s1, .LBB2_79 | |
| # %bb.27: # %assert_end24 | |
# Argument 0: 32-bit field at offset 16 must equal 4.
| lw a5, 16(s5) | |
| addi s1, zero, 4 | |
| bne a5, s1, .LBB2_80 | |
| # %bb.28: # %assert_end26 | |
# Argument 0: halfword at 22 == 1, byte at 21 == 32, byte at 20 == 2.
| lhu a5, 22(s5) | |
| addi s0, zero, 1 | |
| bne a5, s0, .LBB2_81 | |
| # %bb.29: # %assert_end26 | |
| lbu a5, 21(s5) | |
| addi s1, zero, 32 | |
| bne a5, s1, .LBB2_81 | |
| # %bb.30: # %assert_end26 | |
| lbu a5, 20(s5) | |
| addi s1, zero, 2 | |
| bne a5, s1, .LBB2_81 | |
| # %bb.31: # %assert_end28 | |
# Argument 0: offset-24 array entries (low 32 bits of each 8-byte slot) must be 1, 1, 28, 28.
| lw a5, 0(t4) | |
| addi s0, zero, 1 | |
| bne a5, s0, .LBB2_82 | |
| # %bb.32: # %assert_end30 | |
| lw a5, 8(t4) | |
| bne a5, s0, .LBB2_83 | |
| # %bb.33: # %assert_end32 | |
| lw a5, 16(t4) | |
| addi s1, zero, 28 | |
| bne a5, s1, .LBB2_84 | |
| # %bb.34: # %assert_end34 | |
| lw a5, 24(t4) | |
| bne a5, s1, .LBB2_85 | |
| # %bb.35: # %assert_end36 | |
# Argument 0: 8-byte field at offset 40 must be zero.
| ld a5, 40(s5) | |
| bnez a5, .LBB2_86 | |
| # %bb.36: # %assert_end38 | |
# Argument 1: 32-bit field at offset 16 must equal 4.
| lw a5, 16(t3) | |
| addi s1, zero, 4 | |
| bne a5, s1, .LBB2_87 | |
| # %bb.37: # %assert_end40 | |
# Argument 1: halfword at 22 == 1, byte at 21 == 32, byte at 20 == 2.
| lhu a5, 22(t3) | |
| addi s0, zero, 1 | |
| bne a5, s0, .LBB2_88 | |
| # %bb.38: # %assert_end40 | |
| lbu a5, 21(t3) | |
| addi s1, zero, 32 | |
| bne a5, s1, .LBB2_88 | |
| # %bb.39: # %assert_end40 | |
| lbu a5, 20(t3) | |
| addi s1, zero, 2 | |
| bne a5, s1, .LBB2_88 | |
| # %bb.40: # %assert_end42 | |
# Argument 1: offset-24 array entries must be 32, 1, 5, 5.
| lw a5, 0(t2) | |
| addi s1, zero, 32 | |
| bne a5, s1, .LBB2_89 | |
| # %bb.41: # %assert_end44 | |
| lw a5, 8(t2) | |
| addi s0, zero, 1 | |
| bne a5, s0, .LBB2_90 | |
| # %bb.42: # %assert_end46 | |
| lw s1, 16(t2) | |
| addi a5, zero, 5 | |
| bne s1, a5, .LBB2_91 | |
| # %bb.43: # %assert_end48 | |
| lw s1, 24(t2) | |
| bne s1, a5, .LBB2_92 | |
| # %bb.44: # %assert_end50 | |
# Argument 1: 8-byte field at offset 40 must be zero.
| ld a5, 40(t3) | |
| bnez a5, .LBB2_93 | |
| # %bb.45: # %assert_end52 | |
# Argument 1: 32-bit field at offset 8 must equal 1.
| lw a5, 8(t3) | |
| addi s0, zero, 1 | |
| bne a5, s0, .LBB2_94 | |
| # %bb.46: # %assert_end54 | |
# Argument 1's 32-bit field at offset 12 must match argument 0's (a4).
# a5 keeps the sign-extended copy for the same comparison on arguments 2 and 3.
| lw s1, 12(t3) | |
| sext.w a5, a4 | |
| bne a5, s1, .LBB2_95 | |
| # %bb.47: # %assert_end56 | |
# Argument 2: 32-bit field at offset 16 must equal 1.
| lw s1, 16(a7) | |
| addi s0, zero, 1 | |
| bne s1, s0, .LBB2_96 | |
| # %bb.48: # %assert_end58 | |
# Argument 2: halfword at 22 == 1, byte at 21 == 32, byte at 20 == 2.
| lhu s1, 22(a7) | |
| bne s1, s0, .LBB2_97 | |
| # %bb.49: # %assert_end58 | |
| lbu s1, 21(a7) | |
| addi s0, zero, 32 | |
| bne s1, s0, .LBB2_97 | |
| # %bb.50: # %assert_end58 | |
| lbu s1, 20(a7) | |
| addi s0, zero, 2 | |
| bne s1, s0, .LBB2_97 | |
| # %bb.51: # %assert_end60 | |
# Argument 2: first offset-24 array entry must be 32.
| lw s1, 0(t1) | |
| addi s0, zero, 32 | |
| bne s1, s0, .LBB2_98 | |
| # %bb.52: # %assert_end62 | |
# Argument 2: 8-byte field at offset 40 must be zero.
| ld s1, 40(a7) | |
| bnez s1, .LBB2_99 | |
| # %bb.53: # %assert_end64 | |
# Argument 2: 32-bit field at offset 8 must equal 1; offset 12 must match a5.
| lw s1, 8(a7) | |
| addi s0, zero, 1 | |
| bne s1, s0, .LBB2_100 | |
| # %bb.54: # %assert_end66 | |
| lw s1, 12(a7) | |
| bne a5, s1, .LBB2_101 | |
| # %bb.55: # %assert_end68 | |
# Argument 3: 32-bit field at offset 16 must equal 4.
| lw s1, 16(a6) | |
| addi s0, zero, 4 | |
| bne s1, s0, .LBB2_102 | |
| # %bb.56: # %assert_end70 | |
# Argument 3: halfword at 22 == 1, byte at 21 == 32, byte at 20 == 2.
# s2 = 1 is what the failure block .LBB2_103 turns into the return value.
| lhu s1, 22(a6) | |
| addi s2, zero, 1 | |
| bne s1, s2, .LBB2_103 | |
| # %bb.57: # %assert_end70 | |
| lbu s1, 21(a6) | |
| addi s0, zero, 32 | |
| bne s1, s0, .LBB2_103 | |
| # %bb.58: # %assert_end70 | |
| lbu s1, 20(a6) | |
| addi s0, zero, 2 | |
| bne s1, s0, .LBB2_103 | |
| # %bb.59: # %assert_end72 | |
# Argument 3: offset-24 array entries must be 1, 32, 28, 28.
| lw s1, 0(t0) | |
| addi s0, zero, 1 | |
| bne s1, s0, .LBB2_104 | |
| # %bb.60: # %assert_end74 | |
| lw s1, 8(t0) | |
| addi s0, zero, 32 | |
| bne s1, s0, .LBB2_105 | |
| # %bb.61: # %assert_end76 | |
| lw s0, 16(t0) | |
| addi s1, zero, 28 | |
| bne s0, s1, .LBB2_106 | |
| # %bb.62: # %assert_end78 | |
| lw s0, 24(t0) | |
| bne s0, s1, .LBB2_107 | |
| # %bb.63: # %assert_end80 | |
# Argument 3: 8-byte field at offset 40 must be zero.
| ld s1, 40(a6) | |
| bnez s1, .LBB2_108 | |
| # %bb.64: # %assert_end82 | |
# Argument 3: 32-bit field at offset 8 must equal 1; offset 12 must match a5.
| lw s1, 8(a6) | |
| addi s0, zero, 1 | |
| bne s1, s0, .LBB2_109 | |
| # %bb.65: # %assert_end84 | |
| lw s1, 12(a6) | |
| bne a5, s1, .LBB2_111 | |
| # %bb.66: # %assert_end86 | |
# All checks passed. a0..a3 = offset-0 fields of arguments 0, 1, 3 and 2
# respectively (note the 3/2 order). Return 0 afterwards.
| call fuse_conv2d_compute_ | |
| mv a0, zero | |
| j .LBB2_73 | |
# Failure blocks. Each one loads the function pointer stored at
# __TVMAPISetLastError into a1 and the address of its message string into a0,
# then joins a shared tail (.LBB2_71 or .LBB2_110); .LBB2_103 has its own tail.
| .LBB2_67: # %assert_fail15 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.25) | |
| addi a0, a0, %lo(.L.str.25) | |
| j .LBB2_71 | |
| .LBB2_68: # %assert_fail17 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.26) | |
| addi a0, a0, %lo(.L.str.26) | |
| j .LBB2_71 | |
| .LBB2_69: # %assert_fail19 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.27) | |
| addi a0, a0, %lo(.L.str.27) | |
| j .LBB2_71 | |
| .LBB2_70: # %assert_fail21 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.28) | |
| addi a0, a0, %lo(.L.str.28) | |
# Shared tail: report the error, then build a0 = (1 << 32) - 1.
| .LBB2_71: # %assert_fail | |
| jalr a1 | |
| addi a0, zero, 1 | |
| slli a0, a0, 32 | |
| .LBB2_72: # %assert_fail9 | |
| addi a0, a0, -1 | |
# Common epilogue for both the success and the failure paths.
| .LBB2_73: # %assert_fail9 | |
| ld s5, 8(sp) | |
| ld s4, 16(sp) | |
| ld s3, 24(sp) | |
| ld s2, 32(sp) | |
| ld s1, 40(sp) | |
| ld s0, 48(sp) | |
| ld ra, 56(sp) | |
| .cfi_restore ra | |
| .cfi_restore s0 | |
| .cfi_restore s1 | |
| .cfi_restore s2 | |
| .cfi_restore s3 | |
| .cfi_restore s4 | |
| .cfi_restore s5 | |
| addi sp, sp, 64 | |
| .cfi_def_cfa_offset 0 | |
| ret | |
| .LBB2_74: # %assert_fail | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.20) | |
| addi a0, a0, %lo(.L.str.20) | |
| j .LBB2_71 | |
| .LBB2_75: # %assert_fail1 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.21) | |
| addi a0, a0, %lo(.L.str.21) | |
| j .LBB2_71 | |
| .LBB2_76: # %assert_fail5 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.22) | |
| addi a0, a0, %lo(.L.str.22) | |
| j .LBB2_71 | |
| .LBB2_77: # %assert_fail9 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.23) | |
| addi a0, a0, %lo(.L.str.23) | |
| j .LBB2_110 | |
| .LBB2_78: # %assert_fail13 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.24) | |
| addi a0, a0, %lo(.L.str.24) | |
| j .LBB2_71 | |
| .LBB2_79: # %assert_fail23 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.5) | |
| addi a0, a0, %lo(.L.str.5) | |
| j .LBB2_71 | |
| .LBB2_80: # %assert_fail25 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.29) | |
| addi a0, a0, %lo(.L.str.29) | |
| j .LBB2_71 | |
| .LBB2_81: # %assert_fail27 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.7) | |
| addi a0, a0, %lo(.L.str.7) | |
| j .LBB2_110 | |
| .LBB2_82: # %assert_fail29 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.8) | |
| addi a0, a0, %lo(.L.str.8) | |
| j .LBB2_110 | |
| .LBB2_83: # %assert_fail31 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.30) | |
| addi a0, a0, %lo(.L.str.30) | |
| j .LBB2_71 | |
| .LBB2_84: # %assert_fail33 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.31) | |
| addi a0, a0, %lo(.L.str.31) | |
| j .LBB2_71 | |
| .LBB2_85: # %assert_fail35 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.32) | |
| addi a0, a0, %lo(.L.str.32) | |
| j .LBB2_71 | |
| .LBB2_86: # %assert_fail37 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.10) | |
| addi a0, a0, %lo(.L.str.10) | |
| j .LBB2_71 | |
| .LBB2_87: # %assert_fail39 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.11) | |
| addi a0, a0, %lo(.L.str.11) | |
| j .LBB2_71 | |
| .LBB2_88: # %assert_fail41 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.12) | |
| addi a0, a0, %lo(.L.str.12) | |
| j .LBB2_110 | |
| .LBB2_89: # %assert_fail43 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.33) | |
| addi a0, a0, %lo(.L.str.33) | |
| j .LBB2_71 | |
| .LBB2_90: # %assert_fail45 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.14) | |
| addi a0, a0, %lo(.L.str.14) | |
| j .LBB2_110 | |
| .LBB2_91: # %assert_fail47 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.34) | |
| addi a0, a0, %lo(.L.str.34) | |
| j .LBB2_71 | |
| .LBB2_92: # %assert_fail49 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.35) | |
| addi a0, a0, %lo(.L.str.35) | |
| j .LBB2_71 | |
| .LBB2_93: # %assert_fail51 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.17) | |
| addi a0, a0, %lo(.L.str.17) | |
| j .LBB2_71 | |
| .LBB2_94: # %assert_fail53 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.18) | |
| addi a0, a0, %lo(.L.str.18) | |
| j .LBB2_110 | |
| .LBB2_95: # %assert_fail55 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.19) | |
| addi a0, a0, %lo(.L.str.19) | |
| j .LBB2_71 | |
| .LBB2_96: # %assert_fail57 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.36) | |
| addi a0, a0, %lo(.L.str.36) | |
| j .LBB2_110 | |
| .LBB2_97: # %assert_fail59 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.37) | |
| addi a0, a0, %lo(.L.str.37) | |
| j .LBB2_71 | |
| .LBB2_98: # %assert_fail61 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.38) | |
| addi a0, a0, %lo(.L.str.38) | |
| j .LBB2_71 | |
| .LBB2_99: # %assert_fail63 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.39) | |
| addi a0, a0, %lo(.L.str.39) | |
| j .LBB2_71 | |
| .LBB2_100: # %assert_fail65 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.40) | |
| addi a0, a0, %lo(.L.str.40) | |
| j .LBB2_110 | |
| .LBB2_101: # %assert_fail67 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.41) | |
| addi a0, a0, %lo(.L.str.41) | |
| j .LBB2_71 | |
| .LBB2_102: # %assert_fail69 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.42) | |
| addi a0, a0, %lo(.L.str.42) | |
| j .LBB2_71 | |
# This block has its own tail: s2 survives the call (callee-saved) and holds 1
# on every branch that reaches here, so a0 = (s2 << 32) - 1.
| .LBB2_103: # %assert_fail71 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.43) | |
| addi a0, a0, %lo(.L.str.43) | |
| jalr a1 | |
| slli a0, s2, 32 | |
| j .LBB2_72 | |
| .LBB2_104: # %assert_fail73 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.44) | |
| addi a0, a0, %lo(.L.str.44) | |
| j .LBB2_110 | |
| .LBB2_105: # %assert_fail75 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.45) | |
| addi a0, a0, %lo(.L.str.45) | |
| j .LBB2_71 | |
| .LBB2_106: # %assert_fail77 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.46) | |
| addi a0, a0, %lo(.L.str.46) | |
| j .LBB2_71 | |
| .LBB2_107: # %assert_fail79 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.47) | |
| addi a0, a0, %lo(.L.str.47) | |
| j .LBB2_71 | |
| .LBB2_108: # %assert_fail81 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.48) | |
| addi a0, a0, %lo(.L.str.48) | |
| j .LBB2_71 | |
| .LBB2_109: # %assert_fail83 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.49) | |
| addi a0, a0, %lo(.L.str.49) | |
# Alternate shared tail: s0 survives the call (callee-saved) and holds 1 on
# every branch that reaches here, so a0 = (s0 << 32) - 1 gives the same value
# as the .LBB2_71 tail.
| .LBB2_110: # %assert_fail9 | |
| jalr a1 | |
| slli a0, s0, 32 | |
| j .LBB2_72 | |
| .LBB2_111: # %assert_fail85 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.50) | |
| addi a0, a0, %lo(.L.str.50) | |
| j .LBB2_71 | |
| .Lfunc_end2: | |
| .size fuse_conv2d, .Lfunc_end2-fuse_conv2d | |
| .cfi_endproc | |
| # -- End function | |
| .section .sdata,"aw",@progbits | |
| .p2align 2 # -- Begin function fuse_conv2d_compute_ | |
| .LCPI3_0: | |
| .word 0 # float 0 | |
| .text | |
| .globl fuse_conv2d_compute_ | |
| .p2align 2 | |
| .type fuse_conv2d_compute_,@function | |
| fuse_conv2d_compute_: # @fuse_conv2d_compute_ | |
| .cfi_startproc | |
| # %bb.0: # %entry | |
| addi sp, sp, -416 | |
| .cfi_def_cfa_offset 416 | |
| sd ra, 408(sp) | |
| sd s0, 400(sp) | |
| sd s1, 392(sp) | |
| sd s2, 384(sp) | |
| sd s3, 376(sp) | |
| sd s4, 368(sp) | |
| sd s5, 360(sp) | |
| sd s6, 352(sp) | |
| sd s7, 344(sp) | |
| sd s8, 336(sp) | |
| sd s9, 328(sp) | |
| sd s10, 320(sp) | |
| sd s11, 312(sp) | |
| .cfi_offset ra, -8 | |
| .cfi_offset s0, -16 | |
| .cfi_offset s1, -24 | |
| .cfi_offset s2, -32 | |
| .cfi_offset s3, -40 | |
| .cfi_offset s4, -48 | |
| .cfi_offset s5, -56 | |
| .cfi_offset s6, -64 | |
| .cfi_offset s7, -72 | |
| .cfi_offset s8, -80 | |
| .cfi_offset s9, -88 | |
| .cfi_offset s10, -96 | |
| .cfi_offset s11, -104 | |
| sd a3, 24(sp) | |
| sd a2, 16(sp) | |
| mv s6, a1 | |
| mv s7, a0 | |
| lui s0, 1 | |
| lui a0, 1 | |
| call _Znam | |
| mv s8, a0 | |
| addiw a0, s0, -896 | |
| call _Znam | |
| sd a0, 40(sp) | |
| lui a0, 25 | |
| addiw s5, a0, -2048 | |
| mv a0, s5 | |
| call _Znam | |
| mv s3, a0 | |
| mv a0, s5 | |
| call _Znam | |
| sd a0, 8(sp) | |
| addi s2, s7, -232 | |
| addi s1, zero, 27 | |
| lui a0, %hi(.LCPI3_0) | |
| addi a0, a0, %lo(.LCPI3_0) | |
| flw ft1, 0(a0) | |
| addi s0, zero, 32 | |
| mv s4, s8 | |
| mv s5, zero | |
| fsw ft1, 304(sp) | |
| addiw a0, s5, -2 | |
| bgeu s1, a0, .LBB3_4 | |
| .LBB3_1: # %for_body8.preheader | |
| slli a0, s5, 7 | |
| add a0, s8, a0 | |
| mv a1, zero | |
| addi a2, zero, 128 | |
| call memset | |
| flw ft1, 304(sp) | |
| .LBB3_2: # %for_end9 | |
| addi s4, s4, 128 | |
| addi s2, s2, 112 | |
| addi s5, s5, 1 | |
| beq s5, s0, .LBB3_8 | |
| # %bb.3: # %for_begin7.preheader | |
| addiw a0, s5, -2 | |
| bltu s1, a0, .LBB3_1 | |
| .LBB3_4: # %for_body8.us.preheader | |
| mv a0, s4 | |
| mv a1, s2 | |
| mv a2, zero | |
| j .LBB3_6 | |
| .LBB3_5: # %if_end11.us | |
| # in Loop: Header=BB3_6 Depth=1 | |
| fsw ft0, 0(a0) | |
| addi a0, a0, 4 | |
| addi a1, a1, 4 | |
| addi a2, a2, 1 | |
| beq a2, s0, .LBB3_2 | |
| .LBB3_6: # %for_body8.us | |
| # =>This Inner Loop Header: Depth=1 | |
| addiw a3, a2, -2 | |
| fmv.s ft0, ft1 | |
| bltu s1, a3, .LBB3_5 | |
| # %bb.7: # %if_then10.us | |
| # in Loop: Header=BB3_6 Depth=1 | |
| flw ft0, 0(a1) | |
| j .LBB3_5 | |
| .LBB3_8: # %for_begin12.preheader | |
| addi a0, s6, 400 | |
| ld a1, 40(sp) | |
| addi a1, a1, 80 | |
| addi a2, zero, 4 | |
| mv a3, zero | |
| .LBB3_9: # %for_begin15.preheader | |
| # =>This Loop Header: Depth=1 | |
| # Child Loop BB3_10 Depth 2 | |
| addi a4, zero, -100 | |
| mv a5, a1 | |
| .LBB3_10: # %for_begin18.preheader | |
| # Parent Loop BB3_9 Depth=1 | |
| # => This Inner Loop Header: Depth=2 | |
| add s0, a0, a4 | |
| flw ft0, -300(s0) | |
| fsw ft0, -80(a5) | |
| flw ft0, -200(s0) | |
| fsw ft0, -76(a5) | |
| flw ft0, -100(s0) | |
| fsw ft0, -72(a5) | |
| flw ft0, 0(s0) | |
| fsw ft0, -68(a5) | |
| flw ft0, 100(s0) | |
| fsw ft0, -64(a5) | |
| flw ft0, 200(s0) | |
| fsw ft0, -60(a5) | |
| flw ft0, 300(s0) | |
| fsw ft0, -56(a5) | |
| flw ft0, 400(s0) | |
| fsw ft0, -52(a5) | |
| flw ft0, -296(s0) | |
| fsw ft0, -48(a5) | |
| flw ft0, -196(s0) | |
| fsw ft0, -44(a5) | |
| flw ft0, -96(s0) | |
| fsw ft0, -40(a5) | |
| flw ft0, 4(s0) | |
| fsw ft0, -36(a5) | |
| flw ft0, 104(s0) | |
| fsw ft0, -32(a5) | |
| flw ft0, 204(s0) | |
| fsw ft0, -28(a5) | |
| flw ft0, 304(s0) | |
| fsw ft0, -24(a5) | |
| flw ft0, 404(s0) | |
| fsw ft0, -20(a5) | |
| flw ft0, -292(s0) | |
| fsw ft0, -16(a5) | |
| flw ft0, -192(s0) | |
| fsw ft0, -12(a5) | |
| flw ft0, -92(s0) | |
| fsw ft0, -8(a5) | |
| flw ft0, 8(s0) | |
| fsw ft0, -4(a5) | |
| flw ft0, 108(s0) | |
| fsw ft0, 0(a5) | |
| flw ft0, 208(s0) | |
| fsw ft0, 4(a5) | |
| flw ft0, 308(s0) | |
| fsw ft0, 8(a5) | |
| flw ft0, 408(s0) | |
| fsw ft0, 12(a5) | |
| flw ft0, -288(s0) | |
| fsw ft0, 16(a5) | |
| flw ft0, -188(s0) | |
| fsw ft0, 20(a5) | |
| flw ft0, -88(s0) | |
| fsw ft0, 24(a5) | |
| flw ft0, 12(s0) | |
| fsw ft0, 28(a5) | |
| flw ft0, 112(s0) | |
| fsw ft0, 32(a5) | |
| flw ft0, 212(s0) | |
| fsw ft0, 36(a5) | |
| flw ft0, 312(s0) | |
| fsw ft0, 40(a5) | |
| flw ft0, 412(s0) | |
| fsw ft0, 44(a5) | |
| flw ft0, -284(s0) | |
| fsw ft0, 48(a5) | |
| flw ft0, -184(s0) | |
| fsw ft0, 52(a5) | |
| flw ft0, -84(s0) | |
| fsw ft0, 56(a5) | |
| flw ft0, 16(s0) | |
| fsw ft0, 60(a5) | |
| flw ft0, 116(s0) | |
| fsw ft0, 64(a5) | |
| flw ft0, 216(s0) | |
| fsw ft0, 68(a5) | |
| flw ft0, 316(s0) | |
| fsw ft0, 72(a5) | |
| flw ft0, 416(s0) | |
| fsw ft0, 76(a5) | |
| addi a5, a5, 160 | |
| addi a4, a4, 20 | |
| bnez a4, .LBB3_10 | |
| # %bb.11: # %for_end17 | |
| # in Loop: Header=BB3_9 Depth=1 | |
| addi a0, a0, 800 | |
| addi a1, a1, 800 | |
| addi a3, a3, 1 | |
| bne a3, a2, .LBB3_9 | |
| # %bb.12: # %for_begin24.preheader | |
| sd s8, 288(sp) | |
| lui a0, 131072 | |
| addiw a0, a0, -1 | |
| sd a0, 32(sp) | |
| addi a6, zero, 28 | |
| addi a4, zero, 8 | |
| addi a5, zero, 4 | |
| addi a3, zero, 1 | |
| addi a0, zero, 2 | |
| addi a2, zero, 3 | |
| mv s0, zero | |
| .LBB3_13: # %for_begin27.preheader | |
| # =>This Loop Header: Depth=1 | |
| # Child Loop BB3_14 Depth 2 | |
| # Child Loop BB3_16 Depth 2 | |
| # Child Loop BB3_17 Depth 3 | |
| srli a1, s0, 3 | |
| ld s1, 32(sp) | |
| and a1, a1, s1 | |
| sd s0, 48(sp) | |
| andi s1, s0, 7 | |
| sd s1, 304(sp) | |
| sd a1, 248(sp) | |
| mul a1, a1, a6 | |
| sd a1, 160(sp) | |
| mv t3, zero | |
| .LBB3_14: # %for_begin30.preheader | |
| # Parent Loop BB3_13 Depth=1 | |
| # => This Inner Loop Header: Depth=2 | |
| ld a1, 160(sp) | |
| add a1, t3, a1 | |
| addi s1, zero, 224 | |
| mul a1, a1, s1 | |
| ld s1, 304(sp) | |
| or a1, a1, s1 | |
| sext.w s0, a1 | |
| slli s0, s0, 2 | |
| add s0, s3, s0 | |
| sw zero, 0(s0) | |
| ori s0, a1, 8 | |
| sext.w s0, s0 | |
| slli s0, s0, 2 | |
| add s0, s3, s0 | |
| sw zero, 0(s0) | |
| ori s0, a1, 16 | |
| sext.w s0, s0 | |
| slli s0, s0, 2 | |
| add s0, s3, s0 | |
| sw zero, 0(s0) | |
| ori s0, a1, 24 | |
| sext.w s0, s0 | |
| slli s0, s0, 2 | |
| add s0, s3, s0 | |
| sw zero, 0(s0) | |
| addiw s0, a1, 32 | |
| slli s0, s0, 2 | |
| add s0, s3, s0 | |
| sw zero, 0(s0) | |
| addiw s0, a1, 40 | |
| slli s0, s0, 2 | |
| add s0, s3, s0 | |
| sw zero, 0(s0) | |
| addiw s0, a1, 160 | |
| slli s1, s0, 2 | |
| sd s1, 280(sp) | |
| addiw s0, a1, 168 | |
| slli t1, s0, 2 | |
| addiw s0, a1, 176 | |
| slli t2, s0, 2 | |
| addiw s0, a1, 184 | |
| slli a7, s0, 2 | |
| addiw s0, a1, 192 | |
| slli t4, s0, 2 | |
| addiw s0, a1, 200 | |
| slli t5, s0, 2 | |
| addiw s0, a1, 208 | |
| slli t6, s0, 2 | |
| addiw s0, a1, 216 | |
| slli s2, s0, 2 | |
| addiw s0, a1, 104 | |
| slli s1, s0, 2 | |
| sd s1, 256(sp) | |
| addiw s0, a1, 112 | |
| slli s4, s0, 2 | |
| addiw s0, a1, 120 | |
| slli s5, s0, 2 | |
| addiw s0, a1, 128 | |
| slli s6, s0, 2 | |
| addiw s0, a1, 136 | |
| slli s7, s0, 2 | |
| addiw s0, a1, 144 | |
| slli s8, s0, 2 | |
| addiw s0, a1, 152 | |
| slli s9, s0, 2 | |
| addiw s0, a1, 64 | |
| slli s10, s0, 2 | |
| addiw s0, a1, 72 | |
| slli s11, s0, 2 | |
| addiw s0, a1, 80 | |
| slli s0, s0, 2 | |
| addiw a6, a1, 88 | |
| slli a6, a6, 2 | |
| addiw t0, a1, 96 | |
| slli t0, t0, 2 | |
| add s1, s3, s2 | |
| sd s1, 296(sp) | |
| add s1, s3, t6 | |
| sd s1, 272(sp) | |
| add s1, s3, t5 | |
| sd s1, 264(sp) | |
| add t6, s3, t4 | |
| add t5, s3, a7 | |
| add t4, s3, t2 | |
| add t2, s3, t1 | |
| ld s1, 280(sp) | |
| add t1, s3, s1 | |
| add s9, s3, s9 | |
| add s8, s3, s8 | |
| add s7, s3, s7 | |
| add s6, s3, s6 | |
| add s5, s3, s5 | |
| add s4, s3, s4 | |
| ld s1, 256(sp) | |
| add s1, s3, s1 | |
| add t0, s3, t0 | |
| add a6, s3, a6 | |
| add a7, s3, s0 | |
| add s11, s3, s11 | |
| add s10, s3, s10 | |
| addiw s2, a1, 56 | |
| slli s0, s2, 2 | |
| add s0, s3, s0 | |
| addiw a1, a1, 48 | |
| slli a1, a1, 2 | |
| add a1, s3, a1 | |
| sw zero, 0(a1) | |
| sw zero, 0(s0) | |
| sw zero, 0(s10) | |
| sw zero, 0(s11) | |
| sw zero, 0(a7) | |
| sw zero, 0(a6) | |
| sw zero, 0(t0) | |
| sw zero, 0(s1) | |
| sw zero, 0(s4) | |
| sw zero, 0(s5) | |
| sw zero, 0(s6) | |
| sw zero, 0(s7) | |
| sw zero, 0(s8) | |
| sw zero, 0(s9) | |
| sw zero, 0(t1) | |
| sw zero, 0(t2) | |
| sw zero, 0(t4) | |
| sw zero, 0(t5) | |
| sw zero, 0(t6) | |
| ld a1, 264(sp) | |
| sw zero, 0(a1) | |
| ld a1, 272(sp) | |
| sw zero, 0(a1) | |
| ld a1, 296(sp) | |
| sw zero, 0(a1) | |
| addi a1, t3, 1 | |
| addiw s0, t3, 1 | |
| mv t3, a1 | |
| addi a1, zero, 28 | |
| bltu s0, a1, .LBB3_14 | |
| # %bb.15: # %for_begin33.preheader | |
| # in Loop: Header=BB3_13 Depth=1 | |
| ld a1, 160(sp) | |
| addi a1, zero, 200 | |
| ld s1, 248(sp) | |
| mul a1, s1, a1 | |
| ld s1, 304(sp) | |
| or a1, a1, s1 | |
| addi s0, a1, 184 | |
| slli a6, s0, 32 | |
| addi s0, a1, 192 | |
| slli s0, s0, 32 | |
| srli a7, s0, 32 | |
| srli a6, a6, 32 | |
| addi s0, a1, 8 | |
| slli t0, s0, 32 | |
| addi s0, a1, 16 | |
| slli t1, s0, 32 | |
| addi s0, a1, 24 | |
| slli t2, s0, 32 | |
| addi s0, a1, 32 | |
| slli t3, s0, 32 | |
| addi s0, a1, 40 | |
| slli t4, s0, 32 | |
| addi s0, a1, 96 | |
| slli t5, s0, 32 | |
| addi s0, a1, 152 | |
| slli s1, s0, 32 | |
| sd s1, 280(sp) | |
| addi s0, a1, 48 | |
| slli s2, s0, 32 | |
| addi s0, a1, 56 | |
| slli s1, s0, 32 | |
| addi s0, a1, 64 | |
| slli s4, s0, 32 | |
| addi s0, a1, 72 | |
| slli s5, s0, 32 | |
| addi s0, a1, 80 | |
| slli s6, s0, 32 | |
| addi s0, a1, 88 | |
| slli s7, s0, 32 | |
| slli s0, a1, 32 | |
| srli s8, s0, 32 | |
| srli s0, t4, 32 | |
| sd s0, 296(sp) | |
| srli s0, t3, 32 | |
| sd s0, 256(sp) | |
| srli s0, t2, 32 | |
| sd s0, 248(sp) | |
| srli s0, t1, 32 | |
| sd s0, 240(sp) | |
| srli s0, t0, 32 | |
| sd s0, 232(sp) | |
| slli s0, a6, 2 | |
| sd s0, 264(sp) | |
| slli t0, a7, 2 | |
| addi s0, a1, 168 | |
| slli s9, s0, 32 | |
| addi s0, a1, 104 | |
| slli s10, s0, 32 | |
| addi s0, a1, 112 | |
| slli s11, s0, 32 | |
| addi s0, a1, 120 | |
| slli a6, s0, 32 | |
| addi t4, a1, 128 | |
| slli t4, t4, 32 | |
| addi t6, a1, 136 | |
| slli t6, t6, 32 | |
| addi t3, a1, 144 | |
| slli t3, t3, 32 | |
| slli s8, s8, 2 | |
| addi t2, a1, 160 | |
| slli t2, t2, 32 | |
| srli t5, t5, 32 | |
| srli s7, s7, 32 | |
| srli s6, s6, 32 | |
| srli s5, s5, 32 | |
| srli s4, s4, 32 | |
| srli s1, s1, 32 | |
| srli s2, s2, 32 | |
| ld s0, 280(sp) | |
| srli t1, s0, 32 | |
| srli t3, t3, 32 | |
| srli t6, t6, 32 | |
| srli t4, t4, 32 | |
| srli a7, a6, 32 | |
| srli s11, s11, 32 | |
| srli s10, s10, 32 | |
| srli s9, s9, 32 | |
| srli t2, t2, 32 | |
| ld a6, 40(sp) | |
| add s0, a6, s8 | |
| sd s0, 280(sp) | |
| add s0, a6, t0 | |
| sd s0, 272(sp) | |
| ld s0, 264(sp) | |
| add s0, a6, s0 | |
| sd s0, 264(sp) | |
| ld s0, 232(sp) | |
| slli s0, s0, 2 | |
| sd s0, 152(sp) | |
| ld s0, 240(sp) | |
| slli s0, s0, 2 | |
| sd s0, 144(sp) | |
| ld s0, 248(sp) | |
| slli s0, s0, 2 | |
| sd s0, 136(sp) | |
| ld s0, 256(sp) | |
| slli s0, s0, 2 | |
| sd s0, 80(sp) | |
| ld s0, 296(sp) | |
| slli s0, s0, 2 | |
| sd s0, 296(sp) | |
| slli s0, s2, 2 | |
| sd s0, 96(sp) | |
| slli s8, s1, 2 | |
| slli s2, s4, 2 | |
| slli s5, s5, 2 | |
| slli s4, s6, 2 | |
| slli t0, s7, 2 | |
| slli t5, t5, 2 | |
| slli s10, s10, 2 | |
| slli s6, s11, 2 | |
| slli s7, a7, 2 | |
| slli t4, t4, 2 | |
| slli t6, t6, 2 | |
| slli t3, t3, 2 | |
| slli s1, t1, 2 | |
| slli t2, t2, 2 | |
| slli s0, s9, 2 | |
| addi a1, a1, 176 | |
| slli a1, a1, 32 | |
| srli a1, a1, 32 | |
| slli a1, a1, 2 | |
| add a1, a6, a1 | |
| sd a1, 256(sp) | |
| add a1, a6, s0 | |
| sd a1, 248(sp) | |
| add a1, a6, t2 | |
| sd a1, 240(sp) | |
| add a1, a6, s1 | |
| sd a1, 232(sp) | |
| add a1, a6, t3 | |
| sd a1, 224(sp) | |
| add a1, a6, t6 | |
| sd a1, 216(sp) | |
| add a1, a6, t4 | |
| sd a1, 208(sp) | |
| add a1, a6, s7 | |
| sd a1, 200(sp) | |
| add a1, a6, s6 | |
| sd a1, 192(sp) | |
| add a1, a6, s10 | |
| sd a1, 184(sp) | |
| add a1, a6, t5 | |
| sd a1, 176(sp) | |
| add a1, a6, t0 | |
| sd a1, 168(sp) | |
| add a1, a6, s4 | |
| sd a1, 128(sp) | |
| add a1, a6, s5 | |
| sd a1, 120(sp) | |
| add a1, a6, s2 | |
| sd a1, 112(sp) | |
| add a1, a6, s8 | |
| sd a1, 104(sp) | |
| ld a1, 96(sp) | |
| add a1, a6, a1 | |
| sd a1, 88(sp) | |
| ld a1, 296(sp) | |
| add a1, a6, a1 | |
| sd a1, 96(sp) | |
| ld a1, 80(sp) | |
| add a1, a6, a1 | |
| sd a1, 80(sp) | |
| ld a1, 136(sp) | |
| add a1, a6, a1 | |
| sd a1, 72(sp) | |
| ld a1, 144(sp) | |
| add a1, a6, a1 | |
| sd a1, 64(sp) | |
| ld a1, 152(sp) | |
| add a1, a6, a1 | |
| sd a1, 56(sp) | |
| mv s4, zero | |
| mv s1, zero | |
| mv s0, zero | |
| .LBB3_16: # %for_begin36.preheader | |
| # Parent Loop BB3_13 Depth=1 | |
| # => This Loop Header: Depth=2 | |
| # Child Loop BB3_17 Depth 3 | |
| sd s1, 144(sp) | |
| ld a1, 160(sp) | |
| sd s0, 136(sp) | |
| add a1, s0, a1 | |
| addi s10, zero, 7 | |
| mul a1, a1, s10 | |
| sd a1, 296(sp) | |
| sd s4, 152(sp) | |
| mv t0, zero | |
| ld s8, 128(sp) | |
| ld s9, 120(sp) | |
| ld s11, 112(sp) | |
| ld s5, 104(sp) | |
| ld t3, 96(sp) | |
| ld t5, 88(sp) | |
| ld s6, 80(sp) | |
| ld t4, 72(sp) | |
| ld t6, 64(sp) | |
| ld s7, 56(sp) | |
| .LBB3_17: # %for_body37 | |
| # Parent Loop BB3_13 Depth=1 | |
| # Parent Loop BB3_16 Depth=2 | |
| # => This Inner Loop Header: Depth=3 | |
| ld a1, 296(sp) | |
| add s1, t0, a1 | |
| slli s1, s1, 5 | |
| ld a1, 304(sp) | |
| or s1, s1, a1 | |
| vsetvl a1, a5, a4 | |
| ld a1, 288(sp) | |
| add a7, a1, s4 | |
| vle.v v0, ( a7 ) | |
| ld a1, 280(sp) | |
| flw ft0, 0(a1) | |
| fmv.x.w a1, ft0 | |
| vmv.v.x v1, a1 | |
| vslide1up.vx v2, v1, a1 | |
| vslide1up.vx v1, v2, a1 | |
| vslide1up.vx v2, v1, a1 | |
| vslide1up.vx v1, v2, a1 | |
| ori a1, s1, 24 | |
| sext.w a1, a1 | |
| slli a1, a1, 2 | |
| add a6, s3, a1 | |
| flw ft0, 0(a6) | |
| fmv.x.w a1, ft0 | |
| sext.w s0, s1 | |
| slli s0, s0, 2 | |
| add t1, s3, s0 | |
| flw ft0, 0(t1) | |
| fmv.x.w s0, ft0 | |
| vmv.v.x v2, s0 | |
| vslide1up.vx v3, v2, a1 | |
| vfmul.vv v0, v0, v1 | |
| ori a1, s1, 16 | |
| sext.w a1, a1 | |
| slli a1, a1, 2 | |
| add s2, s3, a1 | |
| flw ft0, 0(s2) | |
| fmv.x.w a1, ft0 | |
| vslide1up.vx v1, v3, a1 | |
| ori a1, s1, 8 | |
| sext.w a1, a1 | |
| slli a1, a1, 2 | |
| add t2, s3, a1 | |
| flw ft0, 0(t2) | |
| fmv.x.w a1, ft0 | |
| vslide1up.vx v2, v1, a1 | |
| vslide1up.vx v1, v2, s0 | |
| vfadd.vv v0, v0, v1 | |
| vslideup.vx v1, v0, zero | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(t1) | |
| vslideup.vx v1, v0, a3 | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(t2) | |
| vslideup.vx v1, v0, a0 | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(s2) | |
| vslideup.vx v1, v0, a2 | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(a6) | |
| vsetvl a1, a5, a4 | |
| addi a1, a7, 4 | |
| vle.v v0, ( a1 ) | |
| flw ft0, 0(a6) | |
| fmv.x.w a1, ft0 | |
| flw ft0, 0(t1) | |
| fmv.x.w s0, ft0 | |
| vmv.v.x v1, s0 | |
| vslide1up.vx v2, v1, a1 | |
| flw ft0, 0(s2) | |
| fmv.x.w a1, ft0 | |
| vslide1up.vx v1, v2, a1 | |
| flw ft0, 0(t2) | |
| fmv.x.w a1, ft0 | |
| vslide1up.vx v2, v1, a1 | |
| vslide1up.vx v1, v2, s0 | |
| flw ft0, 0(s7) | |
| fmv.x.w a1, ft0 | |
| vmv.v.x v2, a1 | |
| vslide1up.vx v3, v2, a1 | |
| vslide1up.vx v2, v3, a1 | |
| vslide1up.vx v3, v2, a1 | |
| vslide1up.vx v2, v3, a1 | |
| vfmul.vv v0, v0, v2 | |
| vfadd.vv v0, v0, v1 | |
| vslideup.vx v1, v0, zero | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(t1) | |
| vslideup.vx v1, v0, a3 | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(t2) | |
| vslideup.vx v1, v0, a0 | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(s2) | |
| vslideup.vx v1, v0, a2 | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(a6) | |
| vsetvl a1, a5, a4 | |
| addi a1, a7, 8 | |
| vle.v v0, ( a1 ) | |
| flw ft0, 0(a6) | |
| fmv.x.w a1, ft0 | |
| flw ft0, 0(t1) | |
| fmv.x.w s0, ft0 | |
| vmv.v.x v1, s0 | |
| vslide1up.vx v2, v1, a1 | |
| flw ft0, 0(s2) | |
| fmv.x.w a1, ft0 | |
| vslide1up.vx v1, v2, a1 | |
| flw ft0, 0(t2) | |
| fmv.x.w a1, ft0 | |
| vslide1up.vx v2, v1, a1 | |
| vslide1up.vx v1, v2, s0 | |
| flw ft0, 0(t6) | |
| fmv.x.w a1, ft0 | |
| vmv.v.x v2, a1 | |
| vslide1up.vx v3, v2, a1 | |
| vslide1up.vx v2, v3, a1 | |
| vslide1up.vx v3, v2, a1 | |
| vslide1up.vx v2, v3, a1 | |
| vfmul.vv v0, v0, v2 | |
| vfadd.vv v0, v0, v1 | |
| vslideup.vx v1, v0, zero | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(t1) | |
| vslideup.vx v1, v0, a3 | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(t2) | |
| vslideup.vx v1, v0, a0 | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(s2) | |
| vslideup.vx v1, v0, a2 | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(a6) | |
| vsetvl a1, a5, a4 | |
| addi a1, a7, 12 | |
| vle.v v0, ( a1 ) | |
| flw ft0, 0(a6) | |
| fmv.x.w a1, ft0 | |
| flw ft0, 0(t1) | |
| fmv.x.w s0, ft0 | |
| vmv.v.x v1, s0 | |
| vslide1up.vx v2, v1, a1 | |
| flw ft0, 0(s2) | |
| fmv.x.w a1, ft0 | |
| vslide1up.vx v1, v2, a1 | |
| flw ft0, 0(t2) | |
| fmv.x.w a1, ft0 | |
| vslide1up.vx v2, v1, a1 | |
| vslide1up.vx v1, v2, s0 | |
| flw ft0, 0(t4) | |
| fmv.x.w a1, ft0 | |
| vmv.v.x v2, a1 | |
| vslide1up.vx v3, v2, a1 | |
| vslide1up.vx v2, v3, a1 | |
| vslide1up.vx v3, v2, a1 | |
| vslide1up.vx v2, v3, a1 | |
| vfmul.vv v0, v0, v2 | |
| vfadd.vv v0, v0, v1 | |
| vslideup.vx v1, v0, zero | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(t1) | |
| vslideup.vx v1, v0, a3 | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(t2) | |
| vslideup.vx v1, v0, a0 | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(s2) | |
| vslideup.vx v1, v0, a2 | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(a6) | |
| vsetvl a1, a5, a4 | |
| addi a1, a7, 16 | |
| vle.v v0, ( a1 ) | |
| flw ft0, 0(a6) | |
| fmv.x.w a1, ft0 | |
| flw ft0, 0(t1) | |
| fmv.x.w s0, ft0 | |
| vmv.v.x v1, s0 | |
| vslide1up.vx v2, v1, a1 | |
| flw ft0, 0(s2) | |
| fmv.x.w a1, ft0 | |
| vslide1up.vx v1, v2, a1 | |
| flw ft0, 0(t2) | |
| fmv.x.w a1, ft0 | |
| vslide1up.vx v2, v1, a1 | |
| vslide1up.vx v1, v2, s0 | |
| flw ft0, 0(s6) | |
| fmv.x.w a1, ft0 | |
| vmv.v.x v2, a1 | |
| vslide1up.vx v3, v2, a1 | |
| vslide1up.vx v2, v3, a1 | |
| vslide1up.vx v3, v2, a1 | |
| vslide1up.vx v2, v3, a1 | |
| vfmul.vv v0, v0, v2 | |
| vfadd.vv v0, v0, v1 | |
| vslideup.vx v1, v0, zero | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(t1) | |
| vslideup.vx v1, v0, a3 | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(t2) | |
| vslideup.vx v1, v0, a0 | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(s2) | |
| vslideup.vx v1, v0, a2 | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(a6) | |
| vsetvl a1, a5, a4 | |
| addi a1, a7, 128 | |
| vle.v v0, ( a1 ) | |
| flw ft0, 0(a6) | |
| fmv.x.w a1, ft0 | |
| flw ft0, 0(t1) | |
| fmv.x.w s0, ft0 | |
| vmv.v.x v1, s0 | |
| vslide1up.vx v2, v1, a1 | |
| flw ft0, 0(s2) | |
| fmv.x.w a1, ft0 | |
| vslide1up.vx v1, v2, a1 | |
| flw ft0, 0(t2) | |
| fmv.x.w a1, ft0 | |
| vslide1up.vx v2, v1, a1 | |
| vslide1up.vx v1, v2, s0 | |
| flw ft0, 0(t3) | |
| fmv.x.w a1, ft0 | |
| vmv.v.x v2, a1 | |
| vslide1up.vx v3, v2, a1 | |
| vslide1up.vx v2, v3, a1 | |
| vslide1up.vx v3, v2, a1 | |
| vslide1up.vx v2, v3, a1 | |
| vfmul.vv v0, v0, v2 | |
| vfadd.vv v0, v0, v1 | |
| vslideup.vx v1, v0, zero | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(t1) | |
| vslideup.vx v1, v0, a3 | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(t2) | |
| vslideup.vx v1, v0, a0 | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(s2) | |
| vslideup.vx v1, v0, a2 | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(a6) | |
| vsetvl a1, a5, a4 | |
| addi a1, a7, 132 | |
| vle.v v0, ( a1 ) | |
| flw ft0, 0(a6) | |
| fmv.x.w a1, ft0 | |
| flw ft0, 0(t1) | |
| fmv.x.w s0, ft0 | |
| vmv.v.x v1, s0 | |
| vslide1up.vx v2, v1, a1 | |
| flw ft0, 0(s2) | |
| fmv.x.w a1, ft0 | |
| vslide1up.vx v1, v2, a1 | |
| flw ft0, 0(t2) | |
| fmv.x.w a1, ft0 | |
| vslide1up.vx v2, v1, a1 | |
| vslide1up.vx v1, v2, s0 | |
| flw ft0, 0(t5) | |
| fmv.x.w a1, ft0 | |
| vmv.v.x v2, a1 | |
| vslide1up.vx v3, v2, a1 | |
| vslide1up.vx v2, v3, a1 | |
| vslide1up.vx v3, v2, a1 | |
| vslide1up.vx v2, v3, a1 | |
| vfmul.vv v0, v0, v2 | |
| vfadd.vv v0, v0, v1 | |
| vslideup.vx v1, v0, zero | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(t1) | |
| vslideup.vx v1, v0, a3 | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(t2) | |
| vslideup.vx v1, v0, a0 | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(s2) | |
| vslideup.vx v1, v0, a2 | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(a6) | |
| vsetvl a1, a5, a4 | |
| addi a1, a7, 136 | |
| vle.v v0, ( a1 ) | |
| flw ft0, 0(a6) | |
| fmv.x.w a1, ft0 | |
| flw ft0, 0(t1) | |
| fmv.x.w s0, ft0 | |
| vmv.v.x v1, s0 | |
| vslide1up.vx v2, v1, a1 | |
| flw ft0, 0(s2) | |
| fmv.x.w a1, ft0 | |
| vslide1up.vx v1, v2, a1 | |
| flw ft0, 0(t2) | |
| fmv.x.w a1, ft0 | |
| vslide1up.vx v2, v1, a1 | |
| vslide1up.vx v1, v2, s0 | |
| flw ft0, 0(s5) | |
| fmv.x.w a1, ft0 | |
| vmv.v.x v2, a1 | |
| vslide1up.vx v3, v2, a1 | |
| vslide1up.vx v2, v3, a1 | |
| vslide1up.vx v3, v2, a1 | |
| vslide1up.vx v2, v3, a1 | |
| vfmul.vv v0, v0, v2 | |
| vfadd.vv v0, v0, v1 | |
| vslideup.vx v1, v0, zero | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(t1) | |
| vslideup.vx v1, v0, a3 | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(t2) | |
| vslideup.vx v1, v0, a0 | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(s2) | |
| vslideup.vx v1, v0, a2 | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(a6) | |
| vsetvl a1, a5, a4 | |
| addi a1, a7, 140 | |
| vle.v v0, ( a1 ) | |
| flw ft0, 0(a6) | |
| fmv.x.w a1, ft0 | |
| flw ft0, 0(t1) | |
| fmv.x.w s0, ft0 | |
| vmv.v.x v1, s0 | |
| vslide1up.vx v2, v1, a1 | |
| flw ft0, 0(s2) | |
| fmv.x.w a1, ft0 | |
| vslide1up.vx v1, v2, a1 | |
| flw ft0, 0(t2) | |
| fmv.x.w a1, ft0 | |
| vslide1up.vx v2, v1, a1 | |
| vslide1up.vx v1, v2, s0 | |
| flw ft0, 0(s11) | |
| fmv.x.w a1, ft0 | |
| vmv.v.x v2, a1 | |
| vslide1up.vx v3, v2, a1 | |
| vslide1up.vx v2, v3, a1 | |
| vslide1up.vx v3, v2, a1 | |
| vslide1up.vx v2, v3, a1 | |
| vfmul.vv v0, v0, v2 | |
| vfadd.vv v0, v0, v1 | |
| vslideup.vx v1, v0, zero | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(t1) | |
| vslideup.vx v1, v0, a3 | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(t2) | |
| vslideup.vx v1, v0, a0 | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(s2) | |
| vslideup.vx v1, v0, a2 | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(a6) | |
| vsetvl a1, a5, a4 | |
| addi a1, a7, 144 | |
| vle.v v0, ( a1 ) | |
| flw ft0, 0(a6) | |
| fmv.x.w a1, ft0 | |
| flw ft0, 0(t1) | |
| fmv.x.w s0, ft0 | |
| vmv.v.x v1, s0 | |
| vslide1up.vx v2, v1, a1 | |
| flw ft0, 0(s2) | |
| fmv.x.w a1, ft0 | |
| vslide1up.vx v1, v2, a1 | |
| flw ft0, 0(t2) | |
| fmv.x.w a1, ft0 | |
| vslide1up.vx v2, v1, a1 | |
| vslide1up.vx v1, v2, s0 | |
| flw ft0, 0(s9) | |
| fmv.x.w a1, ft0 | |
| vmv.v.x v2, a1 | |
| vslide1up.vx v3, v2, a1 | |
| vslide1up.vx v2, v3, a1 | |
| vslide1up.vx v3, v2, a1 | |
| vslide1up.vx v2, v3, a1 | |
| vfmul.vv v0, v0, v2 | |
| vfadd.vv v0, v0, v1 | |
| vslideup.vx v1, v0, zero | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(t1) | |
| vslideup.vx v1, v0, a3 | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(t2) | |
| vslideup.vx v1, v0, a0 | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(s2) | |
| vslideup.vx v1, v0, a2 | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(a6) | |
| vsetvl a1, a5, a4 | |
| addi a1, a7, 256 | |
| vle.v v0, ( a1 ) | |
| flw ft0, 0(a6) | |
| fmv.x.w a1, ft0 | |
| flw ft0, 0(t1) | |
| fmv.x.w s0, ft0 | |
| vmv.v.x v1, s0 | |
| vslide1up.vx v2, v1, a1 | |
| flw ft0, 0(s2) | |
| fmv.x.w a1, ft0 | |
| vslide1up.vx v1, v2, a1 | |
| flw ft0, 0(t2) | |
| fmv.x.w a1, ft0 | |
| vslide1up.vx v2, v1, a1 | |
| vslide1up.vx v1, v2, s0 | |
| flw ft0, 0(s8) | |
| fmv.x.w a1, ft0 | |
| vmv.v.x v2, a1 | |
| vslide1up.vx v3, v2, a1 | |
| vslide1up.vx v2, v3, a1 | |
| vslide1up.vx v3, v2, a1 | |
| vslide1up.vx v2, v3, a1 | |
| vfmul.vv v0, v0, v2 | |
| vfadd.vv v0, v0, v1 | |
| vslideup.vx v1, v0, zero | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(t1) | |
| vslideup.vx v1, v0, a3 | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(t2) | |
| vslideup.vx v1, v0, a0 | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(s2) | |
| vslideup.vx v1, v0, a2 | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(a6) | |
| vsetvl a1, a5, a4 | |
| addi a1, a7, 260 | |
| vle.v v0, ( a1 ) | |
| flw ft0, 0(a6) | |
| fmv.x.w a1, ft0 | |
| flw ft0, 0(t1) | |
| fmv.x.w s0, ft0 | |
| vmv.v.x v1, s0 | |
| vslide1up.vx v2, v1, a1 | |
| flw ft0, 0(s2) | |
| fmv.x.w a1, ft0 | |
| vslide1up.vx v1, v2, a1 | |
| flw ft0, 0(t2) | |
| fmv.x.w a1, ft0 | |
| vslide1up.vx v2, v1, a1 | |
| vslide1up.vx v1, v2, s0 | |
| ld a1, 168(sp) | |
| flw ft0, 0(a1) | |
| fmv.x.w a1, ft0 | |
| vmv.v.x v2, a1 | |
| vslide1up.vx v3, v2, a1 | |
| vslide1up.vx v2, v3, a1 | |
| vslide1up.vx v3, v2, a1 | |
| vslide1up.vx v2, v3, a1 | |
| vfmul.vv v0, v0, v2 | |
| vfadd.vv v0, v0, v1 | |
| vslideup.vx v1, v0, zero | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(t1) | |
| vslideup.vx v1, v0, a3 | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(t2) | |
| vslideup.vx v1, v0, a0 | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(s2) | |
| vslideup.vx v1, v0, a2 | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(a6) | |
| vsetvl a1, a5, a4 | |
| addi a1, a7, 264 | |
| vle.v v0, ( a1 ) | |
| flw ft0, 0(a6) | |
| fmv.x.w a1, ft0 | |
| flw ft0, 0(t1) | |
| fmv.x.w s0, ft0 | |
| vmv.v.x v1, s0 | |
| vslide1up.vx v2, v1, a1 | |
| flw ft0, 0(s2) | |
| fmv.x.w a1, ft0 | |
| vslide1up.vx v1, v2, a1 | |
| flw ft0, 0(t2) | |
| fmv.x.w a1, ft0 | |
| vslide1up.vx v2, v1, a1 | |
| vslide1up.vx v1, v2, s0 | |
| ld a1, 176(sp) | |
| flw ft0, 0(a1) | |
| fmv.x.w a1, ft0 | |
| vmv.v.x v2, a1 | |
| vslide1up.vx v3, v2, a1 | |
| vslide1up.vx v2, v3, a1 | |
| vslide1up.vx v3, v2, a1 | |
| vslide1up.vx v2, v3, a1 | |
| vfmul.vv v0, v0, v2 | |
| vfadd.vv v0, v0, v1 | |
| vslideup.vx v1, v0, zero | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(t1) | |
| vslideup.vx v1, v0, a3 | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(t2) | |
| vslideup.vx v1, v0, a0 | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(s2) | |
| vslideup.vx v1, v0, a2 | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(a6) | |
| vsetvl a1, a5, a4 | |
| addi a1, a7, 268 | |
| vle.v v0, ( a1 ) | |
| flw ft0, 0(a6) | |
| fmv.x.w a1, ft0 | |
| flw ft0, 0(t1) | |
| fmv.x.w s0, ft0 | |
| vmv.v.x v1, s0 | |
| vslide1up.vx v2, v1, a1 | |
| flw ft0, 0(s2) | |
| fmv.x.w a1, ft0 | |
| vslide1up.vx v1, v2, a1 | |
| flw ft0, 0(t2) | |
| fmv.x.w a1, ft0 | |
| vslide1up.vx v2, v1, a1 | |
| vslide1up.vx v1, v2, s0 | |
| ld a1, 184(sp) | |
| flw ft0, 0(a1) | |
| fmv.x.w a1, ft0 | |
| vmv.v.x v2, a1 | |
| vslide1up.vx v3, v2, a1 | |
| vslide1up.vx v2, v3, a1 | |
| vslide1up.vx v3, v2, a1 | |
| vslide1up.vx v2, v3, a1 | |
| vfmul.vv v0, v0, v2 | |
| vfadd.vv v0, v0, v1 | |
| vslideup.vx v1, v0, zero | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(t1) | |
| vslideup.vx v1, v0, a3 | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(t2) | |
| vslideup.vx v1, v0, a0 | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(s2) | |
| vslideup.vx v1, v0, a2 | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(a6) | |
| vsetvl a1, a5, a4 | |
| addi a1, a7, 272 | |
| vle.v v0, ( a1 ) | |
| flw ft0, 0(a6) | |
| fmv.x.w a1, ft0 | |
| flw ft0, 0(t1) | |
| fmv.x.w s0, ft0 | |
| vmv.v.x v1, s0 | |
| vslide1up.vx v2, v1, a1 | |
| flw ft0, 0(s2) | |
| fmv.x.w a1, ft0 | |
| vslide1up.vx v1, v2, a1 | |
| flw ft0, 0(t2) | |
| fmv.x.w a1, ft0 | |
| vslide1up.vx v2, v1, a1 | |
| vslide1up.vx v1, v2, s0 | |
| ld a1, 192(sp) | |
| flw ft0, 0(a1) | |
| fmv.x.w a1, ft0 | |
| vmv.v.x v2, a1 | |
| vslide1up.vx v3, v2, a1 | |
| vslide1up.vx v2, v3, a1 | |
| vslide1up.vx v3, v2, a1 | |
| vslide1up.vx v2, v3, a1 | |
| vfmul.vv v0, v0, v2 | |
| vfadd.vv v0, v0, v1 | |
| vslideup.vx v1, v0, zero | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(t1) | |
| vslideup.vx v1, v0, a3 | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(t2) | |
| vslideup.vx v1, v0, a0 | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(s2) | |
| vslideup.vx v1, v0, a2 | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(a6) | |
| vsetvl a1, a5, a4 | |
| addi a1, a7, 384 | |
| vle.v v0, ( a1 ) | |
| flw ft0, 0(a6) | |
| fmv.x.w a1, ft0 | |
| flw ft0, 0(t1) | |
| fmv.x.w s0, ft0 | |
| vmv.v.x v1, s0 | |
| vslide1up.vx v2, v1, a1 | |
| flw ft0, 0(s2) | |
| fmv.x.w a1, ft0 | |
| vslide1up.vx v1, v2, a1 | |
| flw ft0, 0(t2) | |
| fmv.x.w a1, ft0 | |
| vslide1up.vx v2, v1, a1 | |
| vslide1up.vx v1, v2, s0 | |
| ld a1, 200(sp) | |
| flw ft0, 0(a1) | |
| fmv.x.w a1, ft0 | |
| vmv.v.x v2, a1 | |
| vslide1up.vx v3, v2, a1 | |
| vslide1up.vx v2, v3, a1 | |
| vslide1up.vx v3, v2, a1 | |
| vslide1up.vx v2, v3, a1 | |
| vfmul.vv v0, v0, v2 | |
| vfadd.vv v0, v0, v1 | |
| vslideup.vx v1, v0, zero | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(t1) | |
| vslideup.vx v1, v0, a3 | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(t2) | |
| vslideup.vx v1, v0, a0 | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(s2) | |
| vslideup.vx v1, v0, a2 | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(a6) | |
| vsetvl a1, a5, a4 | |
| addi a1, a7, 388 | |
| vle.v v0, ( a1 ) | |
| flw ft0, 0(a6) | |
| fmv.x.w a1, ft0 | |
| flw ft0, 0(t1) | |
| fmv.x.w s0, ft0 | |
| vmv.v.x v1, s0 | |
| vslide1up.vx v2, v1, a1 | |
| flw ft0, 0(s2) | |
| fmv.x.w a1, ft0 | |
| vslide1up.vx v1, v2, a1 | |
| flw ft0, 0(t2) | |
| fmv.x.w a1, ft0 | |
| vslide1up.vx v2, v1, a1 | |
| vslide1up.vx v1, v2, s0 | |
| ld a1, 208(sp) | |
| flw ft0, 0(a1) | |
| fmv.x.w a1, ft0 | |
| vmv.v.x v2, a1 | |
| vslide1up.vx v3, v2, a1 | |
| vslide1up.vx v2, v3, a1 | |
| vslide1up.vx v3, v2, a1 | |
| vslide1up.vx v2, v3, a1 | |
| vfmul.vv v0, v0, v2 | |
| vfadd.vv v0, v0, v1 | |
| vslideup.vx v1, v0, zero | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(t1) | |
| vslideup.vx v1, v0, a3 | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(t2) | |
| vslideup.vx v1, v0, a0 | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(s2) | |
| vslideup.vx v1, v0, a2 | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(a6) | |
| vsetvl a1, a5, a4 | |
| addi a1, a7, 392 | |
| vle.v v0, ( a1 ) | |
| flw ft0, 0(a6) | |
| fmv.x.w a1, ft0 | |
| flw ft0, 0(t1) | |
| fmv.x.w s0, ft0 | |
| vmv.v.x v1, s0 | |
| vslide1up.vx v2, v1, a1 | |
| flw ft0, 0(s2) | |
| fmv.x.w a1, ft0 | |
| vslide1up.vx v1, v2, a1 | |
| flw ft0, 0(t2) | |
| fmv.x.w a1, ft0 | |
| vslide1up.vx v2, v1, a1 | |
| vslide1up.vx v1, v2, s0 | |
| ld a1, 216(sp) | |
| flw ft0, 0(a1) | |
| fmv.x.w a1, ft0 | |
| vmv.v.x v2, a1 | |
| vslide1up.vx v3, v2, a1 | |
| vslide1up.vx v2, v3, a1 | |
| vslide1up.vx v3, v2, a1 | |
| vslide1up.vx v2, v3, a1 | |
| vfmul.vv v0, v0, v2 | |
| vfadd.vv v0, v0, v1 | |
| vslideup.vx v1, v0, zero | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(t1) | |
| vslideup.vx v1, v0, a3 | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(t2) | |
| vslideup.vx v1, v0, a0 | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(s2) | |
| vslideup.vx v1, v0, a2 | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(a6) | |
| vsetvl a1, a5, a4 | |
| addi a1, a7, 396 | |
| vle.v v0, ( a1 ) | |
| flw ft0, 0(a6) | |
| fmv.x.w a1, ft0 | |
| flw ft0, 0(t1) | |
| fmv.x.w s0, ft0 | |
| vmv.v.x v1, s0 | |
| vslide1up.vx v2, v1, a1 | |
| flw ft0, 0(s2) | |
| fmv.x.w a1, ft0 | |
| vslide1up.vx v1, v2, a1 | |
| flw ft0, 0(t2) | |
| fmv.x.w a1, ft0 | |
| vslide1up.vx v2, v1, a1 | |
| vslide1up.vx v1, v2, s0 | |
| ld a1, 224(sp) | |
| flw ft0, 0(a1) | |
| fmv.x.w a1, ft0 | |
| vmv.v.x v2, a1 | |
| vslide1up.vx v3, v2, a1 | |
| vslide1up.vx v2, v3, a1 | |
| vslide1up.vx v3, v2, a1 | |
| vslide1up.vx v2, v3, a1 | |
| vfmul.vv v0, v0, v2 | |
| vfadd.vv v0, v0, v1 | |
| vslideup.vx v1, v0, zero | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(t1) | |
| vslideup.vx v1, v0, a3 | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(t2) | |
| vslideup.vx v1, v0, a0 | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(s2) | |
| vslideup.vx v1, v0, a2 | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(a6) | |
| vsetvl a1, a5, a4 | |
| addi a1, a7, 400 | |
| vle.v v0, ( a1 ) | |
| flw ft0, 0(a6) | |
| fmv.x.w a1, ft0 | |
| flw ft0, 0(t1) | |
| fmv.x.w s0, ft0 | |
| vmv.v.x v1, s0 | |
| vslide1up.vx v2, v1, a1 | |
| flw ft0, 0(s2) | |
| fmv.x.w a1, ft0 | |
| vslide1up.vx v1, v2, a1 | |
| flw ft0, 0(t2) | |
| fmv.x.w a1, ft0 | |
| vslide1up.vx v2, v1, a1 | |
| vslide1up.vx v1, v2, s0 | |
| ld a1, 232(sp) | |
| flw ft0, 0(a1) | |
| fmv.x.w a1, ft0 | |
| vmv.v.x v2, a1 | |
| vslide1up.vx v3, v2, a1 | |
| vslide1up.vx v2, v3, a1 | |
| vslide1up.vx v3, v2, a1 | |
| vslide1up.vx v2, v3, a1 | |
| vfmul.vv v0, v0, v2 | |
| vfadd.vv v0, v0, v1 | |
| vslideup.vx v1, v0, zero | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(t1) | |
| vslideup.vx v1, v0, a3 | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(t2) | |
| vslideup.vx v1, v0, a0 | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(s2) | |
| vslideup.vx v1, v0, a2 | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(a6) | |
| vsetvl a1, a5, a4 | |
| addi a1, a7, 512 | |
| vle.v v0, ( a1 ) | |
| flw ft0, 0(a6) | |
| fmv.x.w a1, ft0 | |
| flw ft0, 0(t1) | |
| fmv.x.w s0, ft0 | |
| vmv.v.x v1, s0 | |
| vslide1up.vx v2, v1, a1 | |
| flw ft0, 0(s2) | |
| fmv.x.w a1, ft0 | |
| vslide1up.vx v1, v2, a1 | |
| flw ft0, 0(t2) | |
| fmv.x.w a1, ft0 | |
| vslide1up.vx v2, v1, a1 | |
| vslide1up.vx v1, v2, s0 | |
| ld a1, 240(sp) | |
| flw ft0, 0(a1) | |
| fmv.x.w a1, ft0 | |
| vmv.v.x v2, a1 | |
| vslide1up.vx v3, v2, a1 | |
| vslide1up.vx v2, v3, a1 | |
| vslide1up.vx v3, v2, a1 | |
| vslide1up.vx v2, v3, a1 | |
| vfmul.vv v0, v0, v2 | |
| vfadd.vv v0, v0, v1 | |
| vslideup.vx v1, v0, zero | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(t1) | |
| vslideup.vx v1, v0, a3 | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(t2) | |
| vslideup.vx v1, v0, a0 | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(s2) | |
| vslideup.vx v1, v0, a2 | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(a6) | |
| vsetvl a1, a5, a4 | |
| addi a1, a7, 516 | |
| vle.v v0, ( a1 ) | |
| flw ft0, 0(a6) | |
| fmv.x.w a1, ft0 | |
| flw ft0, 0(t1) | |
| fmv.x.w s0, ft0 | |
| vmv.v.x v1, s0 | |
| vslide1up.vx v2, v1, a1 | |
| flw ft0, 0(s2) | |
| fmv.x.w a1, ft0 | |
| vslide1up.vx v1, v2, a1 | |
| flw ft0, 0(t2) | |
| fmv.x.w a1, ft0 | |
| vslide1up.vx v2, v1, a1 | |
| vslide1up.vx v1, v2, s0 | |
| ld a1, 248(sp) | |
| flw ft0, 0(a1) | |
| fmv.x.w a1, ft0 | |
| vmv.v.x v2, a1 | |
| vslide1up.vx v3, v2, a1 | |
| vslide1up.vx v2, v3, a1 | |
| vslide1up.vx v3, v2, a1 | |
| vslide1up.vx v2, v3, a1 | |
| vfmul.vv v0, v0, v2 | |
| vfadd.vv v0, v0, v1 | |
| vslideup.vx v1, v0, zero | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(t1) | |
| vslideup.vx v1, v0, a3 | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(t2) | |
| vslideup.vx v1, v0, a0 | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(s2) | |
| vslideup.vx v1, v0, a2 | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(a6) | |
| vsetvl a1, a5, a4 | |
| addi a1, a7, 520 | |
| vle.v v0, ( a1 ) | |
| flw ft0, 0(a6) | |
| fmv.x.w a1, ft0 | |
| flw ft0, 0(t1) | |
| fmv.x.w s0, ft0 | |
| vmv.v.x v1, s0 | |
| vslide1up.vx v2, v1, a1 | |
| flw ft0, 0(s2) | |
| fmv.x.w a1, ft0 | |
| vslide1up.vx v1, v2, a1 | |
| flw ft0, 0(t2) | |
| fmv.x.w a1, ft0 | |
| vslide1up.vx v2, v1, a1 | |
| vslide1up.vx v1, v2, s0 | |
| ld a1, 256(sp) | |
| flw ft0, 0(a1) | |
| fmv.x.w a1, ft0 | |
| vmv.v.x v2, a1 | |
| vslide1up.vx v3, v2, a1 | |
| vslide1up.vx v2, v3, a1 | |
| vslide1up.vx v3, v2, a1 | |
| vslide1up.vx v2, v3, a1 | |
| vfmul.vv v0, v0, v2 | |
| vfadd.vv v0, v0, v1 | |
| vslideup.vx v1, v0, zero | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(t1) | |
| vslideup.vx v1, v0, a3 | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(t2) | |
| vslideup.vx v1, v0, a0 | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(s2) | |
| vslideup.vx v1, v0, a2 | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(a6) | |
| vsetvl a1, a5, a4 | |
| addi a1, a7, 524 | |
| vle.v v0, ( a1 ) | |
| flw ft0, 0(a6) | |
| fmv.x.w a1, ft0 | |
| flw ft0, 0(t1) | |
| fmv.x.w s0, ft0 | |
| vmv.v.x v1, s0 | |
| vslide1up.vx v2, v1, a1 | |
| flw ft0, 0(s2) | |
| fmv.x.w a1, ft0 | |
| vslide1up.vx v1, v2, a1 | |
| flw ft0, 0(t2) | |
| fmv.x.w a1, ft0 | |
| vslide1up.vx v2, v1, a1 | |
| vslide1up.vx v1, v2, s0 | |
| ld a1, 264(sp) | |
| flw ft0, 0(a1) | |
| fmv.x.w a1, ft0 | |
| vmv.v.x v2, a1 | |
| vslide1up.vx v3, v2, a1 | |
| vslide1up.vx v2, v3, a1 | |
| vslide1up.vx v3, v2, a1 | |
| vslide1up.vx v2, v3, a1 | |
| vfmul.vv v0, v0, v2 | |
| vfadd.vv v0, v0, v1 | |
| vslideup.vx v1, v0, zero | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(t1) | |
| vslideup.vx v1, v0, a3 | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(t2) | |
| vslideup.vx v1, v0, a0 | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(s2) | |
| vslideup.vx v1, v0, a2 | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(a6) | |
| vsetvl a1, a5, a4 | |
| addi a1, a7, 528 | |
| vle.v v0, ( a1 ) | |
| flw ft0, 0(a6) | |
| fmv.x.w a1, ft0 | |
| flw ft0, 0(t1) | |
| fmv.x.w s1, ft0 | |
| vmv.v.x v1, s1 | |
| vslide1up.vx v2, v1, a1 | |
| flw ft0, 0(s2) | |
| fmv.x.w a1, ft0 | |
| vslide1up.vx v1, v2, a1 | |
| flw ft0, 0(t2) | |
| fmv.x.w a1, ft0 | |
| vslide1up.vx v2, v1, a1 | |
| vslide1up.vx v1, v2, s1 | |
| ld a1, 272(sp) | |
| flw ft0, 0(a1) | |
| fmv.x.w a1, ft0 | |
| vmv.v.x v2, a1 | |
| vslide1up.vx v3, v2, a1 | |
| vslide1up.vx v2, v3, a1 | |
| vslide1up.vx v3, v2, a1 | |
| vslide1up.vx v2, v3, a1 | |
| vfmul.vv v0, v0, v2 | |
| vfadd.vv v0, v0, v1 | |
| vslideup.vx v1, v0, zero | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(t1) | |
| vslideup.vx v1, v0, a3 | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(t2) | |
| vslideup.vx v1, v0, a0 | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(s2) | |
| vslideup.vx v1, v0, a2 | |
| vfmv.f.s ft0, v1 | |
| fsw ft0, 0(a6) | |
| addi s4, s4, 16 | |
| addi t0, t0, 1 | |
| addi s10, s10, -1 | |
| bnez s10, .LBB3_17 | |
| # %bb.18: # %for_end38 | |
| # in Loop: Header=BB3_16 Depth=2 | |
| ld s4, 152(sp) | |
| addi s4, s4, 128 | |
| ld s0, 136(sp) | |
| addi s0, s0, 1 | |
| ld s1, 144(sp) | |
| addi s1, s1, 1 | |
| addi a1, zero, 28 | |
| bne s1, a1, .LBB3_16 | |
| # %bb.19: # %for_end35 | |
| # in Loop: Header=BB3_13 Depth=1 | |
| ld s1, 48(sp) | |
| addi a1, s1, 1 | |
| addiw s1, s1, 1 | |
| mv s0, a1 | |
| addi a6, zero, 28 | |
| addi a1, zero, 32 | |
| bgeu s1, a1, .LBB3_20 | |
| j .LBB3_13 | |
| .LBB3_20: # %for_begin39.preheader | |
| addi t2, zero, 28 | |
| addi t6, zero, 112 | |
| lui a0, 1 | |
| addiw a7, a0, -960 | |
| addi a6, zero, 32 | |
| ld a0, 8(sp) | |
| mv t0, a0 | |
| mv t1, zero | |
| ld s2, 288(sp) | |
| .LBB3_21: # %for_begin42.preheader | |
| # =>This Loop Header: Depth=1 | |
| # Child Loop BB3_22 Depth 2 | |
| # Child Loop BB3_23 Depth 3 | |
| srliw a1, t1, 3 | |
| mul t3, a1, t2 | |
| andi a3, t1, 7 | |
| mv a4, t0 | |
| mv t4, zero | |
| mv t5, zero | |
| .LBB3_22: # %for_begin45.preheader | |
| # Parent Loop BB3_21 Depth=1 | |
| # => This Loop Header: Depth=2 | |
| # Child Loop BB3_23 Depth 3 | |
| add a1, t5, t3 | |
| mul a1, a1, t2 | |
| mv s0, zero | |
| mv a2, zero | |
| .LBB3_23: # %for_body46 | |
| # Parent Loop BB3_21 Depth=1 | |
| # Parent Loop BB3_22 Depth=2 | |
| # => This Inner Loop Header: Depth=3 | |
| add s1, a2, a1 | |
| slli s1, s1, 3 | |
| or s1, s1, a3 | |
| sext.w s1, s1 | |
| slli s1, s1, 2 | |
| add s1, s3, s1 | |
| add a5, a4, s0 | |
| flw ft0, 0(s1) | |
| fsw ft0, 0(a5) | |
| addi a2, a2, 1 | |
| addi s0, s0, 4 | |
| bne s0, t6, .LBB3_23 | |
| # %bb.24: # %for_end47 | |
| # in Loop: Header=BB3_22 Depth=2 | |
| addi a4, a4, 112 | |
| addi t5, t5, 1 | |
| addi t4, t4, 1 | |
| bne t4, t2, .LBB3_22 | |
| # %bb.25: # %for_end44 | |
| # in Loop: Header=BB3_21 Depth=1 | |
| add t0, t0, a7 | |
| addi t1, t1, 1 | |
| bne t1, a6, .LBB3_21 | |
| # %bb.26: # %for_begin48.preheader | |
| addi s1, zero, 56 | |
| lui a1, 1 | |
| addiw a7, a1, -960 | |
| addi a6, zero, 32 | |
| mv a3, zero | |
| ld t0, 24(sp) | |
| ld a1, 16(sp) | |
| .LBB3_27: # %for_begin51.preheader | |
| # =>This Loop Header: Depth=1 | |
| # Child Loop BB3_28 Depth 2 | |
| slli a2, a3, 2 | |
| add a2, t0, a2 | |
| addi a4, zero, 28 | |
| flw ft0, 0(a2) | |
| mv a5, s1 | |
| .LBB3_28: # %for_begin54.preheader | |
| # Parent Loop BB3_27 Depth=1 | |
| # => This Inner Loop Header: Depth=2 | |
| add s0, a1, a5 | |
| add a2, a0, a5 | |
| flw ft1, -56(a2) | |
| fadd.s ft1, ft0, ft1 | |
| fsw ft1, -56(s0) | |
| flw ft1, -52(a2) | |
| fadd.s ft1, ft0, ft1 | |
| fsw ft1, -52(s0) | |
| flw ft1, -48(a2) | |
| fadd.s ft1, ft0, ft1 | |
| fsw ft1, -48(s0) | |
| flw ft1, -44(a2) | |
| fadd.s ft1, ft0, ft1 | |
| fsw ft1, -44(s0) | |
| flw ft1, -40(a2) | |
| fadd.s ft1, ft0, ft1 | |
| fsw ft1, -40(s0) | |
| flw ft1, -36(a2) | |
| fadd.s ft1, ft0, ft1 | |
| fsw ft1, -36(s0) | |
| flw ft1, -32(a2) | |
| fadd.s ft1, ft0, ft1 | |
| fsw ft1, -32(s0) | |
| flw ft1, -28(a2) | |
| fadd.s ft1, ft0, ft1 | |
| fsw ft1, -28(s0) | |
| flw ft1, -24(a2) | |
| fadd.s ft1, ft0, ft1 | |
| fsw ft1, -24(s0) | |
| flw ft1, -20(a2) | |
| fadd.s ft1, ft0, ft1 | |
| fsw ft1, -20(s0) | |
| flw ft1, -16(a2) | |
| fadd.s ft1, ft0, ft1 | |
| fsw ft1, -16(s0) | |
| flw ft1, -12(a2) | |
| fadd.s ft1, ft0, ft1 | |
| fsw ft1, -12(s0) | |
| flw ft1, -8(a2) | |
| fadd.s ft1, ft0, ft1 | |
| fsw ft1, -8(s0) | |
| flw ft1, -4(a2) | |
| fadd.s ft1, ft0, ft1 | |
| fsw ft1, -4(s0) | |
| flw ft1, 0(a2) | |
| fadd.s ft1, ft0, ft1 | |
| fsw ft1, 0(s0) | |
| flw ft1, 4(a2) | |
| fadd.s ft1, ft0, ft1 | |
| fsw ft1, 4(s0) | |
| flw ft1, 8(a2) | |
| fadd.s ft1, ft0, ft1 | |
| fsw ft1, 8(s0) | |
| flw ft1, 12(a2) | |
| fadd.s ft1, ft0, ft1 | |
| fsw ft1, 12(s0) | |
| flw ft1, 16(a2) | |
| fadd.s ft1, ft0, ft1 | |
| fsw ft1, 16(s0) | |
| flw ft1, 20(a2) | |
| fadd.s ft1, ft0, ft1 | |
| fsw ft1, 20(s0) | |
| flw ft1, 24(a2) | |
| fadd.s ft1, ft0, ft1 | |
| fsw ft1, 24(s0) | |
| flw ft1, 28(a2) | |
| fadd.s ft1, ft0, ft1 | |
| fsw ft1, 28(s0) | |
| flw ft1, 32(a2) | |
| fadd.s ft1, ft0, ft1 | |
| fsw ft1, 32(s0) | |
| flw ft1, 36(a2) | |
| fadd.s ft1, ft0, ft1 | |
| fsw ft1, 36(s0) | |
| flw ft1, 40(a2) | |
| fadd.s ft1, ft0, ft1 | |
| fsw ft1, 40(s0) | |
| flw ft1, 44(a2) | |
| fadd.s ft1, ft0, ft1 | |
| fsw ft1, 44(s0) | |
| flw ft1, 48(a2) | |
| fadd.s ft1, ft0, ft1 | |
| fsw ft1, 48(s0) | |
| flw ft1, 52(a2) | |
| fadd.s ft1, ft0, ft1 | |
| fsw ft1, 52(s0) | |
| addi a5, a5, 112 | |
| addi a4, a4, -1 | |
| bnez a4, .LBB3_28 | |
| # %bb.29: # %for_end53 | |
| # in Loop: Header=BB3_27 Depth=1 | |
| add s1, s1, a7 | |
| addi a3, a3, 1 | |
| bne a3, a6, .LBB3_27 | |
| # %bb.30: # %for_end50 | |
| call _ZdaPv | |
| mv a0, s3 | |
| call _ZdaPv | |
| ld a0, 40(sp) | |
| call _ZdaPv | |
| mv a0, s2 | |
| call _ZdaPv | |
| ld s11, 312(sp) | |
| ld s10, 320(sp) | |
| ld s9, 328(sp) | |
| ld s8, 336(sp) | |
| ld s7, 344(sp) | |
| ld s6, 352(sp) | |
| ld s5, 360(sp) | |
| ld s4, 368(sp) | |
| ld s3, 376(sp) | |
| ld s2, 384(sp) | |
| ld s1, 392(sp) | |
| ld s0, 400(sp) | |
| ld ra, 408(sp) | |
| .cfi_restore ra | |
| .cfi_restore s0 | |
| .cfi_restore s1 | |
| .cfi_restore s2 | |
| .cfi_restore s3 | |
| .cfi_restore s4 | |
| .cfi_restore s5 | |
| .cfi_restore s6 | |
| .cfi_restore s7 | |
| .cfi_restore s8 | |
| .cfi_restore s9 | |
| .cfi_restore s10 | |
| .cfi_restore s11 | |
| addi sp, sp, 416 | |
| .cfi_def_cfa_offset 0 | |
| ret | |
| .Lfunc_end3: | |
| .size fuse_conv2d_compute_, .Lfunc_end3-fuse_conv2d_compute_ | |
| .cfi_endproc | |
| # -- End function | |
| .globl fuse_relu # -- Begin function fuse_relu | |
| .p2align 2 | |
| .type fuse_relu,@function | |
| # fuse_relu: argument-checking entry point in front of fuse_relu_compute_. | |
| # In: a0 = array of 8-byte argument slots (two tensor-descriptor pointers) | |
| # a1 = array of 32-bit argument type codes | |
| # a2 = argument count (only the low 32 bits are used) | |
| # Out: a0 = 0 on success; -1 after a failed check has been reported through | |
| # the function pointer stored at __TVMAPISetLastError. | |
| # Uses: s0/s1 as scratch (saved and restored here), plus a*/t* temporaries. | |
| # The descriptor offsets read below (0, 8, 12, 16, 20-22, 24, 32, 40) look | |
| # like DLPack's DLTensor layout -- NOTE(review): confirm against the dlpack.h | |
| # this object was built with. | |
| fuse_relu: # @fuse_relu | |
| .cfi_startproc | |
| # %bb.0: # %entry | |
| addi sp, sp, -32 | |
| .cfi_def_cfa_offset 32 | |
| sd ra, 24(sp) | |
| sd s0, 16(sp) | |
| sd s1, 8(sp) | |
| .cfi_offset ra, -8 | |
| .cfi_offset s0, -16 | |
| .cfi_offset s1, -24 | |
| # Zero-extend the 32-bit argument count; exactly 2 arguments are required. | |
| slli a2, a2, 32 | |
| srli a2, a2, 32 | |
| addi a3, zero, 2 | |
| bne a2, a3, .LBB4_30 | |
| # %bb.1: # %assert_end | |
| # a4/a3 = type codes of arg1/arg0, a2/a5 = descriptors of arg1/arg0, | |
| # t0 = pointer at arg0+24, a1 = pointer at arg0+0, a0 = pointer at arg0+32. | |
| lwu a4, 4(a1) | |
| ld a2, 8(a0) | |
| lwu a3, 0(a1) | |
| ld a5, 0(a0) | |
| ld t0, 24(a5) | |
| ld a1, 0(a5) | |
| ld a0, 32(a5) | |
| beqz a0, .LBB4_3 | |
| # %bb.2: # %if_then | |
| # The arg0+32 pointer is non-null: its first 32-bit word must be 1. | |
| lw a0, 0(a0) | |
| addi s0, zero, 1 | |
| bne a0, s0, .LBB4_31 | |
| .LBB4_3: # %if_end | |
| # a7 = pointer at arg1+24, a0 = pointer at arg1+0 (stays live until the call), | |
| # a6/t1 = 32-bit words at arg0+12 / arg0+8, s0 = pointer at arg1+32. | |
| ld a7, 24(a2) | |
| ld a0, 0(a2) | |
| lwu a6, 12(a5) | |
| lwu t1, 8(a5) | |
| ld s0, 32(a2) | |
| beqz s0, .LBB4_5 | |
| # %bb.4: # %if_then3 | |
| # Same rule for arg1: a non-null arg1+32 pointer must start with the word 1. | |
| lw s0, 0(s0) | |
| addi s1, zero, 1 | |
| bne s0, s1, .LBB4_32 | |
| .LBB4_5: # %if_end4 | |
| # arg0's type code must be <= 13 ... | |
| addi s1, zero, 13 | |
| bltu s1, a3, .LBB4_25 | |
| # %bb.6: # %if_end4 | |
| # ... and one of the codes selected by mask 0x2098 (bits 3, 4, 7, 13). | |
| addi s1, zero, 1 | |
| sll a3, s1, a3 | |
| lui s1, 2 | |
| addiw s1, s1, 152 | |
| and a3, a3, s1 | |
| beqz a3, .LBB4_25 | |
| # %bb.7: # %assert_end8 | |
| # Same two-step type-code test for arg1. | |
| addi a3, zero, 13 | |
| bltu a3, a4, .LBB4_26 | |
| # %bb.8: # %assert_end8 | |
| addi a3, zero, 1 | |
| sll a4, a3, a4 | |
| lui s1, 2 | |
| addiw s1, s1, 152 | |
| and a4, a4, s1 | |
| beqz a4, .LBB4_26 | |
| # %bb.9: # %assert_end10 | |
| # a3 is still 1 here: the word at arg0+8 must equal 1. | |
| bne t1, a3, .LBB4_33 | |
| # %bb.10: # %assert_end12 | |
| # The word at arg0+16 must be 1. | |
| lw a3, 16(a5) | |
| addi s0, zero, 1 | |
| bne a3, s0, .LBB4_34 | |
| # %bb.11: # %assert_end14 | |
| # Bytes arg0+20..23 must read: halfword@22 == 1, byte@21 == 32, byte@20 == 2. | |
| lhu a3, 22(a5) | |
| bne a3, s0, .LBB4_35 | |
| # %bb.12: # %assert_end14 | |
| lbu a3, 21(a5) | |
| addi a4, zero, 32 | |
| bne a3, a4, .LBB4_35 | |
| # %bb.13: # %assert_end14 | |
| lbu a3, 20(a5) | |
| addi a4, zero, 2 | |
| bne a3, a4, .LBB4_35 | |
| # %bb.14: # %assert_end16 | |
| # First word behind the arg0+24 pointer must be 25088 (6*4096 + 512), the | |
| # same element count fuse_relu_compute_ iterates over. | |
| lui a3, 6 | |
| addiw a3, a3, 512 | |
| lw a4, 0(t0) | |
| bne a4, a3, .LBB4_36 | |
| # %bb.15: # %assert_end18 | |
| # The 64-bit value at arg0+40 must be zero. | |
| ld a3, 40(a5) | |
| bnez a3, .LBB4_37 | |
| # %bb.16: # %assert_end20 | |
| # Repeat the +16, +20..23, +24 and +40 checks for arg1. | |
| lw a3, 16(a2) | |
| addi s0, zero, 1 | |
| bne a3, s0, .LBB4_38 | |
| # %bb.17: # %assert_end22 | |
| lhu a3, 22(a2) | |
| bne a3, s0, .LBB4_39 | |
| # %bb.18: # %assert_end22 | |
| lbu a3, 21(a2) | |
| addi a4, zero, 32 | |
| bne a3, a4, .LBB4_39 | |
| # %bb.19: # %assert_end22 | |
| lbu a3, 20(a2) | |
| addi a4, zero, 2 | |
| bne a3, a4, .LBB4_39 | |
| # %bb.20: # %assert_end24 | |
| lui a3, 6 | |
| addiw a3, a3, 512 | |
| lw a4, 0(a7) | |
| bne a4, a3, .LBB4_40 | |
| # %bb.21: # %assert_end26 | |
| ld a3, 40(a2) | |
| bnez a3, .LBB4_41 | |
| # %bb.22: # %assert_end28 | |
| # The word at arg1+8 must be 1 ... | |
| lw a3, 8(a2) | |
| addi s0, zero, 1 | |
| bne a3, s0, .LBB4_42 | |
| # %bb.23: # %assert_end30 | |
| # ... and the word at arg1+12 must match the one read from arg0+12 (a6). | |
| lw a2, 12(a2) | |
| sext.w a3, a6 | |
| bne a3, a2, .LBB4_44 | |
| # %bb.24: # %assert_end32 | |
| # All checks passed: a0 = pointer from arg1+0, a1 = pointer from arg0+0. | |
| call fuse_relu_compute_ | |
| mv a0, zero | |
| j .LBB4_29 | |
| # ---- Failure handlers: each loads the reporting callback into a1 and the | |
| # ---- address of its message into a0, then joins a shared tail. | |
| .LBB4_25: # %assert_fail7 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.54) | |
| addi a0, a0, %lo(.L.str.54) | |
| j .LBB4_27 | |
| .LBB4_26: # %assert_fail9 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.55) | |
| addi a0, a0, %lo(.L.str.55) | |
| .LBB4_27: # %assert_fail | |
| # Shared tail: report the message, then start building the -1 status. | |
| jalr a1 | |
| addi a0, zero, 1 | |
| slli a0, a0, 32 | |
| .LBB4_28: # %assert_fail1 | |
| # Every path arrives with a0 = 1 << 32, so a0 - 1 = 0x00000000FFFFFFFF. | |
| addi a0, a0, -1 | |
| # The status is a 32-bit int and RV64 returns such values sign-extended, so | |
| # widen it to a full 64-bit -1; the low 32 bits are unchanged. | |
| sext.w a0, a0 | |
| .LBB4_29: # %assert_fail1 | |
| # Common epilogue for the success and failure paths. | |
| ld s1, 8(sp) | |
| ld s0, 16(sp) | |
| ld ra, 24(sp) | |
| .cfi_restore ra | |
| .cfi_restore s0 | |
| .cfi_restore s1 | |
| addi sp, sp, 32 | |
| .cfi_def_cfa_offset 0 | |
| ret | |
| .LBB4_30: # %assert_fail | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.51) | |
| addi a0, a0, %lo(.L.str.51) | |
| j .LBB4_27 | |
| .LBB4_31: # %assert_fail1 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.52) | |
| addi a0, a0, %lo(.L.str.52) | |
| j .LBB4_43 | |
| .LBB4_32: # %assert_fail5 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.53) | |
| addi a0, a0, %lo(.L.str.53) | |
| jalr a1 | |
| # s1 is callee-saved and still holds the 1 loaded before the failed compare. | |
| slli a0, s1, 32 | |
| j .LBB4_28 | |
| .LBB4_33: # %assert_fail11 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.5) | |
| addi a0, a0, %lo(.L.str.5) | |
| j .LBB4_27 | |
| .LBB4_34: # %assert_fail13 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.56) | |
| addi a0, a0, %lo(.L.str.56) | |
| j .LBB4_43 | |
| .LBB4_35: # %assert_fail15 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.7) | |
| addi a0, a0, %lo(.L.str.7) | |
| j .LBB4_27 | |
| .LBB4_36: # %assert_fail17 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.57) | |
| addi a0, a0, %lo(.L.str.57) | |
| j .LBB4_27 | |
| .LBB4_37: # %assert_fail19 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.10) | |
| addi a0, a0, %lo(.L.str.10) | |
| j .LBB4_27 | |
| .LBB4_38: # %assert_fail21 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.58) | |
| addi a0, a0, %lo(.L.str.58) | |
| j .LBB4_43 | |
| .LBB4_39: # %assert_fail23 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.12) | |
| addi a0, a0, %lo(.L.str.12) | |
| j .LBB4_27 | |
| .LBB4_40: # %assert_fail25 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.59) | |
| addi a0, a0, %lo(.L.str.59) | |
| j .LBB4_27 | |
| .LBB4_41: # %assert_fail27 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.17) | |
| addi a0, a0, %lo(.L.str.17) | |
| j .LBB4_27 | |
| .LBB4_42: # %assert_fail29 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.18) | |
| addi a0, a0, %lo(.L.str.18) | |
| .LBB4_43: # %assert_fail1 | |
| # Variant tail for checks that left the constant 1 in callee-saved s0. | |
| jalr a1 | |
| slli a0, s0, 32 | |
| j .LBB4_28 | |
| .LBB4_44: # %assert_fail31 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.19) | |
| addi a0, a0, %lo(.L.str.19) | |
| j .LBB4_27 | |
| .Lfunc_end4: | |
| .size fuse_relu, .Lfunc_end4-fuse_relu | |
| .cfi_endproc | |
| # -- End function | |
| .section .sdata,"aw",@progbits | |
| .p2align 2 # -- Begin function fuse_relu_compute_ | |
| .LCPI5_0: | |
| .word 0 # 0.0f, the lower clamp | |
| .text | |
| .type fuse_relu_compute_,@function | |
| .globl fuse_relu_compute_ | |
| .p2align 2 | |
| # fuse_relu_compute_: dst[i] = max(src[i], 0.0f) over 25088 floats. | |
| # In: a0 = destination cursor, a1 = source cursor (both advance by 4 bytes | |
| # per element; each element is loaded before it is stored). | |
| # Uses: a2 (remaining count), a3 (constant address), ft0 (0.0f), ft1. | |
| # Leaf routine: no stack frame, nothing saved. | |
| fuse_relu_compute_: # @fuse_relu_compute_ | |
| # Load the clamp constant once, outside the loop. | |
| lui a3, %hi(.LCPI5_0) | |
| addi a3, a3, %lo(.LCPI5_0) | |
| flw ft0, 0(a3) | |
| # a2 = 6*4096 + 512 = 25088 elements still to process. | |
| lui a2, 6 | |
| addiw a2, a2, 512 | |
| .Lrelu_next_elem: | |
| flw ft1, 0(a1) | |
| addi a1, a1, 4 | |
| fmax.s ft1, ft1, ft0 | |
| fsw ft1, 0(a0) | |
| addi a0, a0, 4 | |
| addi a2, a2, -1 | |
| bnez a2, .Lrelu_next_elem | |
| # Count exhausted: done. | |
| ret | |
| .Lfunc_end5: | |
| .size fuse_relu_compute_, .Lfunc_end5-fuse_relu_compute_ | |
| # -- End function | |
| .globl fuse_max_pool2d # -- Begin function fuse_max_pool2d | |
| .p2align 2 | |
| .type fuse_max_pool2d,@function | |
| # fuse_max_pool2d: argument-checking entry point in front of | |
| # fuse_max_pool2d_compute_. | |
| # In: a0 = array of 8-byte argument slots (two tensor-descriptor pointers) | |
| # a1 = array of 32-bit argument type codes | |
| # a2 = argument count (only the low 32 bits are used) | |
| # Out: a0 = 0 on success; -1 after a failed check has been reported through | |
| # the function pointer stored at __TVMAPISetLastError. | |
| # Uses: s0 as scratch (saved and restored here), plus a*/t* temporaries. | |
| # The descriptor offsets read below (0, 8, 12, 16, 20-22, 24, 32, 40) look | |
| # like DLPack's DLTensor layout -- NOTE(review): confirm against the dlpack.h | |
| # this object was built with. | |
| fuse_max_pool2d: # @fuse_max_pool2d | |
| .cfi_startproc | |
| # %bb.0: # %entry | |
| addi sp, sp, -16 | |
| .cfi_def_cfa_offset 16 | |
| sd ra, 8(sp) | |
| sd s0, 0(sp) | |
| .cfi_offset ra, -8 | |
| .cfi_offset s0, -16 | |
| # Zero-extend the 32-bit argument count; exactly 2 arguments are required. | |
| slli a2, a2, 32 | |
| srli a2, a2, 32 | |
| addi a3, zero, 2 | |
| bne a2, a3, .LBB6_42 | |
| # %bb.1: # %assert_end | |
| # t0/t3 = type codes of arg1/arg0, a2/a5 = descriptors of arg1/arg0, | |
| # t2 = pointer at arg0+24, a1 = pointer at arg0+0, a0 = pointer at arg0+32. | |
| lwu t0, 4(a1) | |
| ld a2, 8(a0) | |
| lwu t3, 0(a1) | |
| ld a5, 0(a0) | |
| ld t2, 24(a5) | |
| ld a1, 0(a5) | |
| ld a0, 32(a5) | |
| beqz a0, .LBB6_6 | |
| # %bb.2: # %if_then | |
| # The arg0+32 pointer is non-null: its four 8-byte entries must read | |
| # 25088 (6*4096 + 512), 784, 28, 1 (entries 1-3 compared on their low 32 bits). | |
| lui a3, 6 | |
| addiw a3, a3, 512 | |
| lw s0, 0(a0) | |
| bne s0, a3, .LBB6_43 | |
| # %bb.3: # %if_then | |
| ld a3, 8(a0) | |
| slli a3, a3, 32 | |
| srli a3, a3, 32 | |
| addi s0, zero, 784 | |
| bne a3, s0, .LBB6_43 | |
| # %bb.4: # %if_then | |
| ld a3, 16(a0) | |
| slli a3, a3, 32 | |
| srli a3, a3, 32 | |
| addi s0, zero, 28 | |
| bne a3, s0, .LBB6_43 | |
| # %bb.5: # %if_then | |
| ld a0, 24(a0) | |
| slli a0, a0, 32 | |
| srli a0, a0, 32 | |
| addi a3, zero, 1 | |
| bne a0, a3, .LBB6_43 | |
| .LBB6_6: # %if_end | |
| # a7 = pointer at arg1+24, a0 = pointer at arg1+0 (stays live until the call), | |
| # a6/t1 = 32-bit words at arg0+12 / arg0+8, a3 = pointer at arg1+32. | |
| ld a7, 24(a2) | |
| ld a0, 0(a2) | |
| lwu a6, 12(a5) | |
| lwu t1, 8(a5) | |
| ld a3, 32(a2) | |
| beqz a3, .LBB6_11 | |
| # %bb.7: # %if_then3 | |
| # The arg1+32 pointer is non-null: its entries must read | |
| # 6272 (2*4096 - 1920), 196, 14, 1. | |
| lui s0, 2 | |
| addiw s0, s0, -1920 | |
| lw a4, 0(a3) | |
| bne a4, s0, .LBB6_44 | |
| # %bb.8: # %if_then3 | |
| ld a4, 8(a3) | |
| slli a4, a4, 32 | |
| srli a4, a4, 32 | |
| addi s0, zero, 196 | |
| bne a4, s0, .LBB6_44 | |
| # %bb.9: # %if_then3 | |
| ld a4, 16(a3) | |
| slli a4, a4, 32 | |
| srli a4, a4, 32 | |
| addi s0, zero, 14 | |
| bne a4, s0, .LBB6_44 | |
| # %bb.10: # %if_then3 | |
| ld a3, 24(a3) | |
| slli a3, a3, 32 | |
| srli a3, a3, 32 | |
| addi a4, zero, 1 | |
| bne a3, a4, .LBB6_44 | |
| .LBB6_11: # %if_end4 | |
| # arg0's type code must be <= 13 ... | |
| addi a3, zero, 13 | |
| bltu a3, t3, .LBB6_37 | |
| # %bb.12: # %if_end4 | |
| # ... and one of the codes selected by mask 0x2098 (bits 3, 4, 7, 13). | |
| addi a3, zero, 1 | |
| sll a3, a3, t3 | |
| lui a4, 2 | |
| addiw a4, a4, 152 | |
| and a3, a3, a4 | |
| beqz a3, .LBB6_37 | |
| # %bb.13: # %assert_end8 | |
| # Same two-step type-code test for arg1. | |
| addi a3, zero, 13 | |
| bltu a3, t0, .LBB6_38 | |
| # %bb.14: # %assert_end8 | |
| addi a3, zero, 1 | |
| sll a4, a3, t0 | |
| lui s0, 2 | |
| addiw s0, s0, 152 | |
| and a4, a4, s0 | |
| beqz a4, .LBB6_38 | |
| # %bb.15: # %assert_end10 | |
| # a3 is still 1 here: the word at arg0+8 must equal 1. | |
| bne t1, a3, .LBB6_45 | |
| # %bb.16: # %assert_end12 | |
| # The word at arg0+16 must be 4. | |
| lw a3, 16(a5) | |
| addi a4, zero, 4 | |
| bne a3, a4, .LBB6_46 | |
| # %bb.17: # %assert_end14 | |
| # Bytes arg0+20..23 must read: halfword@22 == 1, byte@21 == 32, byte@20 == 2. | |
| lhu a3, 22(a5) | |
| addi s0, zero, 1 | |
| bne a3, s0, .LBB6_47 | |
| # %bb.18: # %assert_end14 | |
| lbu a3, 21(a5) | |
| addi a4, zero, 32 | |
| bne a3, a4, .LBB6_47 | |
| # %bb.19: # %assert_end14 | |
| lbu a3, 20(a5) | |
| addi a4, zero, 2 | |
| bne a3, a4, .LBB6_47 | |
| # %bb.20: # %assert_end16 | |
| # The four 8-byte entries behind the arg0+24 pointer must be 1, 32, 28, 28 | |
| # (low 32 bits of each are compared). | |
| lw a3, 0(t2) | |
| addi s0, zero, 1 | |
| bne a3, s0, .LBB6_48 | |
| # %bb.21: # %assert_end18 | |
| lw a3, 8(t2) | |
| addi a4, zero, 32 | |
| bne a3, a4, .LBB6_49 | |
| # %bb.22: # %assert_end20 | |
| lw a4, 16(t2) | |
| addi a3, zero, 28 | |
| bne a4, a3, .LBB6_50 | |
| # %bb.23: # %assert_end22 | |
| lw a4, 24(t2) | |
| bne a4, a3, .LBB6_51 | |
| # %bb.24: # %assert_end24 | |
| # The 64-bit value at arg0+40 must be zero. | |
| ld a3, 40(a5) | |
| bnez a3, .LBB6_52 | |
| # %bb.25: # %assert_end26 | |
| # Repeat the +16, +20..23, +24 and +40 checks for arg1; its four entries | |
| # behind the +24 pointer must be 1, 32, 14, 14. | |
| lw a3, 16(a2) | |
| addi a4, zero, 4 | |
| bne a3, a4, .LBB6_53 | |
| # %bb.26: # %assert_end28 | |
| lhu a3, 22(a2) | |
| addi s0, zero, 1 | |
| bne a3, s0, .LBB6_54 | |
| # %bb.27: # %assert_end28 | |
| lbu a3, 21(a2) | |
| addi a4, zero, 32 | |
| bne a3, a4, .LBB6_54 | |
| # %bb.28: # %assert_end28 | |
| lbu a3, 20(a2) | |
| addi a4, zero, 2 | |
| bne a3, a4, .LBB6_54 | |
| # %bb.29: # %assert_end30 | |
| lw a3, 0(a7) | |
| addi s0, zero, 1 | |
| bne a3, s0, .LBB6_55 | |
| # %bb.30: # %assert_end32 | |
| lw a3, 8(a7) | |
| addi a4, zero, 32 | |
| bne a3, a4, .LBB6_56 | |
| # %bb.31: # %assert_end34 | |
| lw a4, 16(a7) | |
| addi a3, zero, 14 | |
| bne a4, a3, .LBB6_57 | |
| # %bb.32: # %assert_end36 | |
| lw a4, 24(a7) | |
| bne a4, a3, .LBB6_58 | |
| # %bb.33: # %assert_end38 | |
| ld a3, 40(a2) | |
| bnez a3, .LBB6_59 | |
| # %bb.34: # %assert_end40 | |
| # The word at arg1+8 must be 1 ... | |
| lw a3, 8(a2) | |
| addi s0, zero, 1 | |
| bne a3, s0, .LBB6_60 | |
| # %bb.35: # %assert_end42 | |
| # ... and the word at arg1+12 must match the one read from arg0+12 (a6). | |
| lw a2, 12(a2) | |
| sext.w a3, a6 | |
| bne a3, a2, .LBB6_62 | |
| # %bb.36: # %assert_end44 | |
| # All checks passed: a0 = pointer from arg1+0, a1 = pointer from arg0+0. | |
| call fuse_max_pool2d_compute_ | |
| mv a0, zero | |
| j .LBB6_41 | |
| # ---- Failure handlers: each loads the reporting callback into a1 and the | |
| # ---- address of its message into a0, then joins a shared tail. | |
| .LBB6_37: # %assert_fail7 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.63) | |
| addi a0, a0, %lo(.L.str.63) | |
| j .LBB6_39 | |
| .LBB6_38: # %assert_fail9 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.64) | |
| addi a0, a0, %lo(.L.str.64) | |
| .LBB6_39: # %assert_fail | |
| # Shared tail: report the message, then start building the -1 status. | |
| jalr a1 | |
| addi a0, zero, 1 | |
| slli a0, a0, 32 | |
| .LBB6_40: # %assert_fail15 | |
| # Every path arrives with a0 = 1 << 32, so a0 - 1 = 0x00000000FFFFFFFF. | |
| addi a0, a0, -1 | |
| # The status is a 32-bit int and RV64 returns such values sign-extended, so | |
| # widen it to a full 64-bit -1; the low 32 bits are unchanged. | |
| sext.w a0, a0 | |
| .LBB6_41: # %assert_fail15 | |
| # Common epilogue for the success and failure paths. | |
| ld s0, 0(sp) | |
| ld ra, 8(sp) | |
| .cfi_restore ra | |
| .cfi_restore s0 | |
| addi sp, sp, 16 | |
| .cfi_def_cfa_offset 0 | |
| ret | |
| .LBB6_42: # %assert_fail | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.60) | |
| addi a0, a0, %lo(.L.str.60) | |
| j .LBB6_39 | |
| .LBB6_43: # %assert_fail1 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.61) | |
| addi a0, a0, %lo(.L.str.61) | |
| j .LBB6_39 | |
| .LBB6_44: # %assert_fail5 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.62) | |
| addi a0, a0, %lo(.L.str.62) | |
| j .LBB6_39 | |
| .LBB6_45: # %assert_fail11 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.5) | |
| addi a0, a0, %lo(.L.str.5) | |
| j .LBB6_39 | |
| .LBB6_46: # %assert_fail13 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.29) | |
| addi a0, a0, %lo(.L.str.29) | |
| j .LBB6_39 | |
| .LBB6_47: # %assert_fail15 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.7) | |
| addi a0, a0, %lo(.L.str.7) | |
| j .LBB6_61 | |
| .LBB6_48: # %assert_fail17 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.8) | |
| addi a0, a0, %lo(.L.str.8) | |
| j .LBB6_61 | |
| .LBB6_49: # %assert_fail19 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.65) | |
| addi a0, a0, %lo(.L.str.65) | |
| j .LBB6_39 | |
| .LBB6_50: # %assert_fail21 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.31) | |
| addi a0, a0, %lo(.L.str.31) | |
| j .LBB6_39 | |
| .LBB6_51: # %assert_fail23 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.32) | |
| addi a0, a0, %lo(.L.str.32) | |
| j .LBB6_39 | |
| .LBB6_52: # %assert_fail25 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.10) | |
| addi a0, a0, %lo(.L.str.10) | |
| j .LBB6_39 | |
| .LBB6_53: # %assert_fail27 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.11) | |
| addi a0, a0, %lo(.L.str.11) | |
| j .LBB6_39 | |
| .LBB6_54: # %assert_fail29 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.12) | |
| addi a0, a0, %lo(.L.str.12) | |
| j .LBB6_61 | |
| .LBB6_55: # %assert_fail31 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.13) | |
| addi a0, a0, %lo(.L.str.13) | |
| j .LBB6_61 | |
| .LBB6_56: # %assert_fail33 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.66) | |
| addi a0, a0, %lo(.L.str.66) | |
| j .LBB6_39 | |
| .LBB6_57: # %assert_fail35 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.67) | |
| addi a0, a0, %lo(.L.str.67) | |
| j .LBB6_39 | |
| .LBB6_58: # %assert_fail37 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.68) | |
| addi a0, a0, %lo(.L.str.68) | |
| j .LBB6_39 | |
| .LBB6_59: # %assert_fail39 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.17) | |
| addi a0, a0, %lo(.L.str.17) | |
| j .LBB6_39 | |
| .LBB6_60: # %assert_fail41 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.18) | |
| addi a0, a0, %lo(.L.str.18) | |
| .LBB6_61: # %assert_fail15 | |
| # Variant tail for checks that left the constant 1 in callee-saved s0. | |
| jalr a1 | |
| slli a0, s0, 32 | |
| j .LBB6_40 | |
| .LBB6_62: # %assert_fail43 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.19) | |
| addi a0, a0, %lo(.L.str.19) | |
| j .LBB6_39 | |
| .Lfunc_end6: | |
| .size fuse_max_pool2d, .Lfunc_end6-fuse_max_pool2d | |
| .cfi_endproc | |
| # -- End function | |
| .section .sdata,"aw",@progbits | |
| .p2align 2 # -- Begin function fuse_max_pool2d_compute_ | |
| .LCPI7_0: | |
| .word 0xff7fffff # float -3.40282347E+38, the initial running maximum | |
| .text | |
| .type fuse_max_pool2d_compute_,@function | |
| .globl fuse_max_pool2d_compute_ | |
| .p2align 2 | |
| # fuse_max_pool2d_compute_: 2x2 window, stride-2 maximum over float data. | |
| # In: a0 = output cursor, a1 = input base pointer. | |
| # Loop nest: 32 planes x 14 output rows x 14 output columns. | |
| # input advances 8 bytes per column, 224 per row, 3136 per plane | |
| # output advances 4 bytes per column, 56 per row, 784 per plane | |
| # Each output takes four input taps at byte offsets 0, 4, 112 and 116 from | |
| # the window origin; the code keeps the cursor biased by +4, hence the | |
| # -4 / 0 / 108 / 112 displacements. | |
| # The selection stays compare-and-branch (flt.s) rather than fmax.s so that | |
| # results for unordered (NaN) inputs are exactly those of the original code. | |
| # Leaf routine: no stack frame, only a*/t*/ft* temporaries are written. | |
| fuse_max_pool2d_compute_: # @fuse_max_pool2d_compute_ | |
| # t0 = input cursor for the current plane, biased by +4 (a1 is reused below). | |
| addi t0, a1, 4 | |
| # ft0 = starting value for every window. | |
| lui a1, %hi(.LCPI7_0) | |
| addi a1, a1, %lo(.LCPI7_0) | |
| flw ft0, 0(a1) | |
| # Loop bounds and strides. | |
| lui a1, 1 | |
| addiw a7, a1, -960 # a7 = 4096 - 960 = 3136 input bytes per plane | |
| addi a6, zero, 32 # a6 = plane count | |
| addi t2, zero, 14 # t2 = output rows per plane | |
| addi a2, zero, 56 # a2 = output bytes per row (14 floats) | |
| mv t1, zero # t1 = plane index | |
| .Lpool_plane: | |
| mv t3, t0 # t3 = input cursor for the current row pair | |
| mv a4, a0 # a4 = output row base | |
| mv t4, zero # t4 = output row index | |
| .Lpool_row: | |
| mv a1, t3 # a1 = input cursor for the current window | |
| mv a3, zero # a3 = byte offset inside the output row | |
| .Lpool_window: | |
| # Tap 0: ft1 = ft0 if tap < ft0, otherwise the tap itself. | |
| flw ft2, -4(a1) | |
| flt.s a5, ft2, ft0 | |
| fmv.s ft1, ft0 | |
| bnez a5, .Lpool_tap1 | |
| fmv.s ft1, ft2 | |
| .Lpool_tap1: | |
| # Taps 1-3: keep ft1 when tap < ft1, otherwise take the tap. | |
| flw ft2, 0(a1) | |
| flt.s a5, ft2, ft1 | |
| bnez a5, .Lpool_tap2 | |
| fmv.s ft1, ft2 | |
| .Lpool_tap2: | |
| flw ft2, 108(a1) | |
| flt.s a5, ft2, ft1 | |
| bnez a5, .Lpool_tap3 | |
| fmv.s ft1, ft2 | |
| .Lpool_tap3: | |
| flw ft2, 112(a1) | |
| flt.s a5, ft2, ft1 | |
| bnez a5, .Lpool_store | |
| fmv.s ft1, ft2 | |
| .Lpool_store: | |
| # Write the window result, then step to the next window of this row. | |
| add a5, a4, a3 | |
| fsw ft1, 0(a5) | |
| addi a1, a1, 8 | |
| addi a3, a3, 4 | |
| bne a3, a2, .Lpool_window | |
| # Row finished: move the input down two rows and the output down one. | |
| addi t3, t3, 224 | |
| addi a4, a4, 56 | |
| addi t4, t4, 1 | |
| bne t4, t2, .Lpool_row | |
| # Plane finished: advance both plane cursors. | |
| add t0, t0, a7 | |
| addi a0, a0, 784 | |
| addi t1, t1, 1 | |
| bne t1, a6, .Lpool_plane | |
| ret | |
| .Lfunc_end7: | |
| .size fuse_max_pool2d_compute_, .Lfunc_end7-fuse_max_pool2d_compute_ | |
| # -- End function | |
| .globl fuse_conv2d_1 # -- Begin function fuse_conv2d_1 | |
| .p2align 2 | |
| .type fuse_conv2d_1,@function | |
| fuse_conv2d_1: # @fuse_conv2d_1 | |
| .cfi_startproc | |
| # %bb.0: # %entry | |
| addi sp, sp, -64 | |
| .cfi_def_cfa_offset 64 | |
| sd ra, 56(sp) | |
| sd s0, 48(sp) | |
| sd s1, 40(sp) | |
| sd s2, 32(sp) | |
| sd s3, 24(sp) | |
| sd s4, 16(sp) | |
| sd s5, 8(sp) | |
| .cfi_offset ra, -8 | |
| .cfi_offset s0, -16 | |
| .cfi_offset s1, -24 | |
| .cfi_offset s2, -32 | |
| .cfi_offset s3, -40 | |
| .cfi_offset s4, -48 | |
| .cfi_offset s5, -56 | |
| slli a2, a2, 32 | |
| srli a2, a2, 32 | |
| addi a3, zero, 4 | |
| bne a2, a3, .LBB8_74 | |
| # %bb.1: # %assert_end | |
| lwu t5, 12(a1) | |
| ld a6, 24(a0) | |
| lwu t6, 8(a1) | |
| ld a7, 16(a0) | |
| lwu s3, 4(a1) | |
| ld t3, 8(a0) | |
| lwu s4, 0(a1) | |
| ld s5, 0(a0) | |
| ld t4, 24(s5) | |
| ld a0, 0(s5) | |
| ld a1, 32(s5) | |
| beqz a1, .LBB8_6 | |
| # %bb.2: # %if_then | |
| lui a2, 2 | |
| addiw a2, a2, -1920 | |
| lw a3, 0(a1) | |
| bne a3, a2, .LBB8_75 | |
| # %bb.3: # %if_then | |
| ld a2, 8(a1) | |
| slli a2, a2, 32 | |
| srli a2, a2, 32 | |
| addi a3, zero, 196 | |
| bne a2, a3, .LBB8_75 | |
| # %bb.4: # %if_then | |
| ld a2, 16(a1) | |
| slli a2, a2, 32 | |
| srli a2, a2, 32 | |
| addi a3, zero, 14 | |
| bne a2, a3, .LBB8_75 | |
| # %bb.5: # %if_then | |
| ld a1, 24(a1) | |
| slli a1, a1, 32 | |
| srli a1, a1, 32 | |
| addi a2, zero, 1 | |
| bne a1, a2, .LBB8_75 | |
| .LBB8_6: # %if_end | |
| ld t2, 24(t3) | |
| ld a1, 0(t3) | |
| lwu a4, 12(s5) | |
| lwu s2, 8(s5) | |
| ld a2, 32(t3) | |
| beqz a2, .LBB8_11 | |
| # %bb.7: # %if_then3 | |
| lw a3, 0(a2) | |
| addi s0, zero, 800 | |
| bne a3, s0, .LBB8_76 | |
| # %bb.8: # %if_then3 | |
| ld a3, 8(a2) | |
| slli a3, a3, 32 | |
| srli a3, a3, 32 | |
| addi s0, zero, 25 | |
| bne a3, s0, .LBB8_76 | |
| # %bb.9: # %if_then3 | |
| ld a3, 16(a2) | |
| slli a3, a3, 32 | |
| srli a3, a3, 32 | |
| addi s0, zero, 5 | |
| bne a3, s0, .LBB8_76 | |
| # %bb.10: # %if_then3 | |
| ld a2, 24(a2) | |
| slli a2, a2, 32 | |
| srli a2, a2, 32 | |
| addi a3, zero, 1 | |
| bne a2, a3, .LBB8_76 | |
| .LBB8_11: # %if_end4 | |
| ld t1, 24(a7) | |
| ld a3, 0(a7) | |
| ld a2, 32(a7) | |
| beqz a2, .LBB8_13 | |
| # %bb.12: # %if_then7 | |
| lw a2, 0(a2) | |
| addi s0, zero, 1 | |
| bne a2, s0, .LBB8_77 | |
| .LBB8_13: # %if_end8 | |
| ld t0, 24(a6) | |
| ld a2, 0(a6) | |
| ld s0, 32(a6) | |
| beqz s0, .LBB8_18 | |
| # %bb.14: # %if_then11 | |
| lui s1, 3 | |
| addiw s1, s1, 256 | |
| lw a5, 0(s0) | |
| bne a5, s1, .LBB8_78 | |
| # %bb.15: # %if_then11 | |
| ld a5, 8(s0) | |
| slli a5, a5, 32 | |
| srli a5, a5, 32 | |
| addi s1, zero, 196 | |
| bne a5, s1, .LBB8_78 | |
| # %bb.16: # %if_then11 | |
| ld a5, 16(s0) | |
| slli a5, a5, 32 | |
| srli a5, a5, 32 | |
| addi s1, zero, 14 | |
| bne a5, s1, .LBB8_78 | |
| # %bb.17: # %if_then11 | |
| ld a5, 24(s0) | |
| slli a5, a5, 32 | |
| srli a5, a5, 32 | |
| addi s0, zero, 1 | |
| bne a5, s0, .LBB8_78 | |
| .LBB8_18: # %if_end12 | |
| addi a5, zero, 13 | |
| bltu a5, s4, .LBB8_67 | |
| # %bb.19: # %if_end12 | |
| addi a5, zero, 1 | |
| sll a5, a5, s4 | |
| lui s0, 2 | |
| addiw s0, s0, 152 | |
| and a5, a5, s0 | |
| beqz a5, .LBB8_67 | |
| # %bb.20: # %assert_end16 | |
| addi a5, zero, 13 | |
| bltu a5, s3, .LBB8_68 | |
| # %bb.21: # %assert_end16 | |
| addi a5, zero, 1 | |
| sll a5, a5, s3 | |
| lui s0, 2 | |
| addiw s0, s0, 152 | |
| and a5, a5, s0 | |
| beqz a5, .LBB8_68 | |
| # %bb.22: # %assert_end18 | |
| addi a5, zero, 13 | |
| bltu a5, t6, .LBB8_69 | |
| # %bb.23: # %assert_end18 | |
| addi a5, zero, 1 | |
| sll a5, a5, t6 | |
| lui s1, 2 | |
| addiw s1, s1, 152 | |
| and a5, a5, s1 | |
| beqz a5, .LBB8_69 | |
| # %bb.24: # %assert_end20 | |
| addi a5, zero, 13 | |
| bltu a5, t5, .LBB8_70 | |
| # %bb.25: # %assert_end20 | |
| addi s1, zero, 1 | |
| sll a5, s1, t5 | |
| lui s0, 2 | |
| addiw s0, s0, 152 | |
| and a5, a5, s0 | |
| beqz a5, .LBB8_70 | |
| # %bb.26: # %assert_end22 | |
| bne s2, s1, .LBB8_79 | |
| # %bb.27: # %assert_end24 | |
| lw a5, 16(s5) | |
| addi s1, zero, 4 | |
| bne a5, s1, .LBB8_80 | |
| # %bb.28: # %assert_end26 | |
| lhu a5, 22(s5) | |
| addi s0, zero, 1 | |
| bne a5, s0, .LBB8_81 | |
| # %bb.29: # %assert_end26 | |
| lbu a5, 21(s5) | |
| addi s1, zero, 32 | |
| bne a5, s1, .LBB8_81 | |
| # %bb.30: # %assert_end26 | |
| lbu a5, 20(s5) | |
| addi s1, zero, 2 | |
| bne a5, s1, .LBB8_81 | |
| # %bb.31: # %assert_end28 | |
| lw a5, 0(t4) | |
| addi s0, zero, 1 | |
| bne a5, s0, .LBB8_82 | |
| # %bb.32: # %assert_end30 | |
| lw a5, 8(t4) | |
| addi s1, zero, 32 | |
| bne a5, s1, .LBB8_83 | |
| # %bb.33: # %assert_end32 | |
| lw a5, 16(t4) | |
| addi s1, zero, 14 | |
| bne a5, s1, .LBB8_84 | |
| # %bb.34: # %assert_end34 | |
| lw a5, 24(t4) | |
| bne a5, s1, .LBB8_85 | |
| # %bb.35: # %assert_end36 | |
| ld a5, 40(s5) | |
| bnez a5, .LBB8_86 | |
| # %bb.36: # %assert_end38 | |
| lw a5, 16(t3) | |
| addi s1, zero, 4 | |
| bne a5, s1, .LBB8_87 | |
| # %bb.37: # %assert_end40 | |
| lhu a5, 22(t3) | |
| addi s0, zero, 1 | |
| bne a5, s0, .LBB8_88 | |
| # %bb.38: # %assert_end40 | |
| lbu a5, 21(t3) | |
| addi s1, zero, 32 | |
| bne a5, s1, .LBB8_88 | |
| # %bb.39: # %assert_end40 | |
| lbu a5, 20(t3) | |
| addi s1, zero, 2 | |
| bne a5, s1, .LBB8_88 | |
| # %bb.40: # %assert_end42 | |
| lw a5, 0(t2) | |
| addi s1, zero, 64 | |
| bne a5, s1, .LBB8_89 | |
| # %bb.41: # %assert_end44 | |
| lw a5, 8(t2) | |
| addi s1, zero, 32 | |
| bne a5, s1, .LBB8_90 | |
| # %bb.42: # %assert_end46 | |
| lw s1, 16(t2) | |
| addi a5, zero, 5 | |
| bne s1, a5, .LBB8_91 | |
| # %bb.43: # %assert_end48 | |
| lw s1, 24(t2) | |
| bne s1, a5, .LBB8_92 | |
| # %bb.44: # %assert_end50 | |
| ld a5, 40(t3) | |
| bnez a5, .LBB8_93 | |
| # %bb.45: # %assert_end52 | |
| lw a5, 8(t3) | |
| addi s0, zero, 1 | |
| bne a5, s0, .LBB8_94 | |
| # %bb.46: # %assert_end54 | |
| lw s1, 12(t3) | |
| sext.w a5, a4 | |
| bne a5, s1, .LBB8_95 | |
| # %bb.47: # %assert_end56 | |
| lw s1, 16(a7) | |
| addi s0, zero, 1 | |
| bne s1, s0, .LBB8_96 | |
| # %bb.48: # %assert_end58 | |
| lhu s1, 22(a7) | |
| bne s1, s0, .LBB8_97 | |
| # %bb.49: # %assert_end58 | |
| lbu s1, 21(a7) | |
| addi s0, zero, 32 | |
| bne s1, s0, .LBB8_97 | |
| # %bb.50: # %assert_end58 | |
| lbu s1, 20(a7) | |
| addi s0, zero, 2 | |
| bne s1, s0, .LBB8_97 | |
| # %bb.51: # %assert_end60 | |
| lw s1, 0(t1) | |
| addi s0, zero, 64 | |
| bne s1, s0, .LBB8_98 | |
| # %bb.52: # %assert_end62 | |
| ld s1, 40(a7) | |
| bnez s1, .LBB8_99 | |
| # %bb.53: # %assert_end64 | |
| lw s1, 8(a7) | |
| addi s0, zero, 1 | |
| bne s1, s0, .LBB8_100 | |
| # %bb.54: # %assert_end66 | |
| lw s1, 12(a7) | |
| bne a5, s1, .LBB8_101 | |
| # %bb.55: # %assert_end68 | |
| lw s1, 16(a6) | |
| addi s0, zero, 4 | |
| bne s1, s0, .LBB8_102 | |
| # %bb.56: # %assert_end70 | |
| lhu s1, 22(a6) | |
| addi s2, zero, 1 | |
| bne s1, s2, .LBB8_103 | |
| # %bb.57: # %assert_end70 | |
| lbu s1, 21(a6) | |
| addi s0, zero, 32 | |
| bne s1, s0, .LBB8_103 | |
| # %bb.58: # %assert_end70 | |
| lbu s1, 20(a6) | |
| addi s0, zero, 2 | |
| bne s1, s0, .LBB8_103 | |
| # %bb.59: # %assert_end72 | |
| lw s1, 0(t0) | |
| addi s0, zero, 1 | |
| bne s1, s0, .LBB8_104 | |
| # %bb.60: # %assert_end74 | |
| lw s1, 8(t0) | |
| addi s0, zero, 64 | |
| bne s1, s0, .LBB8_105 | |
| # %bb.61: # %assert_end76 | |
| lw s0, 16(t0) | |
| addi s1, zero, 14 | |
| bne s0, s1, .LBB8_106 | |
| # %bb.62: # %assert_end78 | |
| lw s0, 24(t0) | |
| bne s0, s1, .LBB8_107 | |
| # %bb.63: # %assert_end80 | |
| ld s1, 40(a6) | |
| bnez s1, .LBB8_108 | |
| # %bb.64: # %assert_end82 | |
| lw s1, 8(a6) | |
| addi s0, zero, 1 | |
| bne s1, s0, .LBB8_109 | |
| # %bb.65: # %assert_end84 | |
| lw s1, 12(a6) | |
| bne a5, s1, .LBB8_111 | |
| # %bb.66: # %assert_end86 | |
| call fuse_conv2d_1_compute_ | |
| mv a0, zero | |
| j .LBB8_73 | |
| .LBB8_67: # %assert_fail15 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.73) | |
| addi a0, a0, %lo(.L.str.73) | |
| j .LBB8_71 | |
| .LBB8_68: # %assert_fail17 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.74) | |
| addi a0, a0, %lo(.L.str.74) | |
| j .LBB8_71 | |
| .LBB8_69: # %assert_fail19 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.75) | |
| addi a0, a0, %lo(.L.str.75) | |
| j .LBB8_71 | |
| .LBB8_70: # %assert_fail21 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.76) | |
| addi a0, a0, %lo(.L.str.76) | |
| .LBB8_71: # %assert_fail | |
| jalr a1 | |
| addi a0, zero, 1 | |
| slli a0, a0, 32 | |
| .LBB8_72: # %assert_fail9 | |
| addi a0, a0, -1 | |
| .LBB8_73: # %assert_fail9 | |
| ld s5, 8(sp) | |
| ld s4, 16(sp) | |
| ld s3, 24(sp) | |
| ld s2, 32(sp) | |
| ld s1, 40(sp) | |
| ld s0, 48(sp) | |
| ld ra, 56(sp) | |
| .cfi_restore ra | |
| .cfi_restore s0 | |
| .cfi_restore s1 | |
| .cfi_restore s2 | |
| .cfi_restore s3 | |
| .cfi_restore s4 | |
| .cfi_restore s5 | |
| addi sp, sp, 64 | |
| .cfi_def_cfa_offset 0 | |
| ret | |
| .LBB8_74: # %assert_fail | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.69) | |
| addi a0, a0, %lo(.L.str.69) | |
| j .LBB8_71 | |
| .LBB8_75: # %assert_fail1 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.70) | |
| addi a0, a0, %lo(.L.str.70) | |
| j .LBB8_71 | |
| .LBB8_76: # %assert_fail5 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.71) | |
| addi a0, a0, %lo(.L.str.71) | |
| j .LBB8_71 | |
| .LBB8_77: # %assert_fail9 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.23) | |
| addi a0, a0, %lo(.L.str.23) | |
| j .LBB8_110 | |
| .LBB8_78: # %assert_fail13 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.72) | |
| addi a0, a0, %lo(.L.str.72) | |
| j .LBB8_71 | |
| .LBB8_79: # %assert_fail23 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.5) | |
| addi a0, a0, %lo(.L.str.5) | |
| j .LBB8_71 | |
| .LBB8_80: # %assert_fail25 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.29) | |
| addi a0, a0, %lo(.L.str.29) | |
| j .LBB8_71 | |
| .LBB8_81: # %assert_fail27 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.7) | |
| addi a0, a0, %lo(.L.str.7) | |
| j .LBB8_110 | |
| .LBB8_82: # %assert_fail29 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.8) | |
| addi a0, a0, %lo(.L.str.8) | |
| j .LBB8_110 | |
| .LBB8_83: # %assert_fail31 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.65) | |
| addi a0, a0, %lo(.L.str.65) | |
| j .LBB8_71 | |
| .LBB8_84: # %assert_fail33 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.77) | |
| addi a0, a0, %lo(.L.str.77) | |
| j .LBB8_71 | |
| .LBB8_85: # %assert_fail35 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.78) | |
| addi a0, a0, %lo(.L.str.78) | |
| j .LBB8_71 | |
| .LBB8_86: # %assert_fail37 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.10) | |
| addi a0, a0, %lo(.L.str.10) | |
| j .LBB8_71 | |
| .LBB8_87: # %assert_fail39 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.11) | |
| addi a0, a0, %lo(.L.str.11) | |
| j .LBB8_71 | |
| .LBB8_88: # %assert_fail41 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.12) | |
| addi a0, a0, %lo(.L.str.12) | |
| j .LBB8_110 | |
| .LBB8_89: # %assert_fail43 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.79) | |
| addi a0, a0, %lo(.L.str.79) | |
| j .LBB8_71 | |
| .LBB8_90: # %assert_fail45 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.66) | |
| addi a0, a0, %lo(.L.str.66) | |
| j .LBB8_71 | |
| .LBB8_91: # %assert_fail47 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.34) | |
| addi a0, a0, %lo(.L.str.34) | |
| j .LBB8_71 | |
| .LBB8_92: # %assert_fail49 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.35) | |
| addi a0, a0, %lo(.L.str.35) | |
| j .LBB8_71 | |
| .LBB8_93: # %assert_fail51 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.17) | |
| addi a0, a0, %lo(.L.str.17) | |
| j .LBB8_71 | |
| .LBB8_94: # %assert_fail53 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.18) | |
| addi a0, a0, %lo(.L.str.18) | |
| j .LBB8_110 | |
| .LBB8_95: # %assert_fail55 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.19) | |
| addi a0, a0, %lo(.L.str.19) | |
| j .LBB8_71 | |
| .LBB8_96: # %assert_fail57 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.36) | |
| addi a0, a0, %lo(.L.str.36) | |
| j .LBB8_110 | |
| .LBB8_97: # %assert_fail59 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.37) | |
| addi a0, a0, %lo(.L.str.37) | |
| j .LBB8_71 | |
| .LBB8_98: # %assert_fail61 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.80) | |
| addi a0, a0, %lo(.L.str.80) | |
| j .LBB8_71 | |
| .LBB8_99: # %assert_fail63 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.39) | |
| addi a0, a0, %lo(.L.str.39) | |
| j .LBB8_71 | |
| .LBB8_100: # %assert_fail65 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.40) | |
| addi a0, a0, %lo(.L.str.40) | |
| j .LBB8_110 | |
| .LBB8_101: # %assert_fail67 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.41) | |
| addi a0, a0, %lo(.L.str.41) | |
| j .LBB8_71 | |
| .LBB8_102: # %assert_fail69 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.42) | |
| addi a0, a0, %lo(.L.str.42) | |
| j .LBB8_71 | |
| .LBB8_103: # %assert_fail71 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.43) | |
| addi a0, a0, %lo(.L.str.43) | |
| jalr a1 | |
| slli a0, s2, 32 | |
| j .LBB8_72 | |
| .LBB8_104: # %assert_fail73 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.44) | |
| addi a0, a0, %lo(.L.str.44) | |
| j .LBB8_110 | |
| .LBB8_105: # %assert_fail75 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.81) | |
| addi a0, a0, %lo(.L.str.81) | |
| j .LBB8_71 | |
| .LBB8_106: # %assert_fail77 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.82) | |
| addi a0, a0, %lo(.L.str.82) | |
| j .LBB8_71 | |
| .LBB8_107: # %assert_fail79 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.83) | |
| addi a0, a0, %lo(.L.str.83) | |
| j .LBB8_71 | |
| .LBB8_108: # %assert_fail81 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.48) | |
| addi a0, a0, %lo(.L.str.48) | |
| j .LBB8_71 | |
| .LBB8_109: # %assert_fail83 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.49) | |
| addi a0, a0, %lo(.L.str.49) | |
| .LBB8_110: # %assert_fail9 | |
| jalr a1 | |
| slli a0, s0, 32 | |
| j .LBB8_72 | |
| .LBB8_111: # %assert_fail85 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.50) | |
| addi a0, a0, %lo(.L.str.50) | |
| j .LBB8_71 | |
| .Lfunc_end8: | |
| .size fuse_conv2d_1, .Lfunc_end8-fuse_conv2d_1 | |
| .cfi_endproc | |
| # -- End function | |
| .globl fuse_conv2d_1_compute_ # -- Begin function fuse_conv2d_1_compute_ | |
| .p2align 2 | |
| .type fuse_conv2d_1_compute_,@function | |
| fuse_conv2d_1_compute_: # @fuse_conv2d_1_compute_ | |
| .cfi_startproc | |
| # %bb.0: # %entry | |
| addi sp, sp, -320 | |
| .cfi_def_cfa_offset 320 | |
| sd ra, 312(sp) | |
| sd s0, 304(sp) | |
| sd s1, 296(sp) | |
| sd s2, 288(sp) | |
| sd s3, 280(sp) | |
| sd s4, 272(sp) | |
| sd s5, 264(sp) | |
| sd s6, 256(sp) | |
| sd s7, 248(sp) | |
| sd s8, 240(sp) | |
| sd s9, 232(sp) | |
| sd s10, 224(sp) | |
| sd s11, 216(sp) | |
| .cfi_offset ra, -8 | |
| .cfi_offset s0, -16 | |
| .cfi_offset s1, -24 | |
| .cfi_offset s2, -32 | |
| .cfi_offset s3, -40 | |
| .cfi_offset s4, -48 | |
| .cfi_offset s5, -56 | |
| .cfi_offset s6, -64 | |
| .cfi_offset s7, -72 | |
| .cfi_offset s8, -80 | |
| .cfi_offset s9, -88 | |
| .cfi_offset s10, -96 | |
| .cfi_offset s11, -104 | |
| sd a3, 32(sp) | |
| sd a2, 24(sp) | |
| mv s11, a1 | |
| mv s6, a0 | |
| lui a0, 50 | |
| call _Znam | |
| mv s0, a0 | |
| lui a0, 10 | |
| addiw a0, a0, 512 | |
| call _Znam | |
| mv s8, a0 | |
| lui a0, 12 | |
| addiw a0, a0, 1024 | |
| call _Znam | |
| mv s9, a0 | |
| addi s2, s6, -112 | |
| sd s0, 56(sp) | |
| addi s4, s0, 36 | |
| addi s5, zero, 14 | |
| addi s6, zero, 18 | |
| addi s7, zero, 32 | |
| mv s3, zero | |
| .LBB9_1: # %for_begin5.preheader | |
| # =>This Inner Loop Header: Depth=1 | |
| mv s0, s2 | |
| mv s1, s4 | |
| mv s10, zero | |
| addiw a0, s10, -2 | |
| bltu a0, s5, .LBB9_5 | |
| .LBB9_2: # %for_body9.preheader | |
| # in Loop: Header=BB9_1 Depth=1 | |
| addi a0, s1, -36 | |
| mv a1, zero | |
| addi a2, zero, 72 | |
| call memset | |
| .LBB9_3: # %for_end10 | |
| # in Loop: Header=BB9_1 Depth=1 | |
| addi s0, s0, 56 | |
| addi s1, s1, 72 | |
| addi s10, s10, 1 | |
| beq s10, s6, .LBB9_6 | |
| # %bb.4: # %for_begin8.preheader | |
| # in Loop: Header=BB9_1 Depth=1 | |
| addiw a0, s10, -2 | |
| bgeu a0, s5, .LBB9_2 | |
| .LBB9_5: # %if_end12.us.17 | |
| # in Loop: Header=BB9_1 Depth=1 | |
| sw zero, -32(s1) | |
| sw zero, -36(s1) | |
| flw ft0, 0(s0) | |
| fsw ft0, -28(s1) | |
| flw ft0, 4(s0) | |
| fsw ft0, -24(s1) | |
| flw ft0, 8(s0) | |
| fsw ft0, -20(s1) | |
| flw ft0, 12(s0) | |
| fsw ft0, -16(s1) | |
| flw ft0, 16(s0) | |
| fsw ft0, -12(s1) | |
| flw ft0, 20(s0) | |
| fsw ft0, -8(s1) | |
| flw ft0, 24(s0) | |
| fsw ft0, -4(s1) | |
| flw ft0, 28(s0) | |
| fsw ft0, 0(s1) | |
| flw ft0, 32(s0) | |
| fsw ft0, 4(s1) | |
| flw ft0, 36(s0) | |
| fsw ft0, 8(s1) | |
| flw ft0, 40(s0) | |
| fsw ft0, 12(s1) | |
| flw ft0, 44(s0) | |
| fsw ft0, 16(s1) | |
| flw ft0, 48(s0) | |
| fsw ft0, 20(s1) | |
| flw ft0, 52(s0) | |
| sw zero, 32(s1) | |
| sw zero, 28(s1) | |
| fsw ft0, 24(s1) | |
| j .LBB9_3 | |
| .LBB9_6: # %for_end7 | |
| # in Loop: Header=BB9_1 Depth=1 | |
| addi s2, s2, 784 | |
| addi s4, s4, 1296 | |
| addi s3, s3, 1 | |
| bne s3, s7, .LBB9_1 | |
| # %bb.7: # %for_begin13.preheader | |
| ld a0, 56(sp) | |
| addi t0, a0, 36 | |
| addi a1, zero, 644 | |
| addi t3, zero, 18 | |
| lui a0, 3 | |
| addiw a7, a0, -1920 | |
| addi a6, zero, 4 | |
| mv t2, zero | |
| mv t1, zero | |
| .LBB9_8: # %for_begin16.preheader | |
| # =>This Loop Header: Depth=1 | |
| # Child Loop BB9_9 Depth 2 | |
| # Child Loop BB9_10 Depth 3 | |
| mv a4, t0 | |
| mv a5, t2 | |
| mv a3, zero | |
| .LBB9_9: # %for_begin19.preheader | |
| # Parent Loop BB9_8 Depth=1 | |
| # => This Loop Header: Depth=2 | |
| # Child Loop BB9_10 Depth 3 | |
| add s0, s8, a5 | |
| addi s1, zero, 68 | |
| mv a0, a4 | |
| .LBB9_10: # %for_begin22.preheader | |
| # Parent Loop BB9_8 Depth=1 | |
| # Parent Loop BB9_9 Depth=2 | |
| # => This Inner Loop Header: Depth=3 | |
| add a2, s0, s1 | |
| flw ft0, -36(a0) | |
| fsw ft0, -68(a2) | |
| flw ft0, -32(a0) | |
| fsw ft0, -64(a2) | |
| flw ft0, -28(a0) | |
| fsw ft0, -60(a2) | |
| flw ft0, -24(a0) | |
| fsw ft0, -56(a2) | |
| flw ft0, -20(a0) | |
| fsw ft0, -52(a2) | |
| flw ft0, -16(a0) | |
| fsw ft0, -48(a2) | |
| flw ft0, -12(a0) | |
| fsw ft0, -44(a2) | |
| flw ft0, -8(a0) | |
| fsw ft0, -40(a2) | |
| flw ft0, -4(a0) | |
| fsw ft0, -36(a2) | |
| flw ft0, 0(a0) | |
| fsw ft0, -32(a2) | |
| flw ft0, 4(a0) | |
| fsw ft0, -28(a2) | |
| flw ft0, 8(a0) | |
| fsw ft0, -24(a2) | |
| flw ft0, 12(a0) | |
| fsw ft0, -20(a2) | |
| flw ft0, 16(a0) | |
| fsw ft0, -16(a2) | |
| flw ft0, 20(a0) | |
| fsw ft0, -12(a2) | |
| flw ft0, 24(a0) | |
| fsw ft0, -8(a2) | |
| flw ft0, 28(a0) | |
| fsw ft0, -4(a2) | |
| flw ft0, 32(a0) | |
| fsw ft0, 0(a2) | |
| addi a0, a0, 1296 | |
| addi s1, s1, 72 | |
| bne s1, a1, .LBB9_10 | |
| # %bb.11: # %for_end21 | |
| # in Loop: Header=BB9_9 Depth=2 | |
| addi a4, a4, 72 | |
| addi a5, a5, 576 | |
| addi a3, a3, 1 | |
| bne a3, t3, .LBB9_9 | |
| # %bb.12: # %for_end18 | |
| # in Loop: Header=BB9_8 Depth=1 | |
| add t0, t0, a7 | |
| add t2, t2, a7 | |
| addi t1, t1, 1 | |
| bne t1, a6, .LBB9_8 | |
| # %bb.13: # %for_begin25.preheader | |
| lui a0, 1 | |
| addiw a0, a0, -896 | |
| lui a1, 3 | |
| addiw a6, a1, 512 | |
| add t0, s11, a0 | |
| lui a0, 5 | |
| addiw a7, a0, 1920 | |
| addiw a0, a0, -1280 | |
| lui a3, 4 | |
| addiw a3, a3, -384 | |
| lui a4, 2 | |
| addiw a5, a4, 1408 | |
| addiw a4, a4, -1792 | |
| sd a4, 120(sp) | |
| add t1, s11, a4 | |
| add s2, s11, a5 | |
| add s4, s11, a6 | |
| add t5, s11, a3 | |
| add s1, s11, a0 | |
| add s6, s11, a7 | |
| ld a0, 56(sp) | |
| addi t6, a0, 16 | |
| addi a4, zero, 800 | |
| addi a5, zero, 5 | |
| lui a0, 6 | |
| addiw a0, a0, 1024 | |
| sd a0, 16(sp) | |
| mv a2, zero | |
| .LBB9_14: # %for_begin28.preheader | |
| # =>This Loop Header: Depth=1 | |
| # Child Loop BB9_15 Depth 2 | |
| # Child Loop BB9_16 Depth 3 | |
| # Child Loop BB9_17 Depth 4 | |
| # Child Loop BB9_18 Depth 5 | |
| sd a2, 8(sp) | |
| sd t6, 40(sp) | |
| sd s11, 112(sp) | |
| mv s5, s11 | |
| sd t0, 104(sp) | |
| sd t1, 96(sp) | |
| sd s2, 88(sp) | |
| sd s4, 80(sp) | |
| sd t5, 72(sp) | |
| sd s1, 64(sp) | |
| mv a7, s1 | |
| sd s6, 48(sp) | |
| mv a2, zero | |
| .LBB9_15: # %for_begin31.preheader | |
| # Parent Loop BB9_14 Depth=1 | |
| # => This Loop Header: Depth=2 | |
| # Child Loop BB9_16 Depth 3 | |
| # Child Loop BB9_17 Depth 4 | |
| # Child Loop BB9_18 Depth 5 | |
| sd a2, 128(sp) | |
| sd t6, 200(sp) | |
| sd s5, 192(sp) | |
| sd t0, 184(sp) | |
| sd t1, 176(sp) | |
| sd s2, 168(sp) | |
| sd s4, 160(sp) | |
| sd t5, 152(sp) | |
| sd a7, 144(sp) | |
| sd s6, 136(sp) | |
| mv s7, zero | |
| .LBB9_16: # %for_begin34.preheader | |
| # Parent Loop BB9_14 Depth=1 | |
| # Parent Loop BB9_15 Depth=2 | |
| # => This Loop Header: Depth=3 | |
| # Child Loop BB9_17 Depth 4 | |
| # Child Loop BB9_18 Depth 5 | |
| sd t6, 208(sp) | |
| mv s11, s5 | |
| mv a2, t0 | |
| mv a1, t1 | |
| mv a3, s2 | |
| mv a0, s4 | |
| mv t2, t5 | |
| mv t3, a7 | |
| mv t4, s6 | |
| mv s1, zero | |
| .LBB9_17: # %for_begin37.preheader | |
| # Parent Loop BB9_14 Depth=1 | |
| # Parent Loop BB9_15 Depth=2 | |
| # Parent Loop BB9_16 Depth=3 | |
| # => This Loop Header: Depth=4 | |
| # Child Loop BB9_18 Depth 5 | |
| mv s10, t6 | |
| mv a6, zero | |
| .LBB9_18: # %for_begin40.preheader | |
| # Parent Loop BB9_14 Depth=1 | |
| # Parent Loop BB9_15 Depth=2 | |
| # Parent Loop BB9_16 Depth=3 | |
| # Parent Loop BB9_17 Depth=4 | |
| # => This Inner Loop Header: Depth=5 | |
| add s3, s11, a6 | |
| flw ft0, 0(s3) | |
| fsw ft0, -16(s10) | |
| add s0, a2, a6 | |
| flw ft0, 0(s0) | |
| fsw ft0, -12(s10) | |
| add s0, a1, a6 | |
| flw ft0, 0(s0) | |
| fsw ft0, -8(s10) | |
| add s0, a3, a6 | |
| flw ft0, 0(s0) | |
| fsw ft0, -4(s10) | |
| add s0, a0, a6 | |
| flw ft0, 0(s0) | |
| fsw ft0, 0(s10) | |
| add s0, t2, a6 | |
| flw ft0, 0(s0) | |
| fsw ft0, 4(s10) | |
| add s0, t3, a6 | |
| flw ft0, 0(s0) | |
| fsw ft0, 8(s10) | |
| add s0, t4, a6 | |
| flw ft0, 0(s0) | |
| fsw ft0, 12(s10) | |
| addi s10, s10, 32 | |
| addi a6, a6, 100 | |
| bne a6, a4, .LBB9_18 | |
| # %bb.19: # %for_end39 | |
| # in Loop: Header=BB9_17 Depth=4 | |
| addi t6, t6, 256 | |
| addi s11, s11, 4 | |
| addi a2, a2, 4 | |
| addi a1, a1, 4 | |
| addi a3, a3, 4 | |
| addi a0, a0, 4 | |
| addi t2, t2, 4 | |
| addi t3, t3, 4 | |
| addi t4, t4, 4 | |
| addi s1, s1, 1 | |
| bne s1, a5, .LBB9_17 | |
| # %bb.20: # %for_end36 | |
| # in Loop: Header=BB9_16 Depth=3 | |
| ld t6, 208(sp) | |
| addi t6, t6, 1280 | |
| addi s5, s5, 20 | |
| addi t0, t0, 20 | |
| addi t1, t1, 20 | |
| addi s2, s2, 20 | |
| addi s4, s4, 20 | |
| addi t5, t5, 20 | |
| addi a7, a7, 20 | |
| addi s6, s6, 20 | |
| addi s7, s7, 1 | |
| bne s7, a5, .LBB9_16 | |
| # %bb.21: # %for_end33 | |
| # in Loop: Header=BB9_15 Depth=2 | |
| ld a0, 120(sp) | |
| ld t6, 200(sp) | |
| add t6, t6, a0 | |
| ld s5, 192(sp) | |
| addi s5, s5, 800 | |
| ld t0, 184(sp) | |
| addi t0, t0, 800 | |
| ld t1, 176(sp) | |
| addi t1, t1, 800 | |
| ld s2, 168(sp) | |
| addi s2, s2, 800 | |
| ld s4, 160(sp) | |
| addi s4, s4, 800 | |
| ld t5, 152(sp) | |
| addi t5, t5, 800 | |
| ld a7, 144(sp) | |
| addi a7, a7, 800 | |
| ld s6, 136(sp) | |
| addi s6, s6, 800 | |
| ld a2, 128(sp) | |
| addi a2, a2, 1 | |
| addi a0, zero, 4 | |
| bne a2, a0, .LBB9_15 | |
| # %bb.22: # %for_end30 | |
| # in Loop: Header=BB9_14 Depth=1 | |
| ld t6, 40(sp) | |
| ld a0, 16(sp) | |
| add t6, t6, a0 | |
| ld s11, 112(sp) | |
| add s11, s11, a0 | |
| ld t0, 104(sp) | |
| add t0, t0, a0 | |
| ld t1, 96(sp) | |
| add t1, t1, a0 | |
| ld s2, 88(sp) | |
| add s2, s2, a0 | |
| ld s4, 80(sp) | |
| add s4, s4, a0 | |
| ld t5, 72(sp) | |
| add t5, t5, a0 | |
| ld s1, 64(sp) | |
| add s1, s1, a0 | |
| ld s6, 48(sp) | |
| add s6, s6, a0 | |
| ld a2, 8(sp) | |
| addi a2, a2, 1 | |
| addi a0, zero, 8 | |
| bne a2, a0, .LBB9_14 | |
| # %bb.23: # %for_begin43.preheader | |
| lui a0, 131072 | |
| addiw a0, a0, -1 | |
| sd a0, 48(sp) | |
| addi t6, zero, 14 | |
| addi a3, zero, 112 | |
| addi s2, zero, 18 | |
| lui a5, 1 | |
| mv a2, zero | |
| .LBB9_24: # %for_begin46.preheader | |
| # =>This Loop Header: Depth=1 | |
| # Child Loop BB9_25 Depth 2 | |
| # Child Loop BB9_27 Depth 2 | |
| # Child Loop BB9_28 Depth 3 | |
| # Child Loop BB9_29 Depth 4 | |
| srli a0, a2, 3 | |
| ld a1, 48(sp) | |
| and t4, a0, a1 | |
| sd a2, 16(sp) | |
| andi s11, a2, 7 | |
| mul s4, t4, t6 | |
| mv a1, zero | |
| .LBB9_25: # %for_begin49.preheader | |
| # Parent Loop BB9_24 Depth=1 | |
| # => This Inner Loop Header: Depth=2 | |
| add a2, a1, s4 | |
| mul a2, a2, a3 | |
| or a2, a2, s11 | |
| sext.w a4, a2 | |
| slli a4, a4, 2 | |
| add a4, s9, a4 | |
| sw zero, 0(a4) | |
| ori a4, a2, 8 | |
| sext.w a4, a4 | |
| slli a4, a4, 2 | |
| add a4, s9, a4 | |
| sw zero, 0(a4) | |
| addiw a4, a2, 16 | |
| slli a4, a4, 2 | |
| add a4, s9, a4 | |
| sw zero, 0(a4) | |
| addiw a4, a2, 24 | |
| slli a4, a4, 2 | |
| add a4, s9, a4 | |
| sw zero, 0(a4) | |
| addiw a4, a2, 32 | |
| slli a4, a4, 2 | |
| add a4, s9, a4 | |
| sw zero, 0(a4) | |
| addiw a4, a2, 40 | |
| slli a4, a4, 2 | |
| add a4, s9, a4 | |
| sw zero, 0(a4) | |
| addiw a4, a2, 64 | |
| slli t5, a4, 2 | |
| addiw s1, a2, 72 | |
| slli s3, s1, 2 | |
| addiw s0, a2, 80 | |
| slli s0, s0, 2 | |
| addiw a0, a2, 88 | |
| slli a0, a0, 2 | |
| addiw a4, a2, 96 | |
| slli a4, a4, 2 | |
| addiw s1, a2, 104 | |
| slli s1, s1, 2 | |
| add s5, s9, s1 | |
| add s6, s9, a4 | |
| add s7, s9, a0 | |
| add s0, s9, s0 | |
| add s1, s9, s3 | |
| add a4, s9, t5 | |
| addiw a0, a2, 56 | |
| slli a0, a0, 2 | |
| add a0, s9, a0 | |
| addiw a2, a2, 48 | |
| slli a2, a2, 2 | |
| add a2, s9, a2 | |
| sw zero, 0(a2) | |
| sw zero, 0(a0) | |
| sw zero, 0(a4) | |
| sw zero, 0(s1) | |
| sw zero, 0(s0) | |
| sw zero, 0(s7) | |
| sw zero, 0(s6) | |
| sw zero, 0(s5) | |
| addi a0, a1, 1 | |
| addiw a2, a1, 1 | |
| mv a1, a0 | |
| bltu a2, t6, .LBB9_25 | |
| # %bb.26: # %for_begin52.preheader | |
| # in Loop: Header=BB9_24 Depth=1 | |
| slli a0, t4, 2 | |
| sd a0, 40(sp) | |
| mv a3, zero | |
| .LBB9_27: # %for_begin55.preheader | |
| # Parent Loop BB9_24 Depth=1 | |
| # => This Loop Header: Depth=2 | |
| # Child Loop BB9_28 Depth 3 | |
| # Child Loop BB9_29 Depth 4 | |
| srli a0, a3, 3 | |
| ld a1, 48(sp) | |
| and a0, a0, a1 | |
| ld a1, 40(sp) | |
| add a1, a0, a1 | |
| addi a2, zero, 200 | |
| mul a1, a1, a2 | |
| sd a3, 64(sp) | |
| andi s5, a3, 7 | |
| or a1, a1, s5 | |
| slli a1, a1, 3 | |
| or a1, a1, s11 | |
| mul s6, a0, s2 | |
| addiw a0, a1, 192 | |
| slli a0, a0, 2 | |
| sd a0, 208(sp) | |
| addiw a2, a1, 128 | |
| slli a0, a2, 2 | |
| sd a0, 184(sp) | |
| addiw a4, a1, 64 | |
| slli a0, a4, 2 | |
| sd a0, 176(sp) | |
| sext.w s0, a1 | |
| slli a3, s0, 2 | |
| addiw s1, a1, 1536 | |
| slli s10, s1, 2 | |
| addiw a0, a1, 1472 | |
| slli s7, a0, 2 | |
| addiw a2, a1, 640 | |
| slli a0, a2, 2 | |
| sd a0, 200(sp) | |
| addiw a2, a1, 576 | |
| slli a0, a2, 2 | |
| sd a0, 168(sp) | |
| addiw a4, a1, 512 | |
| slli a0, a4, 2 | |
| sd a0, 160(sp) | |
| addiw a7, a1, 448 | |
| slli a0, a7, 2 | |
| sd a0, 144(sp) | |
| addiw t0, a1, 384 | |
| slli a0, t0, 2 | |
| sd a0, 136(sp) | |
| addiw a6, a1, 320 | |
| slli s1, a6, 2 | |
| addiw t1, a1, 256 | |
| slli t1, t1, 2 | |
| addiw t2, a1, 1408 | |
| addiw t3, a1, 1280 | |
| addiw t4, a1, 704 | |
| addiw t5, a1, 768 | |
| addiw s3, a1, 832 | |
| addiw a6, a1, 896 | |
| addiw a4, a1, 960 | |
| addiw a2, a1, 1024 | |
| addiw a0, a1, 1088 | |
| addiw t0, a1, 1152 | |
| addiw a7, a1, 1216 | |
| addiw a1, a1, 1344 | |
| slli s0, a0, 2 | |
| slli a2, a2, 2 | |
| slli a4, a4, 2 | |
| slli a6, a6, 2 | |
| slli s3, s3, 2 | |
| slli t5, t5, 2 | |
| slli t4, t4, 2 | |
| slli t3, t3, 2 | |
| slli a7, a7, 2 | |
| slli t0, t0, 2 | |
| ld a0, 56(sp) | |
| add s7, a0, s7 | |
| add s10, a0, s10 | |
| slli t2, t2, 2 | |
| slli a1, a1, 2 | |
| add a3, a0, a3 | |
| sd a3, 192(sp) | |
| ld a3, 176(sp) | |
| add a3, a0, a3 | |
| sd a3, 176(sp) | |
| ld a3, 184(sp) | |
| add a3, a0, a3 | |
| sd a3, 184(sp) | |
| ld a3, 208(sp) | |
| add a3, a0, a3 | |
| sd a3, 208(sp) | |
| add a3, a0, t1 | |
| sd a3, 152(sp) | |
| add a3, a0, s1 | |
| sd a3, 112(sp) | |
| ld a3, 136(sp) | |
| add a3, a0, a3 | |
| sd a3, 120(sp) | |
| ld a3, 144(sp) | |
| add a3, a0, a3 | |
| sd a3, 144(sp) | |
| ld a3, 160(sp) | |
| add s1, a0, a3 | |
| ld a3, 168(sp) | |
| add t1, a0, a3 | |
| ld a3, 200(sp) | |
| add a3, a0, a3 | |
| add t4, a0, t4 | |
| add t5, a0, t5 | |
| add s3, a0, s3 | |
| add a6, a0, a6 | |
| add a4, a0, a4 | |
| add a2, a0, a2 | |
| add s0, a0, s0 | |
| add t0, a0, t0 | |
| add a7, a0, a7 | |
| add t3, a0, t3 | |
| add a1, a0, a1 | |
| add t2, a0, t2 | |
| flw ft0, 0(s10) | |
| flw ft1, 0(s7) | |
| flw ft2, 0(t2) | |
| flw ft3, 0(a1) | |
| flw ft4, 0(t3) | |
| flw ft5, 0(a7) | |
| flw fs3, 0(t0) | |
| flw fs4, 0(s0) | |
| flw fa0, 0(a2) | |
| flw fa1, 0(a4) | |
| flw fa2, 0(a6) | |
| flw fa3, 0(s3) | |
| flw fa4, 0(t5) | |
| flw fa5, 0(t4) | |
| flw fa6, 0(a3) | |
| flw fa7, 0(t1) | |
| flw ft8, 0(s1) | |
| ld a0, 144(sp) | |
| flw ft9, 0(a0) | |
| fsw ft9, 128(sp) | |
| ld a0, 120(sp) | |
| flw ft9, 0(a0) | |
| fsw ft9, 120(sp) | |
| ld a0, 112(sp) | |
| flw ft9, 0(a0) | |
| fsw ft9, 112(sp) | |
| ld a0, 152(sp) | |
| flw ft9, 0(a0) | |
| fsw ft9, 104(sp) | |
| ld a0, 208(sp) | |
| flw ft9, 0(a0) | |
| fsw ft9, 96(sp) | |
| ld a0, 184(sp) | |
| flw ft9, 0(a0) | |
| fsw ft9, 88(sp) | |
| ld a0, 176(sp) | |
| flw ft9, 0(a0) | |
| ld a0, 192(sp) | |
| flw fs0, 0(a0) | |
| mv s7, zero | |
| fsw ft0, 136(sp) | |
| fsw ft1, 80(sp) | |
| fsw ft2, 72(sp) | |
| .LBB9_28: # %for_begin58.preheader | |
| # Parent Loop BB9_24 Depth=1 | |
| # Parent Loop BB9_27 Depth=2 | |
| # => This Loop Header: Depth=3 | |
| # Child Loop BB9_29 Depth 4 | |
| add a0, s7, s6 | |
| slli a0, a0, 3 | |
| or a0, a0, s5 | |
| mul a1, a0, s2 | |
| add a0, s7, s4 | |
| addi a2, zero, 14 | |
| mul a0, a0, a2 | |
| slli a1, a1, 32 | |
| srli a1, a1, 32 | |
| slli a1, a1, 2 | |
| mv a4, zero | |
| .LBB9_29: # %for_body59 | |
| # Parent Loop BB9_24 Depth=1 | |
| # Parent Loop BB9_27 Depth=2 | |
| # Parent Loop BB9_28 Depth=3 | |
| # => This Inner Loop Header: Depth=4 | |
| add s0, s8, a1 | |
| flw fs5, 0(s0) | |
| fmul.s fs5, fs5, fs0 | |
| add s1, a4, a0 | |
| slli s1, s1, 3 | |
| or s1, s1, s11 | |
| sext.w s1, s1 | |
| slli s1, s1, 2 | |
| add s1, s9, s1 | |
| flw fs6, 0(s1) | |
| fadd.s fs5, fs5, fs6 | |
| flw fs6, 4(s0) | |
| fmul.s fs6, fs6, ft9 | |
| fadd.s ft11, fs6, fs5 | |
| fsw ft11, 176(sp) | |
| addiw a3, a5, -1776 | |
| add a3, s0, a3 | |
| flw fs5, 0(a3) | |
| fmul.s ft0, fs5, ft0 | |
| fsw ft0, 208(sp) | |
| addiw a3, a5, -1780 | |
| add a3, s0, a3 | |
| flw fs6, 0(a3) | |
| fmul.s ft0, fs6, ft1 | |
| fsw ft0, 200(sp) | |
| addiw a3, a5, -1784 | |
| add a3, s0, a3 | |
| flw fs7, 0(a3) | |
| fmul.s ft0, fs7, ft2 | |
| fsw ft0, 192(sp) | |
| addiw a3, a5, -1788 | |
| add a3, s0, a3 | |
| flw fs9, 0(a3) | |
| fmul.s ft0, fs9, ft3 | |
| fsw ft0, 184(sp) | |
| addiw a3, a5, -1792 | |
| add a3, s0, a3 | |
| flw fs10, 0(a3) | |
| fmul.s ft0, fs10, ft4 | |
| fsw ft0, 168(sp) | |
| flw fs11, 1744(s0) | |
| fmul.s ft0, fs11, ft5 | |
| fsw ft0, 160(sp) | |
| flw ft0, 1740(s0) | |
| fmul.s ft0, ft0, fs3 | |
| fsw ft0, 152(sp) | |
| flw ft1, 1736(s0) | |
| fmul.s ft0, ft1, fs4 | |
| fsw ft0, 144(sp) | |
| flw ft2, 1732(s0) | |
| fmul.s fs10, ft2, fa0 | |
| fmv.s fs9, ft3 | |
| flw ft3, 1728(s0) | |
| fmul.s fs8, ft3, fa1 | |
| fmv.s fs7, ft4 | |
| flw ft4, 1168(s0) | |
| fmul.s fs6, ft4, fa2 | |
| fmv.s fs5, ft5 | |
| flw ft5, 1164(s0) | |
| fmul.s fs2, ft5, fa3 | |
| flw ft6, 1160(s0) | |
| fmul.s fs1, ft6, fa4 | |
| flw ft7, 1156(s0) | |
| fmul.s ft11, ft7, fa5 | |
| fmv.s ft10, ft9 | |
| fmv.s ft9, fa0 | |
| flw fa0, 1152(s0) | |
| fmul.s fa0, fa0, fa6 | |
| fmv.s ft7, fa1 | |
| flw fa1, 592(s0) | |
| fmul.s fa1, fa1, fa7 | |
| fmv.s ft6, fa2 | |
| flw fa2, 588(s0) | |
| fmul.s fa2, fa2, ft8 | |
| fmv.s ft5, fa3 | |
| flw fa3, 584(s0) | |
| flw ft0, 128(sp) | |
| fmul.s fa3, fa3, ft0 | |
| fmv.s ft4, fa4 | |
| flw fa4, 580(s0) | |
| flw ft0, 120(sp) | |
| fmul.s fa4, fa4, ft0 | |
| fmv.s ft3, fa5 | |
| flw fa5, 576(s0) | |
| flw ft0, 112(sp) | |
| fmul.s fa5, fa5, ft0 | |
| fmv.s ft2, fa6 | |
| flw fa6, 16(s0) | |
| flw ft0, 104(sp) | |
| fmul.s fa6, fa6, ft0 | |
| fmv.s ft1, fa7 | |
| flw fa7, 12(s0) | |
| flw ft0, 96(sp) | |
| fmul.s fa7, fa7, ft0 | |
| fmv.s ft0, ft8 | |
| flw ft8, 8(s0) | |
| flw fs11, 88(sp) | |
| fmul.s ft8, ft8, fs11 | |
| flw fs11, 176(sp) | |
| fadd.s ft8, ft8, fs11 | |
| fadd.s fa7, fa7, ft8 | |
| fmv.s ft8, ft0 | |
| fadd.s fa6, fa6, fa7 | |
| fmv.s fa7, ft1 | |
| fadd.s fa5, fa5, fa6 | |
| fmv.s fa6, ft2 | |
| fadd.s fa4, fa4, fa5 | |
| fmv.s fa5, ft3 | |
| fadd.s fa3, fa3, fa4 | |
| fmv.s fa4, ft4 | |
| fadd.s fa2, fa2, fa3 | |
| fmv.s fa3, ft5 | |
| fadd.s fa1, fa1, fa2 | |
| fmv.s fa2, ft6 | |
| fadd.s fa0, fa0, fa1 | |
| fmv.s fa1, ft7 | |
| fadd.s ft7, ft11, fa0 | |
| fmv.s fa0, ft9 | |
| fmv.s ft9, ft10 | |
| fadd.s ft6, fs1, ft7 | |
| fadd.s ft5, fs2, ft6 | |
| fadd.s ft4, fs6, ft5 | |
| fmv.s ft5, fs5 | |
| fadd.s ft3, fs8, ft4 | |
| fmv.s ft4, fs7 | |
| fadd.s ft2, fs10, ft3 | |
| fmv.s ft3, fs9 | |
| flw ft0, 144(sp) | |
| fadd.s ft1, ft0, ft2 | |
| flw ft2, 72(sp) | |
| flw ft0, 152(sp) | |
| fadd.s ft0, ft0, ft1 | |
| flw ft1, 80(sp) | |
| flw ft11, 160(sp) | |
| fadd.s ft0, ft11, ft0 | |
| flw ft11, 168(sp) | |
| fadd.s ft0, ft11, ft0 | |
| flw ft11, 184(sp) | |
| fadd.s ft0, ft11, ft0 | |
| flw ft11, 192(sp) | |
| fadd.s ft0, ft11, ft0 | |
| flw ft11, 200(sp) | |
| fadd.s ft0, ft11, ft0 | |
| flw ft11, 208(sp) | |
| fadd.s ft0, ft11, ft0 | |
| fsw ft0, 0(s1) | |
| flw ft0, 136(sp) | |
| addi a1, a1, 4 | |
| addi a4, a4, 1 | |
| addi a2, a2, -1 | |
| bnez a2, .LBB9_29 | |
| # %bb.30: # %for_end60 | |
| # in Loop: Header=BB9_28 Depth=3 | |
| addi a0, s7, 1 | |
| addiw a1, s7, 1 | |
| mv s7, a0 | |
| bltu a1, t6, .LBB9_28 | |
| # %bb.31: # %for_end57 | |
| # in Loop: Header=BB9_27 Depth=2 | |
| ld a1, 64(sp) | |
| addi a0, a1, 1 | |
| addiw a1, a1, 1 | |
| mv a3, a0 | |
| addi a0, zero, 32 | |
| bltu a1, a0, .LBB9_27 | |
| # %bb.32: # %for_end54 | |
| # in Loop: Header=BB9_24 Depth=1 | |
| ld a1, 16(sp) | |
| addi a0, a1, 1 | |
| addiw a1, a1, 1 | |
| mv a2, a0 | |
| addi a3, zero, 112 | |
| addi a0, zero, 64 | |
| bltu a1, a0, .LBB9_24 | |
| # %bb.33: # %for_begin64.preheader.preheader | |
| ld a0, 56(sp) | |
| addi t5, a0, 28 | |
| addi a6, zero, 14 | |
| addi t0, zero, 112 | |
| addi t1, zero, 784 | |
| addi a7, zero, 64 | |
| mv t2, zero | |
| .LBB9_34: # %for_begin64.preheader | |
| # =>This Loop Header: Depth=1 | |
| # Child Loop BB9_35 Depth 2 | |
| srliw a1, t2, 3 | |
| mul t3, a1, a6 | |
| andi t4, t2, 7 | |
| mv a2, zero | |
| mv a3, zero | |
| .LBB9_35: # %for_begin67.preheader | |
| # Parent Loop BB9_34 Depth=1 | |
| # => This Inner Loop Header: Depth=2 | |
| add s1, a3, t3 | |
| mul s1, s1, t0 | |
| or s0, s1, t4 | |
| add s1, t5, a2 | |
| sext.w a5, s0 | |
| slli a5, a5, 2 | |
| add a5, s9, a5 | |
| flw ft0, 0(a5) | |
| fsw ft0, -28(s1) | |
| ori a5, s0, 8 | |
| sext.w a5, a5 | |
| slli a5, a5, 2 | |
| add a5, s9, a5 | |
| flw ft0, 0(a5) | |
| fsw ft0, -24(s1) | |
| addiw a5, s0, 16 | |
| slli a5, a5, 2 | |
| add a5, s9, a5 | |
| flw ft0, 0(a5) | |
| fsw ft0, -20(s1) | |
| addiw a5, s0, 48 | |
| slli t6, a5, 2 | |
| addiw a1, s0, 56 | |
| slli s2, a1, 2 | |
| addiw a4, s0, 64 | |
| slli s3, a4, 2 | |
| addiw a0, s0, 72 | |
| slli s4, a0, 2 | |
| addiw a5, s0, 80 | |
| slli s5, a5, 2 | |
| addiw a1, s0, 88 | |
| slli a1, a1, 2 | |
| addiw a4, s0, 96 | |
| slli a4, a4, 2 | |
| addiw a0, s0, 104 | |
| slli a0, a0, 2 | |
| addiw a5, s0, 32 | |
| slli s6, a5, 2 | |
| addiw a5, s0, 40 | |
| slli a5, a5, 2 | |
| add s7, s9, a0 | |
| add s10, s9, a4 | |
| add s11, s9, a1 | |
| add s5, s9, s5 | |
| add s4, s9, s4 | |
| add s3, s9, s3 | |
| add a0, s9, s2 | |
| add a4, s9, t6 | |
| add a5, s9, a5 | |
| add a1, s9, s6 | |
| addiw s0, s0, 24 | |
| slli s0, s0, 2 | |
| add s0, s9, s0 | |
| flw ft0, 0(s0) | |
| fsw ft0, -16(s1) | |
| flw ft0, 0(a1) | |
| fsw ft0, -12(s1) | |
| flw ft0, 0(a5) | |
| fsw ft0, -8(s1) | |
| flw ft0, 0(a4) | |
| fsw ft0, -4(s1) | |
| flw ft0, 0(a0) | |
| fsw ft0, 0(s1) | |
| flw ft0, 0(s3) | |
| fsw ft0, 4(s1) | |
| flw ft0, 0(s4) | |
| fsw ft0, 8(s1) | |
| flw ft0, 0(s5) | |
| fsw ft0, 12(s1) | |
| flw ft0, 0(s11) | |
| fsw ft0, 16(s1) | |
| flw ft0, 0(s10) | |
| fsw ft0, 20(s1) | |
| flw ft0, 0(s7) | |
| fsw ft0, 24(s1) | |
| addi a3, a3, 1 | |
| addi a2, a2, 56 | |
| bne a2, t1, .LBB9_35 | |
| # %bb.36: # %for_end66 | |
| # in Loop: Header=BB9_34 Depth=1 | |
| addi t5, t5, 784 | |
| addi t2, t2, 1 | |
| bne t2, a7, .LBB9_34 | |
| # %bb.37: # %for_begin70.preheader | |
| ld a0, 24(sp) | |
| addi a0, a0, 28 | |
| ld a1, 56(sp) | |
| addi a1, a1, 28 | |
| addi a2, zero, 784 | |
| addi a3, zero, 64 | |
| mv a4, zero | |
| .LBB9_38: # %for_begin73.preheader | |
| # =>This Loop Header: Depth=1 | |
| # Child Loop BB9_39 Depth 2 | |
| slli a5, a4, 2 | |
| ld s1, 32(sp) | |
| add a5, s1, a5 | |
| flw ft0, 0(a5) | |
| mv a5, zero | |
| .LBB9_39: # %for_begin76.preheader | |
| # Parent Loop BB9_38 Depth=1 | |
| # => This Inner Loop Header: Depth=2 | |
| add s1, a0, a5 | |
| add s0, a1, a5 | |
| flw ft1, -28(s0) | |
| fadd.s ft1, ft0, ft1 | |
| fsw ft1, -28(s1) | |
| flw ft1, -24(s0) | |
| fadd.s ft1, ft0, ft1 | |
| fsw ft1, -24(s1) | |
| flw ft1, -20(s0) | |
| fadd.s ft1, ft0, ft1 | |
| fsw ft1, -20(s1) | |
| flw ft1, -16(s0) | |
| fadd.s ft1, ft0, ft1 | |
| fsw ft1, -16(s1) | |
| flw ft1, -12(s0) | |
| fadd.s ft1, ft0, ft1 | |
| fsw ft1, -12(s1) | |
| flw ft1, -8(s0) | |
| fadd.s ft1, ft0, ft1 | |
| fsw ft1, -8(s1) | |
| flw ft1, -4(s0) | |
| fadd.s ft1, ft0, ft1 | |
| fsw ft1, -4(s1) | |
| flw ft1, 0(s0) | |
| fadd.s ft1, ft0, ft1 | |
| fsw ft1, 0(s1) | |
| flw ft1, 4(s0) | |
| fadd.s ft1, ft0, ft1 | |
| fsw ft1, 4(s1) | |
| flw ft1, 8(s0) | |
| fadd.s ft1, ft0, ft1 | |
| fsw ft1, 8(s1) | |
| flw ft1, 12(s0) | |
| fadd.s ft1, ft0, ft1 | |
| fsw ft1, 12(s1) | |
| flw ft1, 16(s0) | |
| fadd.s ft1, ft0, ft1 | |
| fsw ft1, 16(s1) | |
| flw ft1, 20(s0) | |
| fadd.s ft1, ft0, ft1 | |
| fsw ft1, 20(s1) | |
| flw ft1, 24(s0) | |
| fadd.s ft1, ft0, ft1 | |
| fsw ft1, 24(s1) | |
| addi a5, a5, 56 | |
| bne a5, a2, .LBB9_39 | |
| # %bb.40: # %for_end75 | |
| # in Loop: Header=BB9_38 Depth=1 | |
| addi a0, a0, 784 | |
| addi a1, a1, 784 | |
| addi a4, a4, 1 | |
| bne a4, a3, .LBB9_38 | |
| # %bb.41: # %for_end72 | |
| mv a0, s9 | |
| call _ZdaPv | |
| mv a0, s8 | |
| call _ZdaPv | |
| ld a0, 56(sp) | |
| call _ZdaPv | |
| ld s11, 216(sp) | |
| ld s10, 224(sp) | |
| ld s9, 232(sp) | |
| ld s8, 240(sp) | |
| ld s7, 248(sp) | |
| ld s6, 256(sp) | |
| ld s5, 264(sp) | |
| ld s4, 272(sp) | |
| ld s3, 280(sp) | |
| ld s2, 288(sp) | |
| ld s1, 296(sp) | |
| ld s0, 304(sp) | |
| ld ra, 312(sp) | |
| .cfi_restore ra | |
| .cfi_restore s0 | |
| .cfi_restore s1 | |
| .cfi_restore s2 | |
| .cfi_restore s3 | |
| .cfi_restore s4 | |
| .cfi_restore s5 | |
| .cfi_restore s6 | |
| .cfi_restore s7 | |
| .cfi_restore s8 | |
| .cfi_restore s9 | |
| .cfi_restore s10 | |
| .cfi_restore s11 | |
| addi sp, sp, 320 | |
| .cfi_def_cfa_offset 0 | |
| ret | |
| .Lfunc_end9: | |
| .size fuse_conv2d_1_compute_, .Lfunc_end9-fuse_conv2d_1_compute_ | |
| .cfi_endproc | |
| # -- End function | |
| .globl fuse_relu_1 # -- Begin function fuse_relu_1: checks its two packed arguments, then calls fuse_relu_1_compute_ | |
| .p2align 2 | |
| .type fuse_relu_1,@function | |
| fuse_relu_1: # @fuse_relu_1 -- in: a0 = array of 8-byte argument handles, a1 = array of 32-bit type codes, a2 = argument count (low 32 bits used); out: a0 = 0 on success, 0xFFFFFFFF after any failed check | |
| .cfi_startproc | |
| # %bb.0: # %entry -- 32-byte frame saving ra/s0/s1; require argument count == 2. Offsets named "@N" below are byte offsets into an argument handle (presumably a DLTensor: data @0, device @8/@12, ndim @16, dtype @20-23, shape @24, strides @32, byte offset @40 -- TODO confirm) | |
| addi sp, sp, -32 | |
| .cfi_def_cfa_offset 32 | |
| sd ra, 24(sp) | |
| sd s0, 16(sp) | |
| sd s1, 8(sp) | |
| .cfi_offset ra, -8 | |
| .cfi_offset s0, -16 | |
| .cfi_offset s1, -24 | |
| slli a2, a2, 32 | |
| srli a2, a2, 32 | |
| addi a3, zero, 2 | |
| bne a2, a3, .LBB10_30 | |
| # %bb.1: # %assert_end -- a3/a4 = type codes of arg0/arg1, a5/a2 = arg0/arg1 handles; from arg0: t0 = field @24, a1 = field @0, a0 = field @32 (the next check is skipped when it is null) | |
| lwu a4, 4(a1) | |
| ld a2, 8(a0) | |
| lwu a3, 0(a1) | |
| ld a5, 0(a0) | |
| ld t0, 24(a5) | |
| ld a1, 0(a5) | |
| ld a0, 32(a5) | |
| beqz a0, .LBB10_3 | |
| # %bb.2: # %if_then -- arg0 field @32 is non-null: the first 32-bit word it points to must be 1; s0 = 1 is reused by the .LBB10_43 failure tail | |
| lw a0, 0(a0) | |
| addi s0, zero, 1 | |
| bne a0, s0, .LBB10_31 | |
| .LBB10_3: # %if_end -- from arg1: a7 = field @24, a0 = field @0 (later passed to compute as a0), s0 = field @32; from arg0: a6 = 32-bit field @12, t1 = 32-bit field @8 | |
| ld a7, 24(a2) | |
| ld a0, 0(a2) | |
| lwu a6, 12(a5) | |
| lwu t1, 8(a5) | |
| ld s0, 32(a2) | |
| beqz s0, .LBB10_5 | |
| # %bb.4: # %if_then3 -- arg1 field @32 is non-null: the first 32-bit word it points to must be 1; s1 = 1 is reused by .LBB10_32 | |
| lw s0, 0(s0) | |
| addi s1, zero, 1 | |
| bne s0, s1, .LBB10_32 | |
| .LBB10_5: # %if_end4 -- reject arg0 type codes above 13 (unsigned compare) | |
| addi s1, zero, 13 | |
| bltu s1, a3, .LBB10_25 | |
| # %bb.6: # %if_end4 -- accept the code only if bit (1 << code) is set in the mask 0x2098 (lui 2 + 152), i.e. code is 3, 4, 7 or 13 | |
| addi s1, zero, 1 | |
| sll a3, s1, a3 | |
| lui s1, 2 | |
| addiw s1, s1, 152 | |
| and a3, a3, s1 | |
| beqz a3, .LBB10_25 | |
| # %bb.7: # %assert_end8 -- same range test for the arg1 type code | |
| addi a3, zero, 13 | |
| bltu a3, a4, .LBB10_26 | |
| # %bb.8: # %assert_end8 -- same 0x2098 mask test for arg1; leaves a3 = 1 for the next compare | |
| addi a3, zero, 1 | |
| sll a4, a3, a4 | |
| lui s1, 2 | |
| addiw s1, s1, 152 | |
| and a4, a4, s1 | |
| beqz a4, .LBB10_26 | |
| # %bb.9: # %assert_end10 -- arg0 32-bit field @8 must equal 1 (a3 still holds 1) | |
| bne t1, a3, .LBB10_33 | |
| # %bb.10: # %assert_end12 -- arg0 32-bit field @16 must be 1; s0 = 1 is reused by the .LBB10_43 failure tail | |
| lw a3, 16(a5) | |
| addi s0, zero, 1 | |
| bne a3, s0, .LBB10_34 | |
| # %bb.11: # %assert_end14 -- arg0 halfword @22 must be 1 | |
| lhu a3, 22(a5) | |
| bne a3, s0, .LBB10_35 | |
| # %bb.12: # %assert_end14 -- arg0 byte @21 must be 32 | |
| lbu a3, 21(a5) | |
| addi a4, zero, 32 | |
| bne a3, a4, .LBB10_35 | |
| # %bb.13: # %assert_end14 -- arg0 byte @20 must be 2 | |
| lbu a3, 20(a5) | |
| addi a4, zero, 2 | |
| bne a3, a4, .LBB10_35 | |
| # %bb.14: # %assert_end16 -- the first 32-bit word behind arg0's @24 pointer must be 12544 (lui 3 + 256) | |
| lui a3, 3 | |
| addiw a3, a3, 256 | |
| lw a4, 0(t0) | |
| bne a4, a3, .LBB10_36 | |
| # %bb.15: # %assert_end18 -- arg0 64-bit field @40 must be 0 | |
| ld a3, 40(a5) | |
| bnez a3, .LBB10_37 | |
| # %bb.16: # %assert_end20 -- the same checks repeat for arg1: 32-bit field @16 must be 1 | |
| lw a3, 16(a2) | |
| addi s0, zero, 1 | |
| bne a3, s0, .LBB10_38 | |
| # %bb.17: # %assert_end22 -- arg1 halfword @22 must be 1 | |
| lhu a3, 22(a2) | |
| bne a3, s0, .LBB10_39 | |
| # %bb.18: # %assert_end22 -- arg1 byte @21 must be 32 | |
| lbu a3, 21(a2) | |
| addi a4, zero, 32 | |
| bne a3, a4, .LBB10_39 | |
| # %bb.19: # %assert_end22 -- arg1 byte @20 must be 2 | |
| lbu a3, 20(a2) | |
| addi a4, zero, 2 | |
| bne a3, a4, .LBB10_39 | |
| # %bb.20: # %assert_end24 -- the first 32-bit word behind arg1's @24 pointer must be 12544 | |
| lui a3, 3 | |
| addiw a3, a3, 256 | |
| lw a4, 0(a7) | |
| bne a4, a3, .LBB10_40 | |
| # %bb.21: # %assert_end26 -- arg1 64-bit field @40 must be 0 | |
| ld a3, 40(a2) | |
| bnez a3, .LBB10_41 | |
| # %bb.22: # %assert_end28 -- arg1 32-bit field @8 must be 1 | |
| lw a3, 8(a2) | |
| addi s0, zero, 1 | |
| bne a3, s0, .LBB10_42 | |
| # %bb.23: # %assert_end30 -- arg1 32-bit field @12 must equal arg0's field @12 (a6, sign-extended for the compare) | |
| lw a2, 12(a2) | |
| sext.w a3, a6 | |
| bne a3, a2, .LBB10_44 | |
| # %bb.24: # %assert_end32 -- all checks passed: call compute with a0 = arg1 field @0 and a1 = arg0 field @0, then return 0 | |
| call fuse_relu_1_compute_ | |
| mv a0, zero | |
| j .LBB10_29 | |
| .LBB10_25: # %assert_fail7 -- arg0 type code rejected: a1 = function pointer loaded from __TVMAPISetLastError, a0 = address of .L.str.85 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.85) | |
| addi a0, a0, %lo(.L.str.85) | |
| j .LBB10_27 | |
| .LBB10_26: # %assert_fail9 -- arg1 type code rejected: message .L.str.86, falls through into the shared tail | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.86) | |
| addi a0, a0, %lo(.L.str.86) | |
| .LBB10_27: # %assert_fail -- shared tail: call the handler in a1 with the message in a0, then build 1 << 32 | |
| jalr a1 | |
| addi a0, zero, 1 | |
| slli a0, a0, 32 | |
| .LBB10_28: # %assert_fail1 -- (1 << 32) - 1 gives the failure return value 0x00000000FFFFFFFF; NOTE(review): this is -1 only when read as a 32-bit value -- confirm callers look at the low 32 bits | |
| addi a0, a0, -1 | |
| .LBB10_29: # %assert_fail1 -- common epilogue: restore s1/s0/ra, release the 32-byte frame, return a0 | |
| ld s1, 8(sp) | |
| ld s0, 16(sp) | |
| ld ra, 24(sp) | |
| .cfi_restore ra | |
| .cfi_restore s0 | |
| .cfi_restore s1 | |
| addi sp, sp, 32 | |
| .cfi_def_cfa_offset 0 | |
| ret | |
| .LBB10_30: # %assert_fail -- argument count != 2: message .L.str.84 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.84) | |
| addi a0, a0, %lo(.L.str.84) | |
| j .LBB10_27 | |
| .LBB10_31: # %assert_fail1 -- arg0 @32 check failed: message .L.str.52 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.52) | |
| addi a0, a0, %lo(.L.str.52) | |
| j .LBB10_43 | |
| .LBB10_32: # %assert_fail5 -- arg1 @32 check failed: message .L.str.53; the return value is seeded from s1 (= 1), which must survive the indirect call | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.53) | |
| addi a0, a0, %lo(.L.str.53) | |
| jalr a1 | |
| slli a0, s1, 32 | |
| j .LBB10_28 | |
| .LBB10_33: # %assert_fail11 -- arg0 field @8 != 1: message .L.str.5 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.5) | |
| addi a0, a0, %lo(.L.str.5) | |
| j .LBB10_27 | |
| .LBB10_34: # %assert_fail13 -- arg0 field @16 != 1: message .L.str.56 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.56) | |
| addi a0, a0, %lo(.L.str.56) | |
| j .LBB10_43 | |
| .LBB10_35: # %assert_fail15 -- arg0 bytes @20-23 mismatch: message .L.str.7 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.7) | |
| addi a0, a0, %lo(.L.str.7) | |
| j .LBB10_27 | |
| .LBB10_36: # %assert_fail17 -- first word behind arg0's @24 pointer != 12544: message .L.str.87 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.87) | |
| addi a0, a0, %lo(.L.str.87) | |
| j .LBB10_27 | |
| .LBB10_37: # %assert_fail19 -- arg0 field @40 != 0: message .L.str.10 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.10) | |
| addi a0, a0, %lo(.L.str.10) | |
| j .LBB10_27 | |
| .LBB10_38: # %assert_fail21 -- arg1 field @16 != 1: message .L.str.58 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.58) | |
| addi a0, a0, %lo(.L.str.58) | |
| j .LBB10_43 | |
| .LBB10_39: # %assert_fail23 -- arg1 bytes @20-23 mismatch: message .L.str.12 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.12) | |
| addi a0, a0, %lo(.L.str.12) | |
| j .LBB10_27 | |
| .LBB10_40: # %assert_fail25 -- first word behind arg1's @24 pointer != 12544: message .L.str.88 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.88) | |
| addi a0, a0, %lo(.L.str.88) | |
| j .LBB10_27 | |
| .LBB10_41: # %assert_fail27 -- arg1 field @40 != 0: message .L.str.17 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.17) | |
| addi a0, a0, %lo(.L.str.17) | |
| j .LBB10_27 | |
| .LBB10_42: # %assert_fail29 -- arg1 field @8 != 1: message .L.str.18, falls through into .LBB10_43 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.18) | |
| addi a0, a0, %lo(.L.str.18) | |
| .LBB10_43: # %assert_fail1 -- shared tail for the checks that left 1 in s0: call the handler, then seed the return value with s0 << 32 (s0 must survive the indirect call) | |
| jalr a1 | |
| slli a0, s0, 32 | |
| j .LBB10_28 | |
| .LBB10_44: # %assert_fail31 -- arg1 field @12 differs from arg0's: message .L.str.19 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.19) | |
| addi a0, a0, %lo(.L.str.19) | |
| j .LBB10_27 | |
| .Lfunc_end10: | |
| .size fuse_relu_1, .Lfunc_end10-fuse_relu_1 | |
| .cfi_endproc | |
| # -- End function | |
| .section .sdata,"aw",@progbits | |
| .p2align 2 # -- Begin function fuse_relu_1_compute_ | |
| .LCPI11_0: | |
| .word 0 # float 0 | |
| .text | |
| .globl fuse_relu_1_compute_ | |
| .p2align 2 | |
| .type fuse_relu_1_compute_,@function | |
| # fuse_relu_1_compute_: out[i] = fmax(in[i], 0.0f) for i = 0 .. 12543. | |
| # In:  a0 = destination float array, a1 = source float array. | |
| # Out: nothing; leaf routine without a stack frame. | |
| # Scratch registers written: a0, a1, a2, a3, ft0, ft1. | |
| fuse_relu_1_compute_: # @fuse_relu_1_compute_ | |
| # %bb.0: # %entry | |
| lui a3, %hi(.LCPI11_0) | |
| flw ft0, %lo(.LCPI11_0)(a3) # ft0 = 0.0f, the lower clamp | |
| lui a2, 12 | |
| addiw a2, a2, 1024 # a2 = 50176 = 12544 elements * 4 bytes | |
| add a2, a1, a2 # a2 = address one past the last source element | |
| .LBB11_1: # %for_body | |
| # =>This Inner Loop Header: Depth=1 | |
| flw ft1, 0(a1) | |
| addi a1, a1, 4 | |
| fmax.s ft1, ft1, ft0 | |
| fsw ft1, 0(a0) | |
| addi a0, a0, 4 | |
| bne a1, a2, .LBB11_1 # loop until the source pointer reaches the end address | |
| # %bb.2: # %for_end | |
| ret | |
| .Lfunc_end11: | |
| .size fuse_relu_1_compute_, .Lfunc_end11-fuse_relu_1_compute_ | |
| # -- End function | |
| .globl fuse_max_pool2d_1 # -- Begin function fuse_max_pool2d_1: checks its two packed arguments, then calls fuse_max_pool2d_1_compute_ | |
| .p2align 2 | |
| .type fuse_max_pool2d_1,@function | |
| fuse_max_pool2d_1: # @fuse_max_pool2d_1 -- in: a0 = array of 8-byte argument handles, a1 = array of 32-bit type codes, a2 = argument count (low 32 bits used); out: a0 = 0 on success, 0xFFFFFFFF after any failed check | |
| .cfi_startproc | |
| # %bb.0: # %entry -- 16-byte frame saving ra/s0; require argument count == 2. Offsets named "@N" below are byte offsets into an argument handle (presumably a DLTensor: data @0, device @8/@12, ndim @16, dtype @20-23, shape @24, strides @32, byte offset @40 -- TODO confirm) | |
| addi sp, sp, -16 | |
| .cfi_def_cfa_offset 16 | |
| sd ra, 8(sp) | |
| sd s0, 0(sp) | |
| .cfi_offset ra, -8 | |
| .cfi_offset s0, -16 | |
| slli a2, a2, 32 | |
| srli a2, a2, 32 | |
| addi a3, zero, 2 | |
| bne a2, a3, .LBB12_42 | |
| # %bb.1: # %assert_end -- t3/t0 = type codes of arg0/arg1, a5/a2 = arg0/arg1 handles; from arg0: t2 = field @24, a1 = field @0, a0 = field @32 (the next four checks are skipped when it is null) | |
| lwu t0, 4(a1) | |
| ld a2, 8(a0) | |
| lwu t3, 0(a1) | |
| ld a5, 0(a0) | |
| ld t2, 24(a5) | |
| ld a1, 0(a5) | |
| ld a0, 32(a5) | |
| beqz a0, .LBB12_6 | |
| # %bb.2: # %if_then -- arg0 field @32 is non-null: entry at +0 (32-bit load) must be 12544 (lui 3 + 256) | |
| lui a3, 3 | |
| addiw a3, a3, 256 | |
| lw s0, 0(a0) | |
| bne s0, a3, .LBB12_43 | |
| # %bb.3: # %if_then -- entry at +8 (low 32 bits) must be 196 | |
| ld a3, 8(a0) | |
| slli a3, a3, 32 | |
| srli a3, a3, 32 | |
| addi s0, zero, 196 | |
| bne a3, s0, .LBB12_43 | |
| # %bb.4: # %if_then -- entry at +16 (low 32 bits) must be 14 | |
| ld a3, 16(a0) | |
| slli a3, a3, 32 | |
| srli a3, a3, 32 | |
| addi s0, zero, 14 | |
| bne a3, s0, .LBB12_43 | |
| # %bb.5: # %if_then -- entry at +24 (low 32 bits) must be 1 | |
| ld a0, 24(a0) | |
| slli a0, a0, 32 | |
| srli a0, a0, 32 | |
| addi a3, zero, 1 | |
| bne a0, a3, .LBB12_43 | |
| .LBB12_6: # %if_end -- from arg1: a7 = field @24, a0 = field @0 (later passed to compute as a0), a3 = field @32; from arg0: a6 = 32-bit field @12, t1 = 32-bit field @8 | |
| ld a7, 24(a2) | |
| ld a0, 0(a2) | |
| lwu a6, 12(a5) | |
| lwu t1, 8(a5) | |
| ld a3, 32(a2) | |
| beqz a3, .LBB12_11 | |
| # %bb.7: # %if_then3 -- arg1 field @32 is non-null: entry at +0 (32-bit load) must be 3136 (lui 1 - 960) | |
| lui s0, 1 | |
| addiw s0, s0, -960 | |
| lw a4, 0(a3) | |
| bne a4, s0, .LBB12_44 | |
| # %bb.8: # %if_then3 -- entry at +8 (low 32 bits) must be 49 | |
| ld a4, 8(a3) | |
| slli a4, a4, 32 | |
| srli a4, a4, 32 | |
| addi s0, zero, 49 | |
| bne a4, s0, .LBB12_44 | |
| # %bb.9: # %if_then3 -- entry at +16 (low 32 bits) must be 7 | |
| ld a4, 16(a3) | |
| slli a4, a4, 32 | |
| srli a4, a4, 32 | |
| addi s0, zero, 7 | |
| bne a4, s0, .LBB12_44 | |
| # %bb.10: # %if_then3 -- entry at +24 (low 32 bits) must be 1 | |
| ld a3, 24(a3) | |
| slli a3, a3, 32 | |
| srli a3, a3, 32 | |
| addi a4, zero, 1 | |
| bne a3, a4, .LBB12_44 | |
| .LBB12_11: # %if_end4 -- reject arg0 type codes above 13 (unsigned compare) | |
| addi a3, zero, 13 | |
| bltu a3, t3, .LBB12_37 | |
| # %bb.12: # %if_end4 -- accept the code only if bit (1 << code) is set in the mask 0x2098 (lui 2 + 152), i.e. code is 3, 4, 7 or 13 | |
| addi a3, zero, 1 | |
| sll a3, a3, t3 | |
| lui a4, 2 | |
| addiw a4, a4, 152 | |
| and a3, a3, a4 | |
| beqz a3, .LBB12_37 | |
| # %bb.13: # %assert_end8 -- same range test for the arg1 type code | |
| addi a3, zero, 13 | |
| bltu a3, t0, .LBB12_38 | |
| # %bb.14: # %assert_end8 -- same 0x2098 mask test for arg1; leaves a3 = 1 for the next compare | |
| addi a3, zero, 1 | |
| sll a4, a3, t0 | |
| lui s0, 2 | |
| addiw s0, s0, 152 | |
| and a4, a4, s0 | |
| beqz a4, .LBB12_38 | |
| # %bb.15: # %assert_end10 -- arg0 32-bit field @8 must equal 1 (a3 still holds 1) | |
| bne t1, a3, .LBB12_45 | |
| # %bb.16: # %assert_end12 -- arg0 32-bit field @16 must be 4 | |
| lw a3, 16(a5) | |
| addi a4, zero, 4 | |
| bne a3, a4, .LBB12_46 | |
| # %bb.17: # %assert_end14 -- arg0 halfword @22 must be 1; s0 = 1 is reused by the .LBB12_61 failure tail | |
| lhu a3, 22(a5) | |
| addi s0, zero, 1 | |
| bne a3, s0, .LBB12_47 | |
| # %bb.18: # %assert_end14 -- arg0 byte @21 must be 32 | |
| lbu a3, 21(a5) | |
| addi a4, zero, 32 | |
| bne a3, a4, .LBB12_47 | |
| # %bb.19: # %assert_end14 -- arg0 byte @20 must be 2 | |
| lbu a3, 20(a5) | |
| addi a4, zero, 2 | |
| bne a3, a4, .LBB12_47 | |
| # %bb.20: # %assert_end16 -- checks through arg0's @24 pointer (t2), 32-bit loads at 8-byte steps: entry at +0 must be 1 | |
| lw a3, 0(t2) | |
| addi s0, zero, 1 | |
| bne a3, s0, .LBB12_48 | |
| # %bb.21: # %assert_end18 -- entry at +8 must be 64 | |
| lw a3, 8(t2) | |
| addi a4, zero, 64 | |
| bne a3, a4, .LBB12_49 | |
| # %bb.22: # %assert_end20 -- entry at +16 must be 14 | |
| lw a4, 16(t2) | |
| addi a3, zero, 14 | |
| bne a4, a3, .LBB12_50 | |
| # %bb.23: # %assert_end22 -- entry at +24 must be 14 | |
| lw a4, 24(t2) | |
| bne a4, a3, .LBB12_51 | |
| # %bb.24: # %assert_end24 -- arg0 64-bit field @40 must be 0 | |
| ld a3, 40(a5) | |
| bnez a3, .LBB12_52 | |
| # %bb.25: # %assert_end26 -- the same checks repeat for arg1: 32-bit field @16 must be 4 | |
| lw a3, 16(a2) | |
| addi a4, zero, 4 | |
| bne a3, a4, .LBB12_53 | |
| # %bb.26: # %assert_end28 -- arg1 halfword @22 must be 1; s0 = 1 is reused by the .LBB12_61 failure tail | |
| lhu a3, 22(a2) | |
| addi s0, zero, 1 | |
| bne a3, s0, .LBB12_54 | |
| # %bb.27: # %assert_end28 -- arg1 byte @21 must be 32 | |
| lbu a3, 21(a2) | |
| addi a4, zero, 32 | |
| bne a3, a4, .LBB12_54 | |
| # %bb.28: # %assert_end28 -- arg1 byte @20 must be 2 | |
| lbu a3, 20(a2) | |
| addi a4, zero, 2 | |
| bne a3, a4, .LBB12_54 | |
| # %bb.29: # %assert_end30 -- checks through arg1's @24 pointer (a7): entry at +0 must be 1 | |
| lw a3, 0(a7) | |
| addi s0, zero, 1 | |
| bne a3, s0, .LBB12_55 | |
| # %bb.30: # %assert_end32 -- entry at +8 must be 64 | |
| lw a3, 8(a7) | |
| addi a4, zero, 64 | |
| bne a3, a4, .LBB12_56 | |
| # %bb.31: # %assert_end34 -- entry at +16 must be 7 | |
| lw a4, 16(a7) | |
| addi a3, zero, 7 | |
| bne a4, a3, .LBB12_57 | |
| # %bb.32: # %assert_end36 -- entry at +24 must be 7 | |
| lw a4, 24(a7) | |
| bne a4, a3, .LBB12_58 | |
| # %bb.33: # %assert_end38 -- arg1 64-bit field @40 must be 0 | |
| ld a3, 40(a2) | |
| bnez a3, .LBB12_59 | |
| # %bb.34: # %assert_end40 -- arg1 32-bit field @8 must be 1; s0 = 1 is reused by the .LBB12_61 failure tail | |
| lw a3, 8(a2) | |
| addi s0, zero, 1 | |
| bne a3, s0, .LBB12_60 | |
| # %bb.35: # %assert_end42 -- arg1 32-bit field @12 must equal arg0's field @12 (a6, sign-extended for the compare) | |
| lw a2, 12(a2) | |
| sext.w a3, a6 | |
| bne a3, a2, .LBB12_62 | |
| # %bb.36: # %assert_end44 -- all checks passed: call compute with a0 = arg1 field @0 and a1 = arg0 field @0, then return 0 | |
| call fuse_max_pool2d_1_compute_ | |
| mv a0, zero | |
| j .LBB12_41 | |
| .LBB12_37: # %assert_fail7 -- arg0 type code rejected: a1 = function pointer loaded from __TVMAPISetLastError, a0 = address of .L.str.92 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.92) | |
| addi a0, a0, %lo(.L.str.92) | |
| j .LBB12_39 | |
| .LBB12_38: # %assert_fail9 -- arg1 type code rejected: message .L.str.93, falls through into the shared tail | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.93) | |
| addi a0, a0, %lo(.L.str.93) | |
| .LBB12_39: # %assert_fail -- shared tail: call the handler in a1 with the message in a0, then build 1 << 32 | |
| jalr a1 | |
| addi a0, zero, 1 | |
| slli a0, a0, 32 | |
| .LBB12_40: # %assert_fail15 -- (1 << 32) - 1 gives the failure return value 0x00000000FFFFFFFF; NOTE(review): this is -1 only when read as a 32-bit value -- confirm callers look at the low 32 bits | |
| addi a0, a0, -1 | |
| .LBB12_41: # %assert_fail15 -- common epilogue: restore s0/ra, release the 16-byte frame, return a0 | |
| ld s0, 0(sp) | |
| ld ra, 8(sp) | |
| .cfi_restore ra | |
| .cfi_restore s0 | |
| addi sp, sp, 16 | |
| .cfi_def_cfa_offset 0 | |
| ret | |
| .LBB12_42: # %assert_fail -- argument count != 2: message .L.str.89 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.89) | |
| addi a0, a0, %lo(.L.str.89) | |
| j .LBB12_39 | |
| .LBB12_43: # %assert_fail1 -- arg0 @32 entries are not 12544/196/14/1: message .L.str.90 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.90) | |
| addi a0, a0, %lo(.L.str.90) | |
| j .LBB12_39 | |
| .LBB12_44: # %assert_fail5 -- arg1 @32 entries are not 3136/49/7/1: message .L.str.91 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.91) | |
| addi a0, a0, %lo(.L.str.91) | |
| j .LBB12_39 | |
| .LBB12_45: # %assert_fail11 -- arg0 field @8 != 1: message .L.str.5 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.5) | |
| addi a0, a0, %lo(.L.str.5) | |
| j .LBB12_39 | |
| .LBB12_46: # %assert_fail13 -- arg0 field @16 != 4: message .L.str.29 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.29) | |
| addi a0, a0, %lo(.L.str.29) | |
| j .LBB12_39 | |
| .LBB12_47: # %assert_fail15 -- arg0 bytes @20-23 mismatch: message .L.str.7 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.7) | |
| addi a0, a0, %lo(.L.str.7) | |
| j .LBB12_61 | |
| .LBB12_48: # %assert_fail17 -- entry +0 behind arg0's @24 pointer != 1: message .L.str.8 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.8) | |
| addi a0, a0, %lo(.L.str.8) | |
| j .LBB12_61 | |
| .LBB12_49: # %assert_fail19 -- entry +8 behind arg0's @24 pointer != 64: message .L.str.94 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.94) | |
| addi a0, a0, %lo(.L.str.94) | |
| j .LBB12_39 | |
| .LBB12_50: # %assert_fail21 -- entry +16 behind arg0's @24 pointer != 14: message .L.str.77 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.77) | |
| addi a0, a0, %lo(.L.str.77) | |
| j .LBB12_39 | |
| .LBB12_51: # %assert_fail23 -- entry +24 behind arg0's @24 pointer != 14: message .L.str.78 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.78) | |
| addi a0, a0, %lo(.L.str.78) | |
| j .LBB12_39 | |
| .LBB12_52: # %assert_fail25 -- arg0 field @40 != 0: message .L.str.10 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.10) | |
| addi a0, a0, %lo(.L.str.10) | |
| j .LBB12_39 | |
| .LBB12_53: # %assert_fail27 -- arg1 field @16 != 4: message .L.str.11 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.11) | |
| addi a0, a0, %lo(.L.str.11) | |
| j .LBB12_39 | |
| .LBB12_54: # %assert_fail29 -- arg1 bytes @20-23 mismatch: message .L.str.12 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.12) | |
| addi a0, a0, %lo(.L.str.12) | |
| j .LBB12_61 | |
| .LBB12_55: # %assert_fail31 -- entry +0 behind arg1's @24 pointer != 1: message .L.str.13 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.13) | |
| addi a0, a0, %lo(.L.str.13) | |
| j .LBB12_61 | |
| .LBB12_56: # %assert_fail33 -- entry +8 behind arg1's @24 pointer != 64: message .L.str.95 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.95) | |
| addi a0, a0, %lo(.L.str.95) | |
| j .LBB12_39 | |
| .LBB12_57: # %assert_fail35 -- entry +16 behind arg1's @24 pointer != 7: message .L.str.96 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.96) | |
| addi a0, a0, %lo(.L.str.96) | |
| j .LBB12_39 | |
| .LBB12_58: # %assert_fail37 -- entry +24 behind arg1's @24 pointer != 7: message .L.str.97 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.97) | |
| addi a0, a0, %lo(.L.str.97) | |
| j .LBB12_39 | |
| .LBB12_59: # %assert_fail39 -- arg1 field @40 != 0: message .L.str.17 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.17) | |
| addi a0, a0, %lo(.L.str.17) | |
| j .LBB12_39 | |
| .LBB12_60: # %assert_fail41 -- arg1 field @8 != 1: message .L.str.18, falls through into .LBB12_61 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.18) | |
| addi a0, a0, %lo(.L.str.18) | |
| .LBB12_61: # %assert_fail15 -- shared tail for the checks that left 1 in s0: call the handler, then seed the return value with s0 << 32 (s0 must survive the indirect call) | |
| jalr a1 | |
| slli a0, s0, 32 | |
| j .LBB12_40 | |
| .LBB12_62: # %assert_fail43 -- arg1 field @12 differs from arg0's: message .L.str.19 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.19) | |
| addi a0, a0, %lo(.L.str.19) | |
| j .LBB12_39 | |
| .Lfunc_end12: | |
| .size fuse_max_pool2d_1, .Lfunc_end12-fuse_max_pool2d_1 | |
| .cfi_endproc | |
| # -- End function | |
| .section .sdata,"aw",@progbits | |
| .p2align 2 # -- Begin function fuse_max_pool2d_1_compute_: 2x2 window, stride-2 maximum over 64 planes of 14x14 floats (a1), written as 64 planes of 7x7 floats (a0) | |
| .LCPI13_0: | |
| .word 4286578687 # float -3.40282347E+38 -- starting value of every running maximum | |
| .text | |
| .globl fuse_max_pool2d_1_compute_ | |
| .p2align 2 | |
| .type fuse_max_pool2d_1_compute_,@function | |
| fuse_max_pool2d_1_compute_: # @fuse_max_pool2d_1_compute_ -- in: a0 = output base, a1 = input base; leaf routine without a stack frame; writes a0-a7, t0, ft0-ft2 | |
| # %bb.0: # %entry -- a7 = input + 56 bytes (the lower row of the first row pair; the upper row is read at negative offsets), ft0 = constant from .LCPI13_0, a2 = 220 (inner-loop end value), a6 = 64 (plane count), t0 = plane index | |
| addi a7, a1, 56 | |
| lui a1, %hi(.LCPI13_0) | |
| addi a1, a1, %lo(.LCPI13_0) | |
| flw ft0, 0(a1) | |
| addi a2, zero, 220 | |
| addi a6, zero, 64 | |
| mv t0, zero | |
| j .LBB13_2 | |
| .LBB13_1: # %for_end3 -- next plane: input += 784 bytes (196 floats), output += 196 bytes (49 floats); leave after 64 planes | |
| # in Loop: Header=BB13_2 Depth=1 | |
| addi a7, a7, 784 | |
| addi a0, a0, 196 | |
| addi t0, t0, 1 | |
| beq t0, a6, .LBB13_60 | |
| .LBB13_2: # %for_begin1.preheader -- start a plane: a5 = 24 (output row byte offset biased by 24), a1 = lower-row pointer for the first row pair | |
| # =>This Loop Header: Depth=1 | |
| # Child Loop BB13_4 Depth 2 | |
| addi a5, zero, 24 | |
| mv a1, a7 | |
| j .LBB13_4 | |
| .LBB13_3: # %for_begin4.preheader -- store the 7th result of the row at 0(a3), advance a1 by 112 bytes (two input rows) and a5 by 28 bytes (one output row); the row loop ends when a5 reaches 220, i.e. after 7 rows | |
| # in Loop: Header=BB13_4 Depth=2 | |
| fsw ft1, 0(a3) | |
| addi a1, a1, 112 | |
| addi a5, a5, 28 | |
| beq a5, a2, .LBB13_1 | |
| .LBB13_4: # %for_begin4.preheader -- window 0 (inputs at -56, -52, 0, 4 from a1): ft1 starts as ft0; each input replaces ft1 unless flt.s reports input < ft1 (flt.s is false for NaN operands per the RISC-V F spec, so a NaN input is taken) | |
| # Parent Loop BB13_2 Depth=1 | |
| # => This Inner Loop Header: Depth=2 | |
| flw ft2, -56(a1) | |
| flt.s a3, ft2, ft0 | |
| fmv.s ft1, ft0 | |
| bnez a3, .LBB13_6 | |
| # %bb.5: # %for_begin4.preheader | |
| # in Loop: Header=BB13_4 Depth=2 | |
| fmv.s ft1, ft2 | |
| .LBB13_6: # %for_begin4.preheader | |
| # in Loop: Header=BB13_4 Depth=2 | |
| flw ft2, -52(a1) | |
| flt.s a3, ft2, ft1 | |
| bnez a3, .LBB13_8 | |
| # %bb.7: # %for_begin4.preheader | |
| # in Loop: Header=BB13_4 Depth=2 | |
| fmv.s ft1, ft2 | |
| .LBB13_8: # %for_begin4.preheader | |
| # in Loop: Header=BB13_4 Depth=2 | |
| flw ft2, 0(a1) | |
| flt.s a3, ft2, ft1 | |
| bnez a3, .LBB13_10 | |
| # %bb.9: # %for_begin4.preheader | |
| # in Loop: Header=BB13_4 Depth=2 | |
| fmv.s ft1, ft2 | |
| .LBB13_10: # %for_begin4.preheader | |
| # in Loop: Header=BB13_4 Depth=2 | |
| flw ft2, 4(a1) | |
| flt.s a3, ft2, ft1 | |
| bnez a3, .LBB13_12 | |
| # %bb.11: # %for_begin4.preheader | |
| # in Loop: Header=BB13_4 Depth=2 | |
| fmv.s ft1, ft2 | |
| .LBB13_12: # %for_begin4.preheader -- a3 = a0 + a5 (output row pointer + 24; a3 was only a compare scratch until here, a4 takes that role below); store window 0 at -24(a3); window 1 reads -48, -44, 8, 12 | |
| # in Loop: Header=BB13_4 Depth=2 | |
| add a3, a0, a5 | |
| fsw ft1, -24(a3) | |
| flw ft2, -48(a1) | |
| flt.s a4, ft2, ft0 | |
| fmv.s ft1, ft0 | |
| bnez a4, .LBB13_14 | |
| # %bb.13: # %for_begin4.preheader | |
| # in Loop: Header=BB13_4 Depth=2 | |
| fmv.s ft1, ft2 | |
| .LBB13_14: # %for_begin4.preheader | |
| # in Loop: Header=BB13_4 Depth=2 | |
| flw ft2, -44(a1) | |
| flt.s a4, ft2, ft1 | |
| bnez a4, .LBB13_16 | |
| # %bb.15: # %for_begin4.preheader | |
| # in Loop: Header=BB13_4 Depth=2 | |
| fmv.s ft1, ft2 | |
| .LBB13_16: # %for_begin4.preheader | |
| # in Loop: Header=BB13_4 Depth=2 | |
| flw ft2, 8(a1) | |
| flt.s a4, ft2, ft1 | |
| bnez a4, .LBB13_18 | |
| # %bb.17: # %for_begin4.preheader | |
| # in Loop: Header=BB13_4 Depth=2 | |
| fmv.s ft1, ft2 | |
| .LBB13_18: # %for_begin4.preheader | |
| # in Loop: Header=BB13_4 Depth=2 | |
| flw ft2, 12(a1) | |
| flt.s a4, ft2, ft1 | |
| bnez a4, .LBB13_20 | |
| # %bb.19: # %for_begin4.preheader | |
| # in Loop: Header=BB13_4 Depth=2 | |
| fmv.s ft1, ft2 | |
| .LBB13_20: # %for_begin4.preheader -- store window 1 at -20(a3); window 2 reads -40, -36, 16, 20 | |
| # in Loop: Header=BB13_4 Depth=2 | |
| fsw ft1, -20(a3) | |
| flw ft2, -40(a1) | |
| flt.s a4, ft2, ft0 | |
| fmv.s ft1, ft0 | |
| bnez a4, .LBB13_22 | |
| # %bb.21: # %for_begin4.preheader | |
| # in Loop: Header=BB13_4 Depth=2 | |
| fmv.s ft1, ft2 | |
| .LBB13_22: # %for_begin4.preheader | |
| # in Loop: Header=BB13_4 Depth=2 | |
| flw ft2, -36(a1) | |
| flt.s a4, ft2, ft1 | |
| bnez a4, .LBB13_24 | |
| # %bb.23: # %for_begin4.preheader | |
| # in Loop: Header=BB13_4 Depth=2 | |
| fmv.s ft1, ft2 | |
| .LBB13_24: # %for_begin4.preheader | |
| # in Loop: Header=BB13_4 Depth=2 | |
| flw ft2, 16(a1) | |
| flt.s a4, ft2, ft1 | |
| bnez a4, .LBB13_26 | |
| # %bb.25: # %for_begin4.preheader | |
| # in Loop: Header=BB13_4 Depth=2 | |
| fmv.s ft1, ft2 | |
| .LBB13_26: # %for_begin4.preheader | |
| # in Loop: Header=BB13_4 Depth=2 | |
| flw ft2, 20(a1) | |
| flt.s a4, ft2, ft1 | |
| bnez a4, .LBB13_28 | |
| # %bb.27: # %for_begin4.preheader | |
| # in Loop: Header=BB13_4 Depth=2 | |
| fmv.s ft1, ft2 | |
| .LBB13_28: # %for_begin4.preheader -- store window 2 at -16(a3); window 3 reads -32, -28, 24, 28 | |
| # in Loop: Header=BB13_4 Depth=2 | |
| fsw ft1, -16(a3) | |
| flw ft2, -32(a1) | |
| flt.s a4, ft2, ft0 | |
| fmv.s ft1, ft0 | |
| bnez a4, .LBB13_30 | |
| # %bb.29: # %for_begin4.preheader | |
| # in Loop: Header=BB13_4 Depth=2 | |
| fmv.s ft1, ft2 | |
| .LBB13_30: # %for_begin4.preheader | |
| # in Loop: Header=BB13_4 Depth=2 | |
| flw ft2, -28(a1) | |
| flt.s a4, ft2, ft1 | |
| bnez a4, .LBB13_32 | |
| # %bb.31: # %for_begin4.preheader | |
| # in Loop: Header=BB13_4 Depth=2 | |
| fmv.s ft1, ft2 | |
| .LBB13_32: # %for_begin4.preheader | |
| # in Loop: Header=BB13_4 Depth=2 | |
| flw ft2, 24(a1) | |
| flt.s a4, ft2, ft1 | |
| bnez a4, .LBB13_34 | |
| # %bb.33: # %for_begin4.preheader | |
| # in Loop: Header=BB13_4 Depth=2 | |
| fmv.s ft1, ft2 | |
| .LBB13_34: # %for_begin4.preheader | |
| # in Loop: Header=BB13_4 Depth=2 | |
| flw ft2, 28(a1) | |
| flt.s a4, ft2, ft1 | |
| bnez a4, .LBB13_36 | |
| # %bb.35: # %for_begin4.preheader | |
| # in Loop: Header=BB13_4 Depth=2 | |
| fmv.s ft1, ft2 | |
| .LBB13_36: # %for_begin4.preheader -- store window 3 at -12(a3); window 4 reads -24, -20, 32, 36 | |
| # in Loop: Header=BB13_4 Depth=2 | |
| fsw ft1, -12(a3) | |
| flw ft2, -24(a1) | |
| flt.s a4, ft2, ft0 | |
| fmv.s ft1, ft0 | |
| bnez a4, .LBB13_38 | |
| # %bb.37: # %for_begin4.preheader | |
| # in Loop: Header=BB13_4 Depth=2 | |
| fmv.s ft1, ft2 | |
| .LBB13_38: # %for_begin4.preheader | |
| # in Loop: Header=BB13_4 Depth=2 | |
| flw ft2, -20(a1) | |
| flt.s a4, ft2, ft1 | |
| bnez a4, .LBB13_40 | |
| # %bb.39: # %for_begin4.preheader | |
| # in Loop: Header=BB13_4 Depth=2 | |
| fmv.s ft1, ft2 | |
| .LBB13_40: # %for_begin4.preheader | |
| # in Loop: Header=BB13_4 Depth=2 | |
| flw ft2, 32(a1) | |
| flt.s a4, ft2, ft1 | |
| bnez a4, .LBB13_42 | |
| # %bb.41: # %for_begin4.preheader | |
| # in Loop: Header=BB13_4 Depth=2 | |
| fmv.s ft1, ft2 | |
| .LBB13_42: # %for_begin4.preheader | |
| # in Loop: Header=BB13_4 Depth=2 | |
| flw ft2, 36(a1) | |
| flt.s a4, ft2, ft1 | |
| bnez a4, .LBB13_44 | |
| # %bb.43: # %for_begin4.preheader | |
| # in Loop: Header=BB13_4 Depth=2 | |
| fmv.s ft1, ft2 | |
| .LBB13_44: # %for_begin4.preheader -- store window 4 at -8(a3); window 5 reads -16, -12, 40, 44 | |
| # in Loop: Header=BB13_4 Depth=2 | |
| fsw ft1, -8(a3) | |
| flw ft2, -16(a1) | |
| flt.s a4, ft2, ft0 | |
| fmv.s ft1, ft0 | |
| bnez a4, .LBB13_46 | |
| # %bb.45: # %for_begin4.preheader | |
| # in Loop: Header=BB13_4 Depth=2 | |
| fmv.s ft1, ft2 | |
| .LBB13_46: # %for_begin4.preheader | |
| # in Loop: Header=BB13_4 Depth=2 | |
| flw ft2, -12(a1) | |
| flt.s a4, ft2, ft1 | |
| bnez a4, .LBB13_48 | |
| # %bb.47: # %for_begin4.preheader | |
| # in Loop: Header=BB13_4 Depth=2 | |
| fmv.s ft1, ft2 | |
| .LBB13_48: # %for_begin4.preheader | |
| # in Loop: Header=BB13_4 Depth=2 | |
| flw ft2, 40(a1) | |
| flt.s a4, ft2, ft1 | |
| bnez a4, .LBB13_50 | |
| # %bb.49: # %for_begin4.preheader | |
| # in Loop: Header=BB13_4 Depth=2 | |
| fmv.s ft1, ft2 | |
| .LBB13_50: # %for_begin4.preheader | |
| # in Loop: Header=BB13_4 Depth=2 | |
| flw ft2, 44(a1) | |
| flt.s a4, ft2, ft1 | |
| bnez a4, .LBB13_52 | |
| # %bb.51: # %for_begin4.preheader | |
| # in Loop: Header=BB13_4 Depth=2 | |
| fmv.s ft1, ft2 | |
| .LBB13_52: # %for_begin4.preheader -- store window 5 at -4(a3); window 6 reads -8, -4, 48, 52 and its result is stored at .LBB13_3 | |
| # in Loop: Header=BB13_4 Depth=2 | |
| fsw ft1, -4(a3) | |
| flw ft2, -8(a1) | |
| flt.s a4, ft2, ft0 | |
| fmv.s ft1, ft0 | |
| bnez a4, .LBB13_54 | |
| # %bb.53: # %for_begin4.preheader | |
| # in Loop: Header=BB13_4 Depth=2 | |
| fmv.s ft1, ft2 | |
| .LBB13_54: # %for_begin4.preheader | |
| # in Loop: Header=BB13_4 Depth=2 | |
| flw ft2, -4(a1) | |
| flt.s a4, ft2, ft1 | |
| bnez a4, .LBB13_56 | |
| # %bb.55: # %for_begin4.preheader | |
| # in Loop: Header=BB13_4 Depth=2 | |
| fmv.s ft1, ft2 | |
| .LBB13_56: # %for_begin4.preheader | |
| # in Loop: Header=BB13_4 Depth=2 | |
| flw ft2, 48(a1) | |
| flt.s a4, ft2, ft1 | |
| bnez a4, .LBB13_58 | |
| # %bb.57: # %for_begin4.preheader | |
| # in Loop: Header=BB13_4 Depth=2 | |
| fmv.s ft1, ft2 | |
| .LBB13_58: # %for_begin4.preheader | |
| # in Loop: Header=BB13_4 Depth=2 | |
| flw ft2, 52(a1) | |
| flt.s a4, ft2, ft1 | |
| bnez a4, .LBB13_3 | |
| # %bb.59: # %for_begin4.preheader | |
| # in Loop: Header=BB13_4 Depth=2 | |
| fmv.s ft1, ft2 | |
| j .LBB13_3 | |
| .LBB13_60: # %for_end -- all 64 planes processed | |
| ret | |
| .Lfunc_end13: | |
| .size fuse_max_pool2d_1_compute_, .Lfunc_end13-fuse_max_pool2d_1_compute_ | |
| # -- End function | |
| .globl fuse_transpose # -- Begin function fuse_transpose | |
| .p2align 2 | |
| .type fuse_transpose,@function | |
| # fuse_transpose: checking wrapper that validates its arguments and then calls | |
| # fuse_transpose_compute_. | |
| # In: a0 = pointer to an array of 8-byte slots (slots 0 and 1 are read as pointers), | |
| # a1 = pointer to an array of 32-bit words (words 0 and 1 are read), | |
| # a2 = count (only the low 32 bits are compared, and they must equal 2). | |
| # Out: a0 = 0 after the compute call. On any failed check the function pointer | |
| # stored at __TVMAPISetLastError is called with a message address in a0 and | |
| # the function returns a0 = (1 << 32) - 1. | |
| # NOTE(review): the field offsets read from the two objects (+0, +8/+12, +16, | |
| # +20..+22, +24, +32, +40) look like a DLTensor layout (data, device, ndim, dtype, | |
| # shape, strides, byte offset) -- confirm against the TVM/dlpack headers. | |
| fuse_transpose: # @fuse_transpose | |
| .cfi_startproc | |
| # %bb.0: # %entry | |
| addi sp, sp, -16 | |
| .cfi_def_cfa_offset 16 | |
| sd ra, 8(sp) | |
| sd s0, 0(sp) | |
| .cfi_offset ra, -8 | |
| .cfi_offset s0, -16 | |
| # Zero-extend the low 32 bits of a2 and require the result to be 2. | |
| slli a2, a2, 32 | |
| srli a2, a2, 32 | |
| addi a3, zero, 2 | |
| bne a2, a3, .LBB14_42 | |
| # %bb.1: # %assert_end | |
| # t3/t0 = words 0 and 1 at a1; a5/a2 = pointers from slots 0 and 1 at a0. | |
| # From the first object (a5): t2 = field +24, a1 = field +0, a0 = field +32. | |
| lwu t0, 4(a1) | |
| ld a2, 8(a0) | |
| lwu t3, 0(a1) | |
| ld a5, 0(a0) | |
| ld t2, 24(a5) | |
| ld a1, 0(a5) | |
| ld a0, 32(a5) | |
| # A zero pointer at +32 skips the four element checks below. | |
| beqz a0, .LBB14_6 | |
| # %bb.2: # %if_then | |
| # a3 = 4096 - 960 = 3136. The low 32 bits of the elements at +0, +8, +16, +24 | |
| # of that array must be 3136, 49, 7, 1. | |
| lui a3, 1 | |
| addiw a3, a3, -960 | |
| lw s0, 0(a0) | |
| bne s0, a3, .LBB14_43 | |
| # %bb.3: # %if_then | |
| ld a3, 8(a0) | |
| slli a3, a3, 32 | |
| srli a3, a3, 32 | |
| addi s0, zero, 49 | |
| bne a3, s0, .LBB14_43 | |
| # %bb.4: # %if_then | |
| ld a3, 16(a0) | |
| slli a3, a3, 32 | |
| srli a3, a3, 32 | |
| addi s0, zero, 7 | |
| bne a3, s0, .LBB14_43 | |
| # %bb.5: # %if_then | |
| ld a0, 24(a0) | |
| slli a0, a0, 32 | |
| srli a0, a0, 32 | |
| addi a3, zero, 1 | |
| bne a0, a3, .LBB14_43 | |
| .LBB14_6: # %if_end | |
| # Second object (a2): a7 = field +24, a0 = field +0, a3 = field +32. | |
| # a6/t1 keep the words at +12/+8 of the first object for the later checks. | |
| ld a7, 24(a2) | |
| ld a0, 0(a2) | |
| lwu a6, 12(a5) | |
| lwu t1, 8(a5) | |
| ld a3, 32(a2) | |
| beqz a3, .LBB14_11 | |
| # %bb.7: # %if_then3 | |
| # When present, the elements at +0, +8, +16, +24 must be 3136, 448, 64, 1. | |
| lui s0, 1 | |
| addiw s0, s0, -960 | |
| lw a4, 0(a3) | |
| bne a4, s0, .LBB14_44 | |
| # %bb.8: # %if_then3 | |
| ld a4, 8(a3) | |
| slli a4, a4, 32 | |
| srli a4, a4, 32 | |
| addi s0, zero, 448 | |
| bne a4, s0, .LBB14_44 | |
| # %bb.9: # %if_then3 | |
| ld a4, 16(a3) | |
| slli a4, a4, 32 | |
| srli a4, a4, 32 | |
| addi s0, zero, 64 | |
| bne a4, s0, .LBB14_44 | |
| # %bb.10: # %if_then3 | |
| ld a3, 24(a3) | |
| slli a3, a3, 32 | |
| srli a3, a3, 32 | |
| addi a4, zero, 1 | |
| bne a3, a4, .LBB14_44 | |
| .LBB14_11: # %if_end4 | |
| # t3 must be <= 13 and (1 << t3) must hit the mask 0x2098 (bits 3, 4, 7, 13). | |
| # NOTE(review): presumably the set of accepted TVM argument type codes -- confirm. | |
| addi a3, zero, 13 | |
| bltu a3, t3, .LBB14_37 | |
| # %bb.12: # %if_end4 | |
| addi a3, zero, 1 | |
| sll a3, a3, t3 | |
| lui a4, 2 | |
| addiw a4, a4, 152 | |
| and a3, a3, a4 | |
| beqz a3, .LBB14_37 | |
| # %bb.13: # %assert_end8 | |
| # Same range and mask test for t0. | |
| addi a3, zero, 13 | |
| bltu a3, t0, .LBB14_38 | |
| # %bb.14: # %assert_end8 | |
| addi a3, zero, 1 | |
| sll a4, a3, t0 | |
| lui s0, 2 | |
| addiw s0, s0, 152 | |
| and a4, a4, s0 | |
| beqz a4, .LBB14_38 | |
| # %bb.15: # %assert_end10 | |
| # a3 still holds 1: the word at +8 of the first object (t1) must be 1. | |
| bne t1, a3, .LBB14_45 | |
| # %bb.16: # %assert_end12 | |
| # First object: word at +16 must be 4. | |
| lw a3, 16(a5) | |
| addi a4, zero, 4 | |
| bne a3, a4, .LBB14_46 | |
| # %bb.17: # %assert_end14 | |
| # First object: halfword +22 == 1, byte +21 == 32, byte +20 == 2. | |
| # s0 = 1 stays live into .LBB14_61, where it forms the return value. | |
| lhu a3, 22(a5) | |
| addi s0, zero, 1 | |
| bne a3, s0, .LBB14_47 | |
| # %bb.18: # %assert_end14 | |
| lbu a3, 21(a5) | |
| addi a4, zero, 32 | |
| bne a3, a4, .LBB14_47 | |
| # %bb.19: # %assert_end14 | |
| lbu a3, 20(a5) | |
| addi a4, zero, 2 | |
| bne a3, a4, .LBB14_47 | |
| # %bb.20: # %assert_end16 | |
| # Array at t2: 32-bit loads at +0, +8, +16, +24 must give 1, 64, 7, 7. | |
| lw a3, 0(t2) | |
| addi s0, zero, 1 | |
| bne a3, s0, .LBB14_48 | |
| # %bb.21: # %assert_end18 | |
| lw a3, 8(t2) | |
| addi a4, zero, 64 | |
| bne a3, a4, .LBB14_49 | |
| # %bb.22: # %assert_end20 | |
| lw a4, 16(t2) | |
| addi a3, zero, 7 | |
| bne a4, a3, .LBB14_50 | |
| # %bb.23: # %assert_end22 | |
| lw a4, 24(t2) | |
| bne a4, a3, .LBB14_51 | |
| # %bb.24: # %assert_end24 | |
| # First object: doubleword at +40 must be zero. | |
| ld a3, 40(a5) | |
| bnez a3, .LBB14_52 | |
| # %bb.25: # %assert_end26 | |
| # Second object (a2): word at +16 must be 4. | |
| lw a3, 16(a2) | |
| addi a4, zero, 4 | |
| bne a3, a4, .LBB14_53 | |
| # %bb.26: # %assert_end28 | |
| # Second object: halfword +22 == 1, byte +21 == 32, byte +20 == 2. | |
| lhu a3, 22(a2) | |
| addi s0, zero, 1 | |
| bne a3, s0, .LBB14_54 | |
| # %bb.27: # %assert_end28 | |
| lbu a3, 21(a2) | |
| addi a4, zero, 32 | |
| bne a3, a4, .LBB14_54 | |
| # %bb.28: # %assert_end28 | |
| lbu a3, 20(a2) | |
| addi a4, zero, 2 | |
| bne a3, a4, .LBB14_54 | |
| # %bb.29: # %assert_end30 | |
| # Array at a7: 32-bit loads at +0, +8, +16, +24 must give 1, 7, 7, 64. | |
| lw a3, 0(a7) | |
| addi s0, zero, 1 | |
| bne a3, s0, .LBB14_55 | |
| # %bb.30: # %assert_end32 | |
| lw a4, 8(a7) | |
| addi a3, zero, 7 | |
| bne a4, a3, .LBB14_56 | |
| # %bb.31: # %assert_end34 | |
| lw a4, 16(a7) | |
| bne a4, a3, .LBB14_57 | |
| # %bb.32: # %assert_end36 | |
| lw a3, 24(a7) | |
| addi a4, zero, 64 | |
| bne a3, a4, .LBB14_58 | |
| # %bb.33: # %assert_end38 | |
| # Second object: doubleword at +40 must be zero. | |
| ld a3, 40(a2) | |
| bnez a3, .LBB14_59 | |
| # %bb.34: # %assert_end40 | |
| # Second object: word at +8 must be 1. | |
| lw a3, 8(a2) | |
| addi s0, zero, 1 | |
| bne a3, s0, .LBB14_60 | |
| # %bb.35: # %assert_end42 | |
| # Word at +12 of the second object must equal the one saved from the first (a6). | |
| lw a2, 12(a2) | |
| sext.w a3, a6 | |
| bne a3, a2, .LBB14_62 | |
| # %bb.36: # %assert_end44 | |
| # All checks passed: a0 = field +0 of the second object, a1 = field +0 of the first. | |
| call fuse_transpose_compute_ | |
| mv a0, zero | |
| j .LBB14_41 | |
| # Failure blocks: each loads the function pointer stored at __TVMAPISetLastError | |
| # into a1 and a message address into a0, then joins .LBB14_39 or .LBB14_61. | |
| .LBB14_37: # %assert_fail7 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.101) | |
| addi a0, a0, %lo(.L.str.101) | |
| j .LBB14_39 | |
| .LBB14_38: # %assert_fail9 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.102) | |
| addi a0, a0, %lo(.L.str.102) | |
| .LBB14_39: # %assert_fail | |
| # Shared failure tail: call the handler, then build a0 = (1 << 32) - 1. | |
| jalr a1 | |
| addi a0, zero, 1 | |
| slli a0, a0, 32 | |
| .LBB14_40: # %assert_fail15 | |
| addi a0, a0, -1 | |
| .LBB14_41: # %assert_fail15 | |
| # Common epilogue: restore s0/ra, release the 16-byte frame, return a0. | |
| ld s0, 0(sp) | |
| ld ra, 8(sp) | |
| .cfi_restore ra | |
| .cfi_restore s0 | |
| addi sp, sp, 16 | |
| .cfi_def_cfa_offset 0 | |
| ret | |
| .LBB14_42: # %assert_fail | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.98) | |
| addi a0, a0, %lo(.L.str.98) | |
| j .LBB14_39 | |
| .LBB14_43: # %assert_fail1 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.99) | |
| addi a0, a0, %lo(.L.str.99) | |
| j .LBB14_39 | |
| .LBB14_44: # %assert_fail5 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.100) | |
| addi a0, a0, %lo(.L.str.100) | |
| j .LBB14_39 | |
| .LBB14_45: # %assert_fail11 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.5) | |
| addi a0, a0, %lo(.L.str.5) | |
| j .LBB14_39 | |
| .LBB14_46: # %assert_fail13 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.29) | |
| addi a0, a0, %lo(.L.str.29) | |
| j .LBB14_39 | |
| .LBB14_47: # %assert_fail15 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.7) | |
| addi a0, a0, %lo(.L.str.7) | |
| j .LBB14_61 | |
| .LBB14_48: # %assert_fail17 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.8) | |
| addi a0, a0, %lo(.L.str.8) | |
| j .LBB14_61 | |
| .LBB14_49: # %assert_fail19 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.94) | |
| addi a0, a0, %lo(.L.str.94) | |
| j .LBB14_39 | |
| .LBB14_50: # %assert_fail21 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.103) | |
| addi a0, a0, %lo(.L.str.103) | |
| j .LBB14_39 | |
| .LBB14_51: # %assert_fail23 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.104) | |
| addi a0, a0, %lo(.L.str.104) | |
| j .LBB14_39 | |
| .LBB14_52: # %assert_fail25 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.10) | |
| addi a0, a0, %lo(.L.str.10) | |
| j .LBB14_39 | |
| .LBB14_53: # %assert_fail27 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.11) | |
| addi a0, a0, %lo(.L.str.11) | |
| j .LBB14_39 | |
| .LBB14_54: # %assert_fail29 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.12) | |
| addi a0, a0, %lo(.L.str.12) | |
| j .LBB14_61 | |
| .LBB14_55: # %assert_fail31 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.13) | |
| addi a0, a0, %lo(.L.str.13) | |
| j .LBB14_61 | |
| .LBB14_56: # %assert_fail33 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.105) | |
| addi a0, a0, %lo(.L.str.105) | |
| j .LBB14_39 | |
| .LBB14_57: # %assert_fail35 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.96) | |
| addi a0, a0, %lo(.L.str.96) | |
| j .LBB14_39 | |
| .LBB14_58: # %assert_fail37 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.106) | |
| addi a0, a0, %lo(.L.str.106) | |
| j .LBB14_39 | |
| .LBB14_59: # %assert_fail39 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.17) | |
| addi a0, a0, %lo(.L.str.17) | |
| j .LBB14_39 | |
| .LBB14_60: # %assert_fail41 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.18) | |
| addi a0, a0, %lo(.L.str.18) | |
| .LBB14_61: # %assert_fail15 | |
| # Alternate failure tail: every branch that reaches it set s0 = 1 beforehand, so | |
| # s0 << 32 followed by the -1 at .LBB14_40 yields the same (1 << 32) - 1 result. | |
| jalr a1 | |
| slli a0, s0, 32 | |
| j .LBB14_40 | |
| .LBB14_62: # %assert_fail43 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.19) | |
| addi a0, a0, %lo(.L.str.19) | |
| j .LBB14_39 | |
| .Lfunc_end14: | |
| .size fuse_transpose, .Lfunc_end14-fuse_transpose | |
| .cfi_endproc | |
| # -- End function | |
| .globl fuse_transpose_compute_ # -- Begin function fuse_transpose_compute_ | |
| .p2align 2 | |
| .type fuse_transpose_compute_,@function | |
| # fuse_transpose_compute_: copy 7 * 7 * 64 32-bit words from a1 to a0 while | |
| # permuting the index order. For h in 0..6, w in 0..6, c in 0..63: | |
| # word at a0 + 1792*h + 256*w + 4*c = word at a1 + 196*c + 28*h + 4*w | |
| # In: a0 = destination base, a1 = source base. | |
| # Out: a0 = destination base + 7*1792, a1 = source base + 7*28. | |
| # Clobbers a3, a6, a7, t0-t5, ft0; leaf routine, no stack frame. | |
| fuse_transpose_compute_: # @fuse_transpose_compute_ | |
| # %bb.0: # %entry | |
| li a6, 7 # trip count of both outer loops | |
| li a7, 256 # bytes written per (h, w) pair: 64 words | |
| li t0, 0 # h | |
| .LBB15_1: # %for_begin1.preheader | |
| # =>This Loop Header: Depth=1 | |
| li t1, 0 # w | |
| mv t2, a1 # source cursor for (h, w) | |
| mv t3, a0 # destination cursor for (h, w) | |
| .LBB15_2: # %for_begin4.preheader | |
| # Parent Loop BB15_1 Depth=1 | |
| mv t4, t2 # source walker, advances 196 bytes per c | |
| li t5, 0 # byte offset inside the destination run | |
| .LBB15_4: # %for_body5 | |
| # => This Inner Loop Header: Depth=3 | |
| add a3, t3, t5 | |
| flw ft0, 0(t4) | |
| fsw ft0, 0(a3) | |
| addi t4, t4, 196 | |
| addi t5, t5, 4 | |
| bne t5, a7, .LBB15_4 | |
| # %bb.3: # %for_end6 | |
| addi t2, t2, 4 # next w: one word further in the source | |
| addi t3, t3, 256 # next w: next 64-word run in the destination | |
| addi t1, t1, 1 | |
| bne t1, a6, .LBB15_2 | |
| # %bb.15: # %for_end6.6 | |
| addi a0, a0, 1792 # next h: 7 runs of 256 bytes | |
| addi a1, a1, 28 # next h: 7 words further in the source | |
| addi t0, t0, 1 | |
| bne t0, a6, .LBB15_1 | |
| # %bb.16: # %for_end | |
| ret | |
| .Lfunc_end15: | |
| .size fuse_transpose_compute_, .Lfunc_end15-fuse_transpose_compute_ | |
| # -- End function | |
| .globl fuse_reshape_1 # -- Begin function fuse_reshape_1 | |
| .p2align 2 | |
| .type fuse_reshape_1,@function | |
| # fuse_reshape_1: checking wrapper that validates its arguments and then calls | |
| # fuse_reshape_1_compute_. | |
| # In: a0 = pointer to an array of 8-byte slots (slots 0 and 1 are read as pointers), | |
| # a1 = pointer to an array of 32-bit words (words 0 and 1 are read), | |
| # a2 = count (only the low 32 bits are compared, and they must equal 2). | |
| # Out: a0 = 0 after the compute call. On any failed check the function pointer | |
| # stored at __TVMAPISetLastError is called with a message address in a0 and | |
| # the function returns a0 = (1 << 32) - 1. | |
| # NOTE(review): the field offsets read from the two objects look like a DLTensor | |
| # layout (data +0, device +8/+12, ndim +16, dtype +20..+22, shape +24, strides +32, | |
| # byte offset +40) -- confirm against the TVM/dlpack headers. | |
| fuse_reshape_1: # @fuse_reshape_1 | |
| .cfi_startproc | |
| # %bb.0: # %entry | |
| addi sp, sp, -16 | |
| .cfi_def_cfa_offset 16 | |
| sd ra, 8(sp) | |
| sd s0, 0(sp) | |
| .cfi_offset ra, -8 | |
| .cfi_offset s0, -16 | |
| # Zero-extend the low 32 bits of a2 and require the result to be 2. | |
| slli a2, a2, 32 | |
| srli a2, a2, 32 | |
| addi a3, zero, 2 | |
| bne a2, a3, .LBB16_38 | |
| # %bb.1: # %assert_end | |
| # t3/t0 = words 0 and 1 at a1; a4/a2 = pointers from slots 0 and 1 at a0. | |
| # From the first object (a4): t2 = field +24, a1 = field +0, a0 = field +32. | |
| lwu t0, 4(a1) | |
| ld a2, 8(a0) | |
| lwu t3, 0(a1) | |
| ld a4, 0(a0) | |
| ld t2, 24(a4) | |
| ld a1, 0(a4) | |
| ld a0, 32(a4) | |
| # A zero pointer at +32 skips the four element checks below. | |
| beqz a0, .LBB16_6 | |
| # %bb.2: # %if_then | |
| # s0 = 4096 - 960 = 3136. The low 32 bits of the elements at +0, +8, +16, +24 | |
| # of that array must be 3136, 448, 64, 1. | |
| lui s0, 1 | |
| addiw s0, s0, -960 | |
| lw a3, 0(a0) | |
| bne a3, s0, .LBB16_39 | |
| # %bb.3: # %if_then | |
| ld a3, 8(a0) | |
| slli a3, a3, 32 | |
| srli a3, a3, 32 | |
| addi s0, zero, 448 | |
| bne a3, s0, .LBB16_39 | |
| # %bb.4: # %if_then | |
| ld a3, 16(a0) | |
| slli a3, a3, 32 | |
| srli a3, a3, 32 | |
| addi s0, zero, 64 | |
| bne a3, s0, .LBB16_39 | |
| # %bb.5: # %if_then | |
| ld a0, 24(a0) | |
| slli a0, a0, 32 | |
| srli a0, a0, 32 | |
| addi a3, zero, 1 | |
| bne a0, a3, .LBB16_39 | |
| .LBB16_6: # %if_end | |
| # Second object (a2): a7 = field +24, a0 = field +0, s0 = field +32. | |
| # a6/t1 keep the words at +12/+8 of the first object for the later checks. | |
| ld a7, 24(a2) | |
| ld a0, 0(a2) | |
| lwu a6, 12(a4) | |
| lwu t1, 8(a4) | |
| ld s0, 32(a2) | |
| beqz s0, .LBB16_9 | |
| # %bb.7: # %if_then3 | |
| # When present, the elements at +0 and +8 must be 3136 and 1. | |
| lui a3, 1 | |
| addiw a3, a3, -960 | |
| lw a5, 0(s0) | |
| bne a5, a3, .LBB16_40 | |
| # %bb.8: # %if_then3 | |
| ld a3, 8(s0) | |
| slli a3, a3, 32 | |
| srli a3, a3, 32 | |
| addi a5, zero, 1 | |
| bne a3, a5, .LBB16_40 | |
| .LBB16_9: # %if_end4 | |
| # t3 must be <= 13 and (1 << t3) must hit the mask 0x2098 (bits 3, 4, 7, 13). | |
| # NOTE(review): presumably the set of accepted TVM argument type codes -- confirm. | |
| addi a3, zero, 13 | |
| bltu a3, t3, .LBB16_33 | |
| # %bb.10: # %if_end4 | |
| addi a3, zero, 1 | |
| sll a3, a3, t3 | |
| lui a5, 2 | |
| addiw a5, a5, 152 | |
| and a3, a3, a5 | |
| beqz a3, .LBB16_33 | |
| # %bb.11: # %assert_end8 | |
| # Same range and mask test for t0. | |
| addi a3, zero, 13 | |
| bltu a3, t0, .LBB16_34 | |
| # %bb.12: # %assert_end8 | |
| addi a5, zero, 1 | |
| sll a3, a5, t0 | |
| lui s0, 2 | |
| addiw s0, s0, 152 | |
| and a3, a3, s0 | |
| beqz a3, .LBB16_34 | |
| # %bb.13: # %assert_end10 | |
| # a5 still holds 1: the word at +8 of the first object (t1) must be 1. | |
| bne t1, a5, .LBB16_41 | |
| # %bb.14: # %assert_end12 | |
| # First object: word at +16 must be 4. | |
| lw a3, 16(a4) | |
| addi a5, zero, 4 | |
| bne a3, a5, .LBB16_42 | |
| # %bb.15: # %assert_end14 | |
| # First object: halfword +22 == 1, byte +21 == 32, byte +20 == 2. | |
| # s0 = 1 stays live into .LBB16_55, where it forms the return value. | |
| lhu a3, 22(a4) | |
| addi s0, zero, 1 | |
| bne a3, s0, .LBB16_43 | |
| # %bb.16: # %assert_end14 | |
| lbu a3, 21(a4) | |
| addi a5, zero, 32 | |
| bne a3, a5, .LBB16_43 | |
| # %bb.17: # %assert_end14 | |
| lbu a3, 20(a4) | |
| addi a5, zero, 2 | |
| bne a3, a5, .LBB16_43 | |
| # %bb.18: # %assert_end16 | |
| # Array at t2: 32-bit loads at +0, +8, +16, +24 must give 1, 7, 7, 64. | |
| lw a3, 0(t2) | |
| addi s0, zero, 1 | |
| bne a3, s0, .LBB16_44 | |
| # %bb.19: # %assert_end18 | |
| lw a3, 8(t2) | |
| addi a5, zero, 7 | |
| bne a3, a5, .LBB16_45 | |
| # %bb.20: # %assert_end20 | |
| lw a3, 16(t2) | |
| bne a3, a5, .LBB16_46 | |
| # %bb.21: # %assert_end22 | |
| lw a3, 24(t2) | |
| addi a5, zero, 64 | |
| bne a3, a5, .LBB16_47 | |
| # %bb.22: # %assert_end24 | |
| # First object: doubleword at +40 must be zero. | |
| ld a3, 40(a4) | |
| bnez a3, .LBB16_48 | |
| # %bb.23: # %assert_end26 | |
| # Second object (a2): word at +16 must be 2. | |
| lw a3, 16(a2) | |
| addi a4, zero, 2 | |
| bne a3, a4, .LBB16_49 | |
| # %bb.24: # %assert_end28 | |
| # Second object: halfword +22 == 1, byte +21 == 32, byte +20 == 2. | |
| lhu a3, 22(a2) | |
| addi s0, zero, 1 | |
| bne a3, s0, .LBB16_50 | |
| # %bb.25: # %assert_end28 | |
| lbu a3, 21(a2) | |
| addi a4, zero, 32 | |
| bne a3, a4, .LBB16_50 | |
| # %bb.26: # %assert_end28 | |
| lbu a3, 20(a2) | |
| addi a4, zero, 2 | |
| bne a3, a4, .LBB16_50 | |
| # %bb.27: # %assert_end30 | |
| # Array at a7: 32-bit loads at +0 and +8 must give 1 and 3136. | |
| lw a3, 0(a7) | |
| addi s0, zero, 1 | |
| bne a3, s0, .LBB16_51 | |
| # %bb.28: # %assert_end32 | |
| lui a3, 1 | |
| addiw a3, a3, -960 | |
| lw a4, 8(a7) | |
| bne a4, a3, .LBB16_52 | |
| # %bb.29: # %assert_end34 | |
| # Second object: doubleword at +40 must be zero. | |
| ld a3, 40(a2) | |
| bnez a3, .LBB16_53 | |
| # %bb.30: # %assert_end36 | |
| # Second object: word at +8 must be 1. | |
| lw a3, 8(a2) | |
| addi s0, zero, 1 | |
| bne a3, s0, .LBB16_54 | |
| # %bb.31: # %assert_end38 | |
| # Word at +12 of the second object must equal the one saved from the first (a6). | |
| lw a2, 12(a2) | |
| sext.w a3, a6 | |
| bne a3, a2, .LBB16_56 | |
| # %bb.32: # %assert_end40 | |
| # All checks passed: a0 = field +0 of the second object, a1 = field +0 of the first. | |
| call fuse_reshape_1_compute_ | |
| mv a0, zero | |
| j .LBB16_37 | |
| # Failure blocks: each loads the function pointer stored at __TVMAPISetLastError | |
| # into a1 and a message address into a0, then joins .LBB16_35 or .LBB16_55. | |
| .LBB16_33: # %assert_fail7 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.110) | |
| addi a0, a0, %lo(.L.str.110) | |
| j .LBB16_35 | |
| .LBB16_34: # %assert_fail9 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.111) | |
| addi a0, a0, %lo(.L.str.111) | |
| .LBB16_35: # %assert_fail | |
| # Shared failure tail: call the handler, then build a0 = (1 << 32) - 1. | |
| jalr a1 | |
| addi a0, zero, 1 | |
| slli a0, a0, 32 | |
| .LBB16_36: # %assert_fail15 | |
| addi a0, a0, -1 | |
| .LBB16_37: # %assert_fail15 | |
| # Common epilogue: restore s0/ra, release the 16-byte frame, return a0. | |
| ld s0, 0(sp) | |
| ld ra, 8(sp) | |
| .cfi_restore ra | |
| .cfi_restore s0 | |
| addi sp, sp, 16 | |
| .cfi_def_cfa_offset 0 | |
| ret | |
| .LBB16_38: # %assert_fail | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.107) | |
| addi a0, a0, %lo(.L.str.107) | |
| j .LBB16_35 | |
| .LBB16_39: # %assert_fail1 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.108) | |
| addi a0, a0, %lo(.L.str.108) | |
| j .LBB16_35 | |
| .LBB16_40: # %assert_fail5 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.109) | |
| addi a0, a0, %lo(.L.str.109) | |
| j .LBB16_35 | |
| .LBB16_41: # %assert_fail11 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.5) | |
| addi a0, a0, %lo(.L.str.5) | |
| j .LBB16_35 | |
| .LBB16_42: # %assert_fail13 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.29) | |
| addi a0, a0, %lo(.L.str.29) | |
| j .LBB16_35 | |
| .LBB16_43: # %assert_fail15 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.7) | |
| addi a0, a0, %lo(.L.str.7) | |
| j .LBB16_55 | |
| .LBB16_44: # %assert_fail17 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.8) | |
| addi a0, a0, %lo(.L.str.8) | |
| j .LBB16_55 | |
| .LBB16_45: # %assert_fail19 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.112) | |
| addi a0, a0, %lo(.L.str.112) | |
| j .LBB16_35 | |
| .LBB16_46: # %assert_fail21 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.103) | |
| addi a0, a0, %lo(.L.str.103) | |
| j .LBB16_35 | |
| .LBB16_47: # %assert_fail23 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.113) | |
| addi a0, a0, %lo(.L.str.113) | |
| j .LBB16_35 | |
| .LBB16_48: # %assert_fail25 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.10) | |
| addi a0, a0, %lo(.L.str.10) | |
| j .LBB16_35 | |
| .LBB16_49: # %assert_fail27 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.114) | |
| addi a0, a0, %lo(.L.str.114) | |
| j .LBB16_35 | |
| .LBB16_50: # %assert_fail29 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.12) | |
| addi a0, a0, %lo(.L.str.12) | |
| j .LBB16_55 | |
| .LBB16_51: # %assert_fail31 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.13) | |
| addi a0, a0, %lo(.L.str.13) | |
| j .LBB16_55 | |
| .LBB16_52: # %assert_fail33 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.115) | |
| addi a0, a0, %lo(.L.str.115) | |
| j .LBB16_35 | |
| .LBB16_53: # %assert_fail35 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.17) | |
| addi a0, a0, %lo(.L.str.17) | |
| j .LBB16_35 | |
| .LBB16_54: # %assert_fail37 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.18) | |
| addi a0, a0, %lo(.L.str.18) | |
| .LBB16_55: # %assert_fail15 | |
| # Alternate failure tail: every branch that reaches it set s0 = 1 beforehand, so | |
| # s0 << 32 followed by the -1 at .LBB16_36 yields the same (1 << 32) - 1 result. | |
| jalr a1 | |
| slli a0, s0, 32 | |
| j .LBB16_36 | |
| .LBB16_56: # %assert_fail39 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.19) | |
| addi a0, a0, %lo(.L.str.19) | |
| j .LBB16_35 | |
| .Lfunc_end16: | |
| .size fuse_reshape_1, .Lfunc_end16-fuse_reshape_1 | |
| .cfi_endproc | |
| # -- End function | |
| .globl fuse_reshape_1_compute_ # -- Begin function fuse_reshape_1_compute_ | |
| .p2align 2 | |
| .type fuse_reshape_1_compute_,@function | |
| # fuse_reshape_1_compute_: copy a fixed 12544-byte region with memcpy. | |
| # In: a0 = destination, a1 = source (both passed straight through to memcpy). | |
| # Out: a0 = whatever memcpy returns. | |
| fuse_reshape_1_compute_: # @fuse_reshape_1_compute_ | |
| # %bb.0: # %entry | |
| li a2, 12544 # byte count: (3 << 12) + 256 | |
| addi sp, sp, -16 # 16-byte frame to keep ra across the call | |
| sd ra, 8(sp) | |
| call memcpy | |
| ld ra, 8(sp) | |
| addi sp, sp, 16 | |
| ret | |
| .Lfunc_end17: | |
| .size fuse_reshape_1_compute_, .Lfunc_end17-fuse_reshape_1_compute_ | |
| # -- End function | |
| .globl fuse_matmul # -- Begin function fuse_matmul | |
| .p2align 2 | |
| .type fuse_matmul,@function | |
| # fuse_matmul: checking wrapper that validates its arguments and then calls | |
| # fuse_matmul_compute_. | |
| # In: a0 = pointer to an array of 8-byte slots (slots 0, 1, 2 are read as pointers), | |
| # a1 = pointer to an array of 32-bit words (words 0, 1, 2 are read), | |
| # a2 = count (only the low 32 bits are compared, and they must equal 3). | |
| # Out: a0 = 0 after the compute call. On any failed check the function pointer | |
| # stored at __TVMAPISetLastError is called with a message address in a0 and | |
| # the function returns a0 = (1 << 32) - 1. | |
| # NOTE(review): the field offsets read from the three objects look like a DLTensor | |
| # layout (data +0, device +8/+12, ndim +16, dtype +20..+22, shape +24, strides +32, | |
| # byte offset +40) -- confirm against the TVM/dlpack headers. | |
| fuse_matmul: # @fuse_matmul | |
| .cfi_startproc | |
| # %bb.0: # %entry | |
| addi sp, sp, -32 | |
| .cfi_def_cfa_offset 32 | |
| sd ra, 24(sp) | |
| sd s0, 16(sp) | |
| sd s1, 8(sp) | |
| .cfi_offset ra, -8 | |
| .cfi_offset s0, -16 | |
| .cfi_offset s1, -24 | |
| # Zero-extend the low 32 bits of a2 and require the result to be 3. | |
| slli a2, a2, 32 | |
| srli a2, a2, 32 | |
| addi a3, zero, 3 | |
| bne a2, a3, .LBB18_49 | |
| # %bb.1: # %assert_end | |
| # t6/t3/t2 = words 0, 1, 2 at a1; a5/a4/t5 = pointers from slots 0, 1, 2 at a0. | |
| # From the first object (a5): t1 = field +24, a1 = field +0, a0 = field +32. | |
| lwu t2, 8(a1) | |
| ld t5, 16(a0) | |
| lwu t3, 4(a1) | |
| ld a4, 8(a0) | |
| lwu t6, 0(a1) | |
| ld a5, 0(a0) | |
| ld t1, 24(a5) | |
| ld a1, 0(a5) | |
| ld a0, 32(a5) | |
| # A zero pointer at +32 skips the two element checks below. | |
| beqz a0, .LBB18_4 | |
| # %bb.2: # %if_then | |
| # a2 = 4096 - 960 = 3136. The elements at +0 and +8 must be 3136 and 1. | |
| lui a2, 1 | |
| addiw a2, a2, -960 | |
| lw s0, 0(a0) | |
| bne s0, a2, .LBB18_50 | |
| # %bb.3: # %if_then | |
| ld a0, 8(a0) | |
| slli a0, a0, 32 | |
| srli a0, a0, 32 | |
| addi a2, zero, 1 | |
| bne a0, a2, .LBB18_50 | |
| .LBB18_4: # %if_end | |
| # Second object (a4): t0 = field +24, a2 = field +0, a0 = field +32. | |
| # a6/t4 keep the words at +12/+8 of the first object for the later checks. | |
| ld t0, 24(a4) | |
| ld a2, 0(a4) | |
| lwu a6, 12(a5) | |
| lwu t4, 8(a5) | |
| ld a0, 32(a4) | |
| beqz a0, .LBB18_7 | |
| # %bb.5: # %if_then3 | |
| # When present, the elements at +0 and +8 must be 100 and 1. | |
| lw s0, 0(a0) | |
| addi a3, zero, 100 | |
| bne s0, a3, .LBB18_51 | |
| # %bb.6: # %if_then3 | |
| ld a0, 8(a0) | |
| slli a0, a0, 32 | |
| srli a0, a0, 32 | |
| addi a3, zero, 1 | |
| bne a0, a3, .LBB18_51 | |
| .LBB18_7: # %if_end4 | |
| # Third object (t5): a7 = field +24, a0 = field +0, s0 = field +32. | |
| ld a7, 24(t5) | |
| ld a0, 0(t5) | |
| ld s0, 32(t5) | |
| beqz s0, .LBB18_10 | |
| # %bb.8: # %if_then7 | |
| # When present, the elements at +0 and +8 must be 100 and 1. | |
| lw a3, 0(s0) | |
| addi s1, zero, 100 | |
| bne a3, s1, .LBB18_52 | |
| # %bb.9: # %if_then7 | |
| ld a3, 8(s0) | |
| slli a3, a3, 32 | |
| srli a3, a3, 32 | |
| addi s0, zero, 1 | |
| bne a3, s0, .LBB18_52 | |
| .LBB18_10: # %if_end8 | |
| # t6 must be <= 13 and (1 << t6) must hit the mask 0x2098 (bits 3, 4, 7, 13). | |
| # NOTE(review): presumably the set of accepted TVM argument type codes -- confirm. | |
| addi a3, zero, 13 | |
| bltu a3, t6, .LBB18_43 | |
| # %bb.11: # %if_end8 | |
| addi a3, zero, 1 | |
| sll a3, a3, t6 | |
| lui s1, 2 | |
| addiw s1, s1, 152 | |
| and a3, a3, s1 | |
| beqz a3, .LBB18_43 | |
| # %bb.12: # %assert_end12 | |
| # Same range and mask test for t3. | |
| addi a3, zero, 13 | |
| bltu a3, t3, .LBB18_44 | |
| # %bb.13: # %assert_end12 | |
| addi a3, zero, 1 | |
| sll a3, a3, t3 | |
| lui s1, 2 | |
| addiw s1, s1, 152 | |
| and a3, a3, s1 | |
| beqz a3, .LBB18_44 | |
| # %bb.14: # %assert_end14 | |
| # Same range and mask test for t2. | |
| addi a3, zero, 13 | |
| bltu a3, t2, .LBB18_45 | |
| # %bb.15: # %assert_end14 | |
| addi a3, zero, 1 | |
| sll s1, a3, t2 | |
| lui s0, 2 | |
| addiw s0, s0, 152 | |
| and s1, s1, s0 | |
| beqz s1, .LBB18_45 | |
| # %bb.16: # %assert_end16 | |
| # a3 still holds 1: the word at +8 of the first object (t4) must be 1. | |
| bne t4, a3, .LBB18_53 | |
| # %bb.17: # %assert_end18 | |
| # First object: word at +16 must be 2. | |
| lw a3, 16(a5) | |
| addi s1, zero, 2 | |
| bne a3, s1, .LBB18_54 | |
| # %bb.18: # %assert_end20 | |
| # First object: halfword +22 == 1, byte +21 == 32, byte +20 == 2. | |
| # s0 = 1 stays live into .LBB18_72, where it forms the return value. | |
| lhu a3, 22(a5) | |
| addi s0, zero, 1 | |
| bne a3, s0, .LBB18_55 | |
| # %bb.19: # %assert_end20 | |
| lbu a3, 21(a5) | |
| addi s1, zero, 32 | |
| bne a3, s1, .LBB18_55 | |
| # %bb.20: # %assert_end20 | |
| lbu a3, 20(a5) | |
| addi s1, zero, 2 | |
| bne a3, s1, .LBB18_55 | |
| # %bb.21: # %assert_end22 | |
| # Array at t1: 32-bit loads at +0 and +8 must give 1 and 3136. | |
| lw a3, 0(t1) | |
| addi s0, zero, 1 | |
| bne a3, s0, .LBB18_56 | |
| # %bb.22: # %assert_end24 | |
| lui a3, 1 | |
| addiw a3, a3, -960 | |
| lw s1, 8(t1) | |
| bne s1, a3, .LBB18_57 | |
| # %bb.23: # %assert_end26 | |
| # First object: doubleword at +40 must be zero. | |
| ld a3, 40(a5) | |
| bnez a3, .LBB18_58 | |
| # %bb.24: # %assert_end28 | |
| # Second object (a4): word at +16 must be 2. | |
| lw a3, 16(a4) | |
| addi a5, zero, 2 | |
| bne a3, a5, .LBB18_59 | |
| # %bb.25: # %assert_end30 | |
| # Second object: halfword +22 == 1, byte +21 == 32, byte +20 == 2. | |
| lhu a3, 22(a4) | |
| addi s0, zero, 1 | |
| bne a3, s0, .LBB18_60 | |
| # %bb.26: # %assert_end30 | |
| lbu a3, 21(a4) | |
| addi a5, zero, 32 | |
| bne a3, a5, .LBB18_60 | |
| # %bb.27: # %assert_end30 | |
| lbu a3, 20(a4) | |
| addi a5, zero, 2 | |
| bne a3, a5, .LBB18_60 | |
| # %bb.28: # %assert_end32 | |
| # Array at t0: 32-bit loads at +0 and +8 must give 3136 and 100. | |
| lui a3, 1 | |
| addiw a3, a3, -960 | |
| lw a5, 0(t0) | |
| bne a5, a3, .LBB18_61 | |
| # %bb.29: # %assert_end34 | |
| lw a3, 8(t0) | |
| addi a5, zero, 100 | |
| bne a3, a5, .LBB18_62 | |
| # %bb.30: # %assert_end36 | |
| # Second object: doubleword at +40 must be zero. | |
| ld a3, 40(a4) | |
| bnez a3, .LBB18_63 | |
| # %bb.31: # %assert_end38 | |
| # Second object: word at +8 must be 1. | |
| lw a3, 8(a4) | |
| addi s0, zero, 1 | |
| bne a3, s0, .LBB18_64 | |
| # %bb.32: # %assert_end40 | |
| # Word at +12 of the second object must equal the one saved from the first (a6). | |
| # a3 keeps the sign-extended a6 for the matching check on the third object. | |
| lw a4, 12(a4) | |
| sext.w a3, a6 | |
| bne a3, a4, .LBB18_65 | |
| # %bb.33: # %assert_end42 | |
| # Third object (t5): word at +16 must be 2. | |
| lw a4, 16(t5) | |
| addi a5, zero, 2 | |
| bne a4, a5, .LBB18_66 | |
| # %bb.34: # %assert_end44 | |
| # Third object: halfword +22 == 1, byte +21 == 32, byte +20 == 2. | |
| lhu a4, 22(t5) | |
| addi s0, zero, 1 | |
| bne a4, s0, .LBB18_67 | |
| # %bb.35: # %assert_end44 | |
| lbu a4, 21(t5) | |
| addi a5, zero, 32 | |
| bne a4, a5, .LBB18_67 | |
| # %bb.36: # %assert_end44 | |
| lbu a4, 20(t5) | |
| addi a5, zero, 2 | |
| bne a4, a5, .LBB18_67 | |
| # %bb.37: # %assert_end46 | |
| # Array at a7: 32-bit loads at +0 and +8 must give 1 and 100. | |
| lw a4, 0(a7) | |
| addi s0, zero, 1 | |
| bne a4, s0, .LBB18_68 | |
| # %bb.38: # %assert_end48 | |
| lw a4, 8(a7) | |
| addi a5, zero, 100 | |
| bne a4, a5, .LBB18_69 | |
| # %bb.39: # %assert_end50 | |
| # Third object: doubleword at +40 must be zero. | |
| ld a4, 40(t5) | |
| bnez a4, .LBB18_70 | |
| # %bb.40: # %assert_end52 | |
| # Third object: word at +8 must be 1. | |
| lw a4, 8(t5) | |
| addi s0, zero, 1 | |
| bne a4, s0, .LBB18_71 | |
| # %bb.41: # %assert_end54 | |
| # Word at +12 of the third object must equal a3 (sign-extended a6 from above). | |
| lw a4, 12(t5) | |
| bne a3, a4, .LBB18_73 | |
| # %bb.42: # %assert_end56 | |
| # All checks passed: a0/a1/a2 = field +0 of the third/first/second object. | |
| call fuse_matmul_compute_ | |
| mv a0, zero | |
| j .LBB18_48 | |
| # Failure blocks: each loads the function pointer stored at __TVMAPISetLastError | |
| # into a1 and a message address into a0, then joins .LBB18_46 or .LBB18_72. | |
| .LBB18_43: # %assert_fail11 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.120) | |
| addi a0, a0, %lo(.L.str.120) | |
| j .LBB18_46 | |
| .LBB18_44: # %assert_fail13 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.121) | |
| addi a0, a0, %lo(.L.str.121) | |
| j .LBB18_46 | |
| .LBB18_45: # %assert_fail15 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.122) | |
| addi a0, a0, %lo(.L.str.122) | |
| .LBB18_46: # %assert_fail | |
| # Shared failure tail: call the handler, then build a0 = (1 << 32) - 1. | |
| jalr a1 | |
| addi a0, zero, 1 | |
| slli a0, a0, 32 | |
| .LBB18_47: # %assert_fail21 | |
| addi a0, a0, -1 | |
| .LBB18_48: # %assert_fail21 | |
| # Common epilogue: restore s1/s0/ra, release the 32-byte frame, return a0. | |
| ld s1, 8(sp) | |
| ld s0, 16(sp) | |
| ld ra, 24(sp) | |
| .cfi_restore ra | |
| .cfi_restore s0 | |
| .cfi_restore s1 | |
| addi sp, sp, 32 | |
| .cfi_def_cfa_offset 0 | |
| ret | |
| .LBB18_49: # %assert_fail | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.116) | |
| addi a0, a0, %lo(.L.str.116) | |
| j .LBB18_46 | |
| .LBB18_50: # %assert_fail1 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.117) | |
| addi a0, a0, %lo(.L.str.117) | |
| j .LBB18_46 | |
| .LBB18_51: # %assert_fail5 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.118) | |
| addi a0, a0, %lo(.L.str.118) | |
| j .LBB18_46 | |
| .LBB18_52: # %assert_fail9 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.119) | |
| addi a0, a0, %lo(.L.str.119) | |
| j .LBB18_46 | |
| .LBB18_53: # %assert_fail17 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.5) | |
| addi a0, a0, %lo(.L.str.5) | |
| j .LBB18_46 | |
| .LBB18_54: # %assert_fail19 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.6) | |
| addi a0, a0, %lo(.L.str.6) | |
| j .LBB18_46 | |
| .LBB18_55: # %assert_fail21 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.7) | |
| addi a0, a0, %lo(.L.str.7) | |
| j .LBB18_72 | |
| .LBB18_56: # %assert_fail23 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.8) | |
| addi a0, a0, %lo(.L.str.8) | |
| j .LBB18_72 | |
| .LBB18_57: # %assert_fail25 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.123) | |
| addi a0, a0, %lo(.L.str.123) | |
| j .LBB18_46 | |
| .LBB18_58: # %assert_fail27 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.10) | |
| addi a0, a0, %lo(.L.str.10) | |
| j .LBB18_46 | |
| .LBB18_59: # %assert_fail29 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.114) | |
| addi a0, a0, %lo(.L.str.114) | |
| j .LBB18_46 | |
| .LBB18_60: # %assert_fail31 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.12) | |
| addi a0, a0, %lo(.L.str.12) | |
| j .LBB18_72 | |
| .LBB18_61: # %assert_fail33 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.124) | |
| addi a0, a0, %lo(.L.str.124) | |
| j .LBB18_46 | |
| .LBB18_62: # %assert_fail35 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.125) | |
| addi a0, a0, %lo(.L.str.125) | |
| j .LBB18_46 | |
| .LBB18_63: # %assert_fail37 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.17) | |
| addi a0, a0, %lo(.L.str.17) | |
| j .LBB18_46 | |
| .LBB18_64: # %assert_fail39 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.18) | |
| addi a0, a0, %lo(.L.str.18) | |
| j .LBB18_72 | |
| .LBB18_65: # %assert_fail41 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.19) | |
| addi a0, a0, %lo(.L.str.19) | |
| j .LBB18_46 | |
| .LBB18_66: # %assert_fail43 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.126) | |
| addi a0, a0, %lo(.L.str.126) | |
| j .LBB18_46 | |
| .LBB18_67: # %assert_fail45 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.37) | |
| addi a0, a0, %lo(.L.str.37) | |
| j .LBB18_72 | |
| .LBB18_68: # %assert_fail47 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.127) | |
| addi a0, a0, %lo(.L.str.127) | |
| j .LBB18_72 | |
| .LBB18_69: # %assert_fail49 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.128) | |
| addi a0, a0, %lo(.L.str.128) | |
| j .LBB18_46 | |
| .LBB18_70: # %assert_fail51 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.39) | |
| addi a0, a0, %lo(.L.str.39) | |
| j .LBB18_46 | |
| .LBB18_71: # %assert_fail53 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.40) | |
| addi a0, a0, %lo(.L.str.40) | |
| .LBB18_72: # %assert_fail21 | |
| # Alternate failure tail: every branch that reaches it set s0 = 1 beforehand, so | |
| # s0 << 32 followed by the -1 at .LBB18_47 yields the same (1 << 32) - 1 result. | |
| jalr a1 | |
| slli a0, s0, 32 | |
| j .LBB18_47 | |
| .LBB18_73: # %assert_fail55 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.41) | |
| addi a0, a0, %lo(.L.str.41) | |
| j .LBB18_46 | |
| .Lfunc_end18: | |
| .size fuse_matmul, .Lfunc_end18-fuse_matmul | |
| .cfi_endproc | |
| # -- End function | |
| .section .sdata,"aw",@progbits | |
| .p2align 2 # -- Begin function fuse_matmul_compute_ | |
| .LCPI19_0: | |
| .word 0 # float 0 | |
| .text | |
| .globl fuse_matmul_compute_ | |
| .p2align 2 | |
| .type fuse_matmul_compute_,@function | |
| # fuse_matmul_compute_: for each of 25 consecutive 16-byte groups g at a0, clear the | |
| # group and then accumulate over k = 0..3135: | |
| # group[g] += splat(word at a1 + 4*k) * vector at (a2 + 16*g + 400*k) | |
| # In: a0 = output base, a1 = base of 3136 scalar words, a2 = base of the matrix | |
| # operand (rows 400 bytes apart). | |
| # Out: nothing meaningful in registers; leaf routine, no stack frame. | |
| # Clobbers a2-a7, t0-t4, ft0, v0-v3 and the vector length/type state. | |
| # The vector configuration is established at entry so that the zero splat and | |
| # the first accumulator clear no longer depend on whatever vl/vtype the caller | |
| # happened to leave behind. | |
| # NOTE(review): the vtype operand 8 presumably selects 32-bit elements in this | |
| # draft vector ISA, giving 4 lanes per 16-byte group -- confirm against the spec | |
| # the toolchain implements. | |
| fuse_matmul_compute_: # @fuse_matmul_compute_ | |
| # %bb.0: # %entry | |
| addi t1, zero, 8 # vtype operand reused by every vsetvl below | |
| addi t2, zero, 4 # requested vector length | |
| vsetvl a4, t2, t1 # configure vl/vtype before the first vector op | |
| lui a3, %hi(.LCPI19_0) | |
| addi a3, a3, %lo(.LCPI19_0) | |
| flw ft0, 0(a3) | |
| fmv.x.w a3, ft0 | |
| # v0 = all-zero vector used to clear each output group. | |
| vmv.v.x v0, a3 | |
| vslide1up.vx v1, v0, a3 | |
| vslide1up.vx v0, v1, a3 | |
| vslide1up.vx v1, v0, a3 | |
| vslide1up.vx v0, v1, a3 | |
| lui a3, 1 | |
| addiw a7, a3, -960 # a7 = 3136, inner trip count | |
| addi a6, zero, 25 # number of 16-byte output groups | |
| mv t0, zero # g | |
| .LBB19_1: # %for_body | |
| # =>This Loop Header: Depth=1 | |
| # Child Loop BB19_2 Depth 2 | |
| slli a3, t0, 4 | |
| add t3, a0, a3 # t3 = address of output group g | |
| vse.v v0, ( t3 ) # clear the accumulator in memory | |
| mv t4, a1 # scalar operand cursor | |
| mv a5, a2 # matrix operand cursor for this group | |
| mv a3, a7 # remaining k iterations | |
| .LBB19_2: # %for_body2 | |
| # Parent Loop BB19_1 Depth=1 | |
| # => This Inner Loop Header: Depth=2 | |
| flw ft0, 0(t4) | |
| vsetvl a4, t2, t1 | |
| vle.v v1, ( a5 ) | |
| vsetvl a4, t2, t1 | |
| fmv.x.w a4, ft0 | |
| # v2 = scalar broadcast to every lane. | |
| vmv.v.x v2, a4 | |
| vslide1up.vx v3, v2, a4 | |
| vslide1up.vx v2, v3, a4 | |
| vslide1up.vx v3, v2, a4 | |
| vslide1up.vx v2, v3, a4 | |
| vfmul.vv v1, v2, v1 | |
| vle.v v2, ( t3 ) | |
| vfadd.vv v1, v1, v2 | |
| vse.v v1, ( t3 ) | |
| addi t4, t4, 4 | |
| addi a5, a5, 400 | |
| addi a3, a3, -1 | |
| bnez a3, .LBB19_2 | |
| # %bb.3: # %for_end3 | |
| # in Loop: Header=BB19_1 Depth=1 | |
| addi a2, a2, 16 | |
| addi t0, t0, 1 | |
| bne t0, a6, .LBB19_1 | |
| # %bb.4: # %for_end | |
| ret | |
| .Lfunc_end19: | |
| .size fuse_matmul_compute_, .Lfunc_end19-fuse_matmul_compute_ | |
| # -- End function | |
| # ---------------------------------------------------------------------- | |
| # fuse_elemwise_add -- argument-checking wrapper around fuse_elemwise_add_compute_. | |
| # In: a0 = array of three 8-byte pointers (one descriptor per argument) | |
| # a1 = array of three 32-bit codes (one per argument) | |
| # a2 = argument count (only the low 32 bits are examined; must be 3) | |
| # Out: a0 = 0 on success; on a failed check, the function pointer stored at | |
| # __TVMAPISetLastError is called with a message string and a0 = (1 << 32) - 1. | |
| # Frame: 32 bytes; saves ra, s0, s1. | |
| # NOTE(review): presumably the TVM packed-function signature (args, type_codes, num_args) | |
| # with DLTensor descriptors (data@0, device@8/12, ndim@16, dtype@20..23, shape@24, | |
| # strides@32, byte_offset@40) -- confirm against the TVM / DLPack headers. | |
| # ---------------------------------------------------------------------- | |
| .globl fuse_elemwise_add # -- Begin function fuse_elemwise_add | |
| .p2align 2 | |
| .type fuse_elemwise_add,@function | |
| fuse_elemwise_add: # @fuse_elemwise_add | |
| .cfi_startproc | |
| # %bb.0: # %entry | |
| addi sp, sp, -32 | |
| .cfi_def_cfa_offset 32 | |
| sd ra, 24(sp) | |
| sd s0, 16(sp) | |
| sd s1, 8(sp) | |
| .cfi_offset ra, -8 | |
| .cfi_offset s0, -16 | |
| .cfi_offset s1, -24 | |
| # Zero-extend the low 32 bits of a2 and require the argument count to be 3. | |
| slli a2, a2, 32 | |
| srli a2, a2, 32 | |
| addi a3, zero, 3 | |
| bne a2, a3, .LBB20_43 | |
| # %bb.1: # %assert_end | |
| # Codes: a3 = code[0], t3 = code[1], t2 = code[2]. | |
| # Descriptors: a5 = arg0, a4 = arg1, t5 = arg2. | |
| # From arg0: t1 = pointer at +24, a1 = pointer at +0 (second argument of the compute call). | |
| lwu t2, 8(a1) | |
| ld t5, 16(a0) | |
| lwu t3, 4(a1) | |
| ld a4, 8(a0) | |
| lwu a3, 0(a1) | |
| ld a5, 0(a0) | |
| ld t1, 24(a5) | |
| ld a1, 0(a5) | |
| # If arg0's pointer at +32 is non-null, its first 32-bit word must be 1. | |
| ld a0, 32(a5) | |
| beqz a0, .LBB20_3 | |
| # %bb.2: # %if_then | |
| lw a0, 0(a0) | |
| addi s0, zero, 1 | |
| bne a0, s0, .LBB20_44 | |
| .LBB20_3: # %if_end | |
| # From arg1: t0 = pointer at +24, a2 = pointer at +0 (third argument of the compute call). | |
| # From arg0: a7 = 32-bit field at +12, t4 = 32-bit field at +8. | |
| ld t0, 24(a4) | |
| ld a2, 0(a4) | |
| lwu a7, 12(a5) | |
| lwu t4, 8(a5) | |
| # Same optional check on arg1's pointer at +32. | |
| ld a0, 32(a4) | |
| beqz a0, .LBB20_5 | |
| # %bb.4: # %if_then3 | |
| lw a0, 0(a0) | |
| addi s0, zero, 1 | |
| bne a0, s0, .LBB20_45 | |
| .LBB20_5: # %if_end4 | |
| # From arg2: a6 = pointer at +24, a0 = pointer at +0 (first argument of the compute call). | |
| ld a6, 24(t5) | |
| ld a0, 0(t5) | |
| # Same optional check on arg2's pointer at +32. | |
| ld s0, 32(t5) | |
| beqz s0, .LBB20_7 | |
| # %bb.6: # %if_then7 | |
| lw s0, 0(s0) | |
| addi s1, zero, 1 | |
| bne s0, s1, .LBB20_46 | |
| .LBB20_7: # %if_end8 | |
| # code[0] must be <= 13 and one of {3, 4, 7, 13}: | |
| # the mask (2 << 12) + 152 = 0x2098 has exactly bits 3, 4, 7 and 13 set. | |
| addi s1, zero, 13 | |
| bltu s1, a3, .LBB20_37 | |
| # %bb.8: # %if_end8 | |
| addi s1, zero, 1 | |
| sll a3, s1, a3 | |
| lui s1, 2 | |
| addiw s1, s1, 152 | |
| and a3, a3, s1 | |
| beqz a3, .LBB20_37 | |
| # %bb.9: # %assert_end12 | |
| # Same membership test for code[1]. | |
| addi a3, zero, 13 | |
| bltu a3, t3, .LBB20_38 | |
| # %bb.10: # %assert_end12 | |
| addi a3, zero, 1 | |
| sll a3, a3, t3 | |
| lui s1, 2 | |
| addiw s1, s1, 152 | |
| and a3, a3, s1 | |
| beqz a3, .LBB20_38 | |
| # %bb.11: # %assert_end14 | |
| # Same membership test for code[2]; a3 is left holding 1 for the next compare. | |
| addi a3, zero, 13 | |
| bltu a3, t2, .LBB20_39 | |
| # %bb.12: # %assert_end14 | |
| addi a3, zero, 1 | |
| sll s1, a3, t2 | |
| lui s0, 2 | |
| addiw s0, s0, 152 | |
| and s1, s1, s0 | |
| beqz s1, .LBB20_39 | |
| # %bb.13: # %assert_end16 | |
| # ---- arg0 checks: field@8 == 1, field@16 == 1, u16@22 == 1, u8@21 == 32, u8@20 == 2, | |
| # first word behind the pointer at +24 == 100, and the 64-bit field@40 == 0. | |
| bne t4, a3, .LBB20_47 | |
| # %bb.14: # %assert_end18 | |
| lw a3, 16(a5) | |
| addi s0, zero, 1 | |
| bne a3, s0, .LBB20_48 | |
| # %bb.15: # %assert_end20 | |
| lhu a3, 22(a5) | |
| bne a3, s0, .LBB20_49 | |
| # %bb.16: # %assert_end20 | |
| lbu a3, 21(a5) | |
| addi s1, zero, 32 | |
| bne a3, s1, .LBB20_49 | |
| # %bb.17: # %assert_end20 | |
| lbu a3, 20(a5) | |
| addi s1, zero, 2 | |
| bne a3, s1, .LBB20_49 | |
| # %bb.18: # %assert_end22 | |
| lw a3, 0(t1) | |
| addi s1, zero, 100 | |
| bne a3, s1, .LBB20_50 | |
| # %bb.19: # %assert_end24 | |
| ld a3, 40(a5) | |
| bnez a3, .LBB20_51 | |
| # %bb.20: # %assert_end26 | |
| # ---- arg1 checks: same field tests as arg0, plus field@8 == 1 and | |
| # field@12 equal to arg0's field@12 (sign-extended copy kept in a3). | |
| lw a3, 16(a4) | |
| addi s0, zero, 1 | |
| bne a3, s0, .LBB20_52 | |
| # %bb.21: # %assert_end28 | |
| lhu a3, 22(a4) | |
| bne a3, s0, .LBB20_53 | |
| # %bb.22: # %assert_end28 | |
| lbu a3, 21(a4) | |
| addi a5, zero, 32 | |
| bne a3, a5, .LBB20_53 | |
| # %bb.23: # %assert_end28 | |
| lbu a3, 20(a4) | |
| addi a5, zero, 2 | |
| bne a3, a5, .LBB20_53 | |
| # %bb.24: # %assert_end30 | |
| lw a3, 0(t0) | |
| addi a5, zero, 100 | |
| bne a3, a5, .LBB20_54 | |
| # %bb.25: # %assert_end32 | |
| ld a3, 40(a4) | |
| bnez a3, .LBB20_55 | |
| # %bb.26: # %assert_end34 | |
| lw a3, 8(a4) | |
| addi s0, zero, 1 | |
| bne a3, s0, .LBB20_56 | |
| # %bb.27: # %assert_end36 | |
| lw a4, 12(a4) | |
| sext.w a3, a7 | |
| bne a3, a4, .LBB20_57 | |
| # %bb.28: # %assert_end38 | |
| # ---- arg2 checks: same set of field tests; a3 still holds arg0's field@12. | |
| lw a4, 16(t5) | |
| addi s0, zero, 1 | |
| bne a4, s0, .LBB20_58 | |
| # %bb.29: # %assert_end40 | |
| lhu a4, 22(t5) | |
| bne a4, s0, .LBB20_59 | |
| # %bb.30: # %assert_end40 | |
| lbu a4, 21(t5) | |
| addi a5, zero, 32 | |
| bne a4, a5, .LBB20_59 | |
| # %bb.31: # %assert_end40 | |
| lbu a4, 20(t5) | |
| addi a5, zero, 2 | |
| bne a4, a5, .LBB20_59 | |
| # %bb.32: # %assert_end42 | |
| lw a4, 0(a6) | |
| addi a5, zero, 100 | |
| bne a4, a5, .LBB20_60 | |
| # %bb.33: # %assert_end44 | |
| ld a4, 40(t5) | |
| bnez a4, .LBB20_61 | |
| # %bb.34: # %assert_end46 | |
| lw a4, 8(t5) | |
| addi s0, zero, 1 | |
| bne a4, s0, .LBB20_62 | |
| # %bb.35: # %assert_end48 | |
| lw a4, 12(t5) | |
| bne a3, a4, .LBB20_64 | |
| # %bb.36: # %assert_end50 | |
| # All checks passed: a0 = arg2 data, a1 = arg0 data, a2 = arg1 data; return 0 afterwards. | |
| call fuse_elemwise_add_compute_ | |
| mv a0, zero | |
| j .LBB20_42 | |
| # ---- Failure stubs. Each loads the function pointer stored at __TVMAPISetLastError | |
| # into a1 and the address of its message string into a0, then joins a shared tail. | |
| .LBB20_37: # %assert_fail11 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.130) | |
| addi a0, a0, %lo(.L.str.130) | |
| j .LBB20_40 | |
| .LBB20_38: # %assert_fail13 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.131) | |
| addi a0, a0, %lo(.L.str.131) | |
| j .LBB20_40 | |
| .LBB20_39: # %assert_fail15 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.132) | |
| addi a0, a0, %lo(.L.str.132) | |
| .LBB20_40: # %assert_fail | |
| # Shared tail 1: report the error, then a0 = (1 << 32) - 1 = 0xFFFFFFFF. | |
| jalr a1 | |
| addi a0, zero, 1 | |
| slli a0, a0, 32 | |
| .LBB20_41: # %assert_fail1 | |
| addi a0, a0, -1 | |
| .LBB20_42: # %assert_fail1 | |
| # Common epilogue for success and failure: restore s1, s0, ra and pop the frame. | |
| ld s1, 8(sp) | |
| ld s0, 16(sp) | |
| ld ra, 24(sp) | |
| .cfi_restore ra | |
| .cfi_restore s0 | |
| .cfi_restore s1 | |
| addi sp, sp, 32 | |
| .cfi_def_cfa_offset 0 | |
| ret | |
| .LBB20_43: # %assert_fail | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.129) | |
| addi a0, a0, %lo(.L.str.129) | |
| j .LBB20_40 | |
| .LBB20_44: # %assert_fail1 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.52) | |
| addi a0, a0, %lo(.L.str.52) | |
| j .LBB20_63 | |
| .LBB20_45: # %assert_fail5 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.53) | |
| addi a0, a0, %lo(.L.str.53) | |
| j .LBB20_63 | |
| .LBB20_46: # %assert_fail9 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.23) | |
| addi a0, a0, %lo(.L.str.23) | |
| # Private tail: s1 still holds the 1 set just before the branch here (s1 is callee-saved), | |
| # so a0 = 1 << 32 and .LBB20_41 subtracts 1. | |
| jalr a1 | |
| slli a0, s1, 32 | |
| j .LBB20_41 | |
| .LBB20_47: # %assert_fail17 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.5) | |
| addi a0, a0, %lo(.L.str.5) | |
| j .LBB20_40 | |
| .LBB20_48: # %assert_fail19 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.56) | |
| addi a0, a0, %lo(.L.str.56) | |
| j .LBB20_63 | |
| .LBB20_49: # %assert_fail21 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.7) | |
| addi a0, a0, %lo(.L.str.7) | |
| j .LBB20_40 | |
| .LBB20_50: # %assert_fail23 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.133) | |
| addi a0, a0, %lo(.L.str.133) | |
| j .LBB20_40 | |
| .LBB20_51: # %assert_fail25 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.10) | |
| addi a0, a0, %lo(.L.str.10) | |
| j .LBB20_40 | |
| .LBB20_52: # %assert_fail27 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.58) | |
| addi a0, a0, %lo(.L.str.58) | |
| j .LBB20_63 | |
| .LBB20_53: # %assert_fail29 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.12) | |
| addi a0, a0, %lo(.L.str.12) | |
| j .LBB20_40 | |
| .LBB20_54: # %assert_fail31 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.134) | |
| addi a0, a0, %lo(.L.str.134) | |
| j .LBB20_40 | |
| .LBB20_55: # %assert_fail33 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.17) | |
| addi a0, a0, %lo(.L.str.17) | |
| j .LBB20_40 | |
| .LBB20_56: # %assert_fail35 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.18) | |
| addi a0, a0, %lo(.L.str.18) | |
| j .LBB20_63 | |
| .LBB20_57: # %assert_fail37 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.19) | |
| addi a0, a0, %lo(.L.str.19) | |
| j .LBB20_40 | |
| .LBB20_58: # %assert_fail39 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.36) | |
| addi a0, a0, %lo(.L.str.36) | |
| j .LBB20_63 | |
| .LBB20_59: # %assert_fail41 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.37) | |
| addi a0, a0, %lo(.L.str.37) | |
| j .LBB20_40 | |
| .LBB20_60: # %assert_fail43 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.135) | |
| addi a0, a0, %lo(.L.str.135) | |
| j .LBB20_40 | |
| .LBB20_61: # %assert_fail45 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.39) | |
| addi a0, a0, %lo(.L.str.39) | |
| j .LBB20_40 | |
| .LBB20_62: # %assert_fail47 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.40) | |
| addi a0, a0, %lo(.L.str.40) | |
| .LBB20_63: # %assert_fail1 | |
| # Shared tail 2: every branch that ends up here set s0 = 1 beforehand, so after the call | |
| # a0 = 1 << 32 and .LBB20_41 turns it into (1 << 32) - 1. | |
| jalr a1 | |
| slli a0, s0, 32 | |
| j .LBB20_41 | |
| .LBB20_64: # %assert_fail49 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.41) | |
| addi a0, a0, %lo(.L.str.41) | |
| j .LBB20_40 | |
| .Lfunc_end20: | |
| .size fuse_elemwise_add, .Lfunc_end20-fuse_elemwise_add | |
| .cfi_endproc | |
| # -- End function | |
| # ---------------------------------------------------------------------- | |
| # fuse_elemwise_add_compute_ -- fully unrolled vector add, leaf routine (no stack frame). | |
| # In: a0 = destination base, a1 and a2 = the two source bases. | |
| # For each of the 25 byte offsets 0, 16, ..., 384: | |
| # v0 = load(a2 + off); v1 = load(a1 + off); store(a0 + off, v0 + v1) | |
| # Uses: a3 (= 8) and a4 (= 4) as the vsetvl operands, a5 as scratch for both the vsetvl | |
| # result and the chunk address, v0/v1 as data registers. | |
| # The final chunk (offset 384) advances a2, a1 and a0 in place instead of going through a5. | |
| # NOTE(review): presumably each vector op covers 4 x f32 (16 bytes), i.e. 100 floats in | |
| # total -- confirm against the vector-extension spec. | |
| # ---------------------------------------------------------------------- | |
| .globl fuse_elemwise_add_compute_ # -- Begin function fuse_elemwise_add_compute_ | |
| .p2align 2 | |
| .type fuse_elemwise_add_compute_,@function | |
| fuse_elemwise_add_compute_: # @fuse_elemwise_add_compute_ | |
| # %bb.0: # %entry | |
| addi a3, zero, 8 | |
| addi a4, zero, 4 | |
| # Chunk at offset 0: the bases are used directly. | |
| vsetvl a5, a4, a3 | |
| vle.v v0, ( a2 ) | |
| vsetvl a5, a4, a3 | |
| vle.v v1, ( a1 ) | |
| vfadd.vv v0, v0, v1 | |
| vse.v v0, ( a0 ) | |
| # Chunks at offsets 16..368: identical pattern, address formed in a5 each time. | |
| vsetvl a5, a4, a3 | |
| addi a5, a2, 16 | |
| vle.v v0, ( a5 ) | |
| vsetvl a5, a4, a3 | |
| addi a5, a1, 16 | |
| vle.v v1, ( a5 ) | |
| vfadd.vv v0, v0, v1 | |
| addi a5, a0, 16 | |
| vse.v v0, ( a5 ) | |
| vsetvl a5, a4, a3 | |
| addi a5, a2, 32 | |
| vle.v v0, ( a5 ) | |
| vsetvl a5, a4, a3 | |
| addi a5, a1, 32 | |
| vle.v v1, ( a5 ) | |
| vfadd.vv v0, v0, v1 | |
| addi a5, a0, 32 | |
| vse.v v0, ( a5 ) | |
| vsetvl a5, a4, a3 | |
| addi a5, a2, 48 | |
| vle.v v0, ( a5 ) | |
| vsetvl a5, a4, a3 | |
| addi a5, a1, 48 | |
| vle.v v1, ( a5 ) | |
| vfadd.vv v0, v0, v1 | |
| addi a5, a0, 48 | |
| vse.v v0, ( a5 ) | |
| vsetvl a5, a4, a3 | |
| addi a5, a2, 64 | |
| vle.v v0, ( a5 ) | |
| vsetvl a5, a4, a3 | |
| addi a5, a1, 64 | |
| vle.v v1, ( a5 ) | |
| vfadd.vv v0, v0, v1 | |
| addi a5, a0, 64 | |
| vse.v v0, ( a5 ) | |
| vsetvl a5, a4, a3 | |
| addi a5, a2, 80 | |
| vle.v v0, ( a5 ) | |
| vsetvl a5, a4, a3 | |
| addi a5, a1, 80 | |
| vle.v v1, ( a5 ) | |
| vfadd.vv v0, v0, v1 | |
| addi a5, a0, 80 | |
| vse.v v0, ( a5 ) | |
| vsetvl a5, a4, a3 | |
| addi a5, a2, 96 | |
| vle.v v0, ( a5 ) | |
| vsetvl a5, a4, a3 | |
| addi a5, a1, 96 | |
| vle.v v1, ( a5 ) | |
| vfadd.vv v0, v0, v1 | |
| addi a5, a0, 96 | |
| vse.v v0, ( a5 ) | |
| vsetvl a5, a4, a3 | |
| addi a5, a2, 112 | |
| vle.v v0, ( a5 ) | |
| vsetvl a5, a4, a3 | |
| addi a5, a1, 112 | |
| vle.v v1, ( a5 ) | |
| vfadd.vv v0, v0, v1 | |
| addi a5, a0, 112 | |
| vse.v v0, ( a5 ) | |
| vsetvl a5, a4, a3 | |
| addi a5, a2, 128 | |
| vle.v v0, ( a5 ) | |
| vsetvl a5, a4, a3 | |
| addi a5, a1, 128 | |
| vle.v v1, ( a5 ) | |
| vfadd.vv v0, v0, v1 | |
| addi a5, a0, 128 | |
| vse.v v0, ( a5 ) | |
| vsetvl a5, a4, a3 | |
| addi a5, a2, 144 | |
| vle.v v0, ( a5 ) | |
| vsetvl a5, a4, a3 | |
| addi a5, a1, 144 | |
| vle.v v1, ( a5 ) | |
| vfadd.vv v0, v0, v1 | |
| addi a5, a0, 144 | |
| vse.v v0, ( a5 ) | |
| vsetvl a5, a4, a3 | |
| addi a5, a2, 160 | |
| vle.v v0, ( a5 ) | |
| vsetvl a5, a4, a3 | |
| addi a5, a1, 160 | |
| vle.v v1, ( a5 ) | |
| vfadd.vv v0, v0, v1 | |
| addi a5, a0, 160 | |
| vse.v v0, ( a5 ) | |
| vsetvl a5, a4, a3 | |
| addi a5, a2, 176 | |
| vle.v v0, ( a5 ) | |
| vsetvl a5, a4, a3 | |
| addi a5, a1, 176 | |
| vle.v v1, ( a5 ) | |
| vfadd.vv v0, v0, v1 | |
| addi a5, a0, 176 | |
| vse.v v0, ( a5 ) | |
| vsetvl a5, a4, a3 | |
| addi a5, a2, 192 | |
| vle.v v0, ( a5 ) | |
| vsetvl a5, a4, a3 | |
| addi a5, a1, 192 | |
| vle.v v1, ( a5 ) | |
| vfadd.vv v0, v0, v1 | |
| addi a5, a0, 192 | |
| vse.v v0, ( a5 ) | |
| vsetvl a5, a4, a3 | |
| addi a5, a2, 208 | |
| vle.v v0, ( a5 ) | |
| vsetvl a5, a4, a3 | |
| addi a5, a1, 208 | |
| vle.v v1, ( a5 ) | |
| vfadd.vv v0, v0, v1 | |
| addi a5, a0, 208 | |
| vse.v v0, ( a5 ) | |
| vsetvl a5, a4, a3 | |
| addi a5, a2, 224 | |
| vle.v v0, ( a5 ) | |
| vsetvl a5, a4, a3 | |
| addi a5, a1, 224 | |
| vle.v v1, ( a5 ) | |
| vfadd.vv v0, v0, v1 | |
| addi a5, a0, 224 | |
| vse.v v0, ( a5 ) | |
| vsetvl a5, a4, a3 | |
| addi a5, a2, 240 | |
| vle.v v0, ( a5 ) | |
| vsetvl a5, a4, a3 | |
| addi a5, a1, 240 | |
| vle.v v1, ( a5 ) | |
| vfadd.vv v0, v0, v1 | |
| addi a5, a0, 240 | |
| vse.v v0, ( a5 ) | |
| vsetvl a5, a4, a3 | |
| addi a5, a2, 256 | |
| vle.v v0, ( a5 ) | |
| vsetvl a5, a4, a3 | |
| addi a5, a1, 256 | |
| vle.v v1, ( a5 ) | |
| vfadd.vv v0, v0, v1 | |
| addi a5, a0, 256 | |
| vse.v v0, ( a5 ) | |
| vsetvl a5, a4, a3 | |
| addi a5, a2, 272 | |
| vle.v v0, ( a5 ) | |
| vsetvl a5, a4, a3 | |
| addi a5, a1, 272 | |
| vle.v v1, ( a5 ) | |
| vfadd.vv v0, v0, v1 | |
| addi a5, a0, 272 | |
| vse.v v0, ( a5 ) | |
| vsetvl a5, a4, a3 | |
| addi a5, a2, 288 | |
| vle.v v0, ( a5 ) | |
| vsetvl a5, a4, a3 | |
| addi a5, a1, 288 | |
| vle.v v1, ( a5 ) | |
| vfadd.vv v0, v0, v1 | |
| addi a5, a0, 288 | |
| vse.v v0, ( a5 ) | |
| vsetvl a5, a4, a3 | |
| addi a5, a2, 304 | |
| vle.v v0, ( a5 ) | |
| vsetvl a5, a4, a3 | |
| addi a5, a1, 304 | |
| vle.v v1, ( a5 ) | |
| vfadd.vv v0, v0, v1 | |
| addi a5, a0, 304 | |
| vse.v v0, ( a5 ) | |
| vsetvl a5, a4, a3 | |
| addi a5, a2, 320 | |
| vle.v v0, ( a5 ) | |
| vsetvl a5, a4, a3 | |
| addi a5, a1, 320 | |
| vle.v v1, ( a5 ) | |
| vfadd.vv v0, v0, v1 | |
| addi a5, a0, 320 | |
| vse.v v0, ( a5 ) | |
| vsetvl a5, a4, a3 | |
| addi a5, a2, 336 | |
| vle.v v0, ( a5 ) | |
| vsetvl a5, a4, a3 | |
| addi a5, a1, 336 | |
| vle.v v1, ( a5 ) | |
| vfadd.vv v0, v0, v1 | |
| addi a5, a0, 336 | |
| vse.v v0, ( a5 ) | |
| vsetvl a5, a4, a3 | |
| addi a5, a2, 352 | |
| vle.v v0, ( a5 ) | |
| vsetvl a5, a4, a3 | |
| addi a5, a1, 352 | |
| vle.v v1, ( a5 ) | |
| vfadd.vv v0, v0, v1 | |
| addi a5, a0, 352 | |
| vse.v v0, ( a5 ) | |
| vsetvl a5, a4, a3 | |
| addi a5, a2, 368 | |
| vle.v v0, ( a5 ) | |
| vsetvl a5, a4, a3 | |
| addi a5, a1, 368 | |
| vle.v v1, ( a5 ) | |
| vfadd.vv v0, v0, v1 | |
| addi a5, a0, 368 | |
| vse.v v0, ( a5 ) | |
| # Last chunk (offset 384): the argument registers are dead afterwards, so they are | |
| # advanced in place; a2 is also reused as the (ignored) vsetvl result register. | |
| addi a2, a2, 384 | |
| vsetvl a5, a4, a3 | |
| vle.v v0, ( a2 ) | |
| vsetvl a2, a4, a3 | |
| addi a1, a1, 384 | |
| vle.v v1, ( a1 ) | |
| vfadd.vv v0, v0, v1 | |
| addi a0, a0, 384 | |
| vse.v v0, ( a0 ) | |
| ret | |
| .Lfunc_end21: | |
| .size fuse_elemwise_add_compute_, .Lfunc_end21-fuse_elemwise_add_compute_ | |
| # -- End function | |
| # ---------------------------------------------------------------------- | |
| # fuse_sigmoid -- argument-checking wrapper around fuse_sigmoid_compute_. | |
| # In: a0 = array of two 8-byte pointers (one descriptor per argument) | |
| # a1 = array of two 32-bit codes (one per argument) | |
| # a2 = argument count (only the low 32 bits are examined; must be 2) | |
| # Out: a0 = 0 on success; on a failed check, the function pointer stored at | |
| # __TVMAPISetLastError is called with a message string and a0 = (1 << 32) - 1. | |
| # Frame: 32 bytes; saves ra, s0, s1. | |
| # NOTE(review): presumably the TVM packed-function signature (args, type_codes, num_args) | |
| # with DLTensor descriptors (data@0, device@8/12, ndim@16, dtype@20..23, shape@24, | |
| # strides@32, byte_offset@40) -- confirm against the TVM / DLPack headers. | |
| # ---------------------------------------------------------------------- | |
| .globl fuse_sigmoid # -- Begin function fuse_sigmoid | |
| .p2align 2 | |
| .type fuse_sigmoid,@function | |
| fuse_sigmoid: # @fuse_sigmoid | |
| .cfi_startproc | |
| # %bb.0: # %entry | |
| addi sp, sp, -32 | |
| .cfi_def_cfa_offset 32 | |
| sd ra, 24(sp) | |
| sd s0, 16(sp) | |
| sd s1, 8(sp) | |
| .cfi_offset ra, -8 | |
| .cfi_offset s0, -16 | |
| .cfi_offset s1, -24 | |
| # Zero-extend the low 32 bits of a2 and require the argument count to be 2. | |
| slli a2, a2, 32 | |
| srli a2, a2, 32 | |
| addi a3, zero, 2 | |
| bne a2, a3, .LBB22_30 | |
| # %bb.1: # %assert_end | |
| # Codes: a3 = code[0], a4 = code[1]. Descriptors: a5 = arg0, a2 = arg1. | |
| # From arg0: t0 = pointer at +24, a1 = pointer at +0 (second argument of the compute call). | |
| lwu a4, 4(a1) | |
| ld a2, 8(a0) | |
| lwu a3, 0(a1) | |
| ld a5, 0(a0) | |
| ld t0, 24(a5) | |
| ld a1, 0(a5) | |
| # If arg0's pointer at +32 is non-null, its first 32-bit word must be 1. | |
| ld a0, 32(a5) | |
| beqz a0, .LBB22_3 | |
| # %bb.2: # %if_then | |
| lw a0, 0(a0) | |
| addi s0, zero, 1 | |
| bne a0, s0, .LBB22_31 | |
| .LBB22_3: # %if_end | |
| # From arg1: a7 = pointer at +24, a0 = pointer at +0 (first argument of the compute call). | |
| # From arg0: a6 = 32-bit field at +12, t1 = 32-bit field at +8. | |
| ld a7, 24(a2) | |
| ld a0, 0(a2) | |
| lwu a6, 12(a5) | |
| lwu t1, 8(a5) | |
| # Same optional check on arg1's pointer at +32. | |
| ld s0, 32(a2) | |
| beqz s0, .LBB22_5 | |
| # %bb.4: # %if_then3 | |
| lw s0, 0(s0) | |
| addi s1, zero, 1 | |
| bne s0, s1, .LBB22_32 | |
| .LBB22_5: # %if_end4 | |
| # code[0] must be <= 13 and one of {3, 4, 7, 13}: | |
| # the mask (2 << 12) + 152 = 0x2098 has exactly bits 3, 4, 7 and 13 set. | |
| addi s1, zero, 13 | |
| bltu s1, a3, .LBB22_25 | |
| # %bb.6: # %if_end4 | |
| addi s1, zero, 1 | |
| sll a3, s1, a3 | |
| lui s1, 2 | |
| addiw s1, s1, 152 | |
| and a3, a3, s1 | |
| beqz a3, .LBB22_25 | |
| # %bb.7: # %assert_end8 | |
| # Same membership test for code[1]; a3 is left holding 1 for the next compare. | |
| addi a3, zero, 13 | |
| bltu a3, a4, .LBB22_26 | |
| # %bb.8: # %assert_end8 | |
| addi a3, zero, 1 | |
| sll a4, a3, a4 | |
| lui s1, 2 | |
| addiw s1, s1, 152 | |
| and a4, a4, s1 | |
| beqz a4, .LBB22_26 | |
| # %bb.9: # %assert_end10 | |
| # ---- arg0 checks: field@8 == 1, field@16 == 1, u16@22 == 1, u8@21 == 32, u8@20 == 2, | |
| # first word behind the pointer at +24 == 100, and the 64-bit field@40 == 0. | |
| bne t1, a3, .LBB22_33 | |
| # %bb.10: # %assert_end12 | |
| lw a3, 16(a5) | |
| addi s0, zero, 1 | |
| bne a3, s0, .LBB22_34 | |
| # %bb.11: # %assert_end14 | |
| lhu a3, 22(a5) | |
| bne a3, s0, .LBB22_35 | |
| # %bb.12: # %assert_end14 | |
| lbu a3, 21(a5) | |
| addi a4, zero, 32 | |
| bne a3, a4, .LBB22_35 | |
| # %bb.13: # %assert_end14 | |
| lbu a3, 20(a5) | |
| addi a4, zero, 2 | |
| bne a3, a4, .LBB22_35 | |
| # %bb.14: # %assert_end16 | |
| lw a3, 0(t0) | |
| addi a4, zero, 100 | |
| bne a3, a4, .LBB22_36 | |
| # %bb.15: # %assert_end18 | |
| ld a3, 40(a5) | |
| bnez a3, .LBB22_37 | |
| # %bb.16: # %assert_end20 | |
| # ---- arg1 checks: same field tests, plus field@8 == 1 and field@12 equal to | |
| # arg0's field@12 (sign-extended from a6). | |
| lw a3, 16(a2) | |
| addi s0, zero, 1 | |
| bne a3, s0, .LBB22_38 | |
| # %bb.17: # %assert_end22 | |
| lhu a3, 22(a2) | |
| bne a3, s0, .LBB22_39 | |
| # %bb.18: # %assert_end22 | |
| lbu a3, 21(a2) | |
| addi a4, zero, 32 | |
| bne a3, a4, .LBB22_39 | |
| # %bb.19: # %assert_end22 | |
| lbu a3, 20(a2) | |
| addi a4, zero, 2 | |
| bne a3, a4, .LBB22_39 | |
| # %bb.20: # %assert_end24 | |
| lw a3, 0(a7) | |
| addi a4, zero, 100 | |
| bne a3, a4, .LBB22_40 | |
| # %bb.21: # %assert_end26 | |
| ld a3, 40(a2) | |
| bnez a3, .LBB22_41 | |
| # %bb.22: # %assert_end28 | |
| lw a3, 8(a2) | |
| addi s0, zero, 1 | |
| bne a3, s0, .LBB22_42 | |
| # %bb.23: # %assert_end30 | |
| lw a2, 12(a2) | |
| sext.w a3, a6 | |
| bne a3, a2, .LBB22_44 | |
| # %bb.24: # %assert_end32 | |
| # All checks passed: a0 = arg1 data, a1 = arg0 data; return 0 afterwards. | |
| call fuse_sigmoid_compute_ | |
| mv a0, zero | |
| j .LBB22_29 | |
| # ---- Failure stubs. Each loads the function pointer stored at __TVMAPISetLastError | |
| # into a1 and the address of its message string into a0, then joins a shared tail. | |
| .LBB22_25: # %assert_fail7 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.137) | |
| addi a0, a0, %lo(.L.str.137) | |
| j .LBB22_27 | |
| .LBB22_26: # %assert_fail9 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.138) | |
| addi a0, a0, %lo(.L.str.138) | |
| .LBB22_27: # %assert_fail | |
| # Shared tail 1: report the error, then a0 = (1 << 32) - 1 = 0xFFFFFFFF. | |
| jalr a1 | |
| addi a0, zero, 1 | |
| slli a0, a0, 32 | |
| .LBB22_28: # %assert_fail1 | |
| addi a0, a0, -1 | |
| .LBB22_29: # %assert_fail1 | |
| # Common epilogue for success and failure: restore s1, s0, ra and pop the frame. | |
| ld s1, 8(sp) | |
| ld s0, 16(sp) | |
| ld ra, 24(sp) | |
| .cfi_restore ra | |
| .cfi_restore s0 | |
| .cfi_restore s1 | |
| addi sp, sp, 32 | |
| .cfi_def_cfa_offset 0 | |
| ret | |
| .LBB22_30: # %assert_fail | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.136) | |
| addi a0, a0, %lo(.L.str.136) | |
| j .LBB22_27 | |
| .LBB22_31: # %assert_fail1 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.52) | |
| addi a0, a0, %lo(.L.str.52) | |
| j .LBB22_43 | |
| .LBB22_32: # %assert_fail5 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.53) | |
| addi a0, a0, %lo(.L.str.53) | |
| # Private tail: s1 still holds the 1 set just before the branch here (s1 is callee-saved), | |
| # so a0 = 1 << 32 and .LBB22_28 subtracts 1. | |
| jalr a1 | |
| slli a0, s1, 32 | |
| j .LBB22_28 | |
| .LBB22_33: # %assert_fail11 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.5) | |
| addi a0, a0, %lo(.L.str.5) | |
| j .LBB22_27 | |
| .LBB22_34: # %assert_fail13 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.56) | |
| addi a0, a0, %lo(.L.str.56) | |
| j .LBB22_43 | |
| .LBB22_35: # %assert_fail15 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.7) | |
| addi a0, a0, %lo(.L.str.7) | |
| j .LBB22_27 | |
| .LBB22_36: # %assert_fail17 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.133) | |
| addi a0, a0, %lo(.L.str.133) | |
| j .LBB22_27 | |
| .LBB22_37: # %assert_fail19 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.10) | |
| addi a0, a0, %lo(.L.str.10) | |
| j .LBB22_27 | |
| .LBB22_38: # %assert_fail21 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.58) | |
| addi a0, a0, %lo(.L.str.58) | |
| j .LBB22_43 | |
| .LBB22_39: # %assert_fail23 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.12) | |
| addi a0, a0, %lo(.L.str.12) | |
| j .LBB22_27 | |
| .LBB22_40: # %assert_fail25 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.134) | |
| addi a0, a0, %lo(.L.str.134) | |
| j .LBB22_27 | |
| .LBB22_41: # %assert_fail27 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.17) | |
| addi a0, a0, %lo(.L.str.17) | |
| j .LBB22_27 | |
| .LBB22_42: # %assert_fail29 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.18) | |
| addi a0, a0, %lo(.L.str.18) | |
| .LBB22_43: # %assert_fail1 | |
| # Shared tail 2: every branch that ends up here set s0 = 1 beforehand, so after the call | |
| # a0 = 1 << 32 and .LBB22_28 turns it into (1 << 32) - 1. | |
| jalr a1 | |
| slli a0, s0, 32 | |
| j .LBB22_28 | |
| .LBB22_44: # %assert_fail31 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.19) | |
| addi a0, a0, %lo(.L.str.19) | |
| j .LBB22_27 | |
| .Lfunc_end22: | |
| .size fuse_sigmoid, .Lfunc_end22-fuse_sigmoid | |
| .cfi_endproc | |
| # -- End function | |
| # ---------------------------------------------------------------------- | |
| # fuse_sigmoid_compute_ -- scalar loop: dst[i] = 1.0f / (1.0f + expf(0.0f - src[i])). | |
| # In: a0 = destination base, a1 = source base. | |
| # The loop walks byte offsets 0, 4, ..., 396 (100 four-byte elements). | |
| # Frame: 48 bytes; saves ra and s0-s3; 0(sp) holds 1.0f and 4(sp) holds 0.0f. | |
| # The float argument to expf is passed in a0 and its result is read back from a0. | |
| # ---------------------------------------------------------------------- | |
| .section .sdata,"aw",@progbits | |
| .p2align 2 # -- Begin function fuse_sigmoid_compute_ | |
| .LCPI23_0: | |
| .word 0 # float 0 | |
| .LCPI23_1: | |
| .word 1065353216 # float 1 | |
| .text | |
| .globl fuse_sigmoid_compute_ | |
| .p2align 2 | |
| .type fuse_sigmoid_compute_,@function | |
| fuse_sigmoid_compute_: # @fuse_sigmoid_compute_ | |
| # %bb.0: # %entry | |
| addi sp, sp, -48 | |
| sd ra, 40(sp) | |
| sd s0, 32(sp) | |
| sd s1, 24(sp) | |
| sd s2, 16(sp) | |
| sd s3, 8(sp) | |
| # Keep both pointers in callee-saved registers so they survive the expf calls: | |
| # s3 = source base, s1 = destination base. | |
| mv s3, a1 | |
| mv s1, a0 | |
| # Spill the two constants to the stack (4(sp) = 0.0f, 0(sp) = 1.0f); the loop reloads | |
| # them on every iteration instead of keeping them in FP registers across the call. | |
| lui a0, %hi(.LCPI23_0) | |
| addi a0, a0, %lo(.LCPI23_0) | |
| flw ft0, 0(a0) | |
| fsw ft0, 4(sp) | |
| lui a0, %hi(.LCPI23_1) | |
| addi a0, a0, %lo(.LCPI23_1) | |
| flw ft0, 0(a0) | |
| fsw ft0, 0(sp) | |
| # s2 = 400: end byte offset; s0 = current byte offset, starting at 0. | |
| addi s2, zero, 400 | |
| mv s0, zero | |
| .LBB23_1: # %for_body | |
| # =>This Inner Loop Header: Depth=1 | |
| # ft0 = 0.0f - src[s0], moved to a0 as the expf argument. | |
| add a0, s3, s0 | |
| flw ft0, 0(a0) | |
| flw ft1, 4(sp) | |
| fsub.s ft0, ft1, ft0 | |
| fmv.x.w a0, ft0 | |
| call expf | |
| # ft0 = expf result; ft1 = 1.0f; store 1.0f / (expf result + 1.0f) to dst[s0]. | |
| fmv.w.x ft0, a0 | |
| flw ft1, 0(sp) | |
| fadd.s ft0, ft0, ft1 | |
| fdiv.s ft0, ft1, ft0 | |
| add a0, s1, s0 | |
| fsw ft0, 0(a0) | |
| # Next element: advance the byte offset by 4 until it reaches 400. | |
| addi s0, s0, 4 | |
| bne s0, s2, .LBB23_1 | |
| # %bb.2: # %for_end | |
| ld s3, 8(sp) | |
| ld s2, 16(sp) | |
| ld s1, 24(sp) | |
| ld s0, 32(sp) | |
| ld ra, 40(sp) | |
| addi sp, sp, 48 | |
| ret | |
| .Lfunc_end23: | |
| .size fuse_sigmoid_compute_, .Lfunc_end23-fuse_sigmoid_compute_ | |
| # -- End function | |
| .globl fuse_matmul_1 # -- Begin function fuse_matmul_1 | |
| .p2align 2 | |
| .type fuse_matmul_1,@function | |
| fuse_matmul_1: # @fuse_matmul_1 | |
| .cfi_startproc | |
| # %bb.0: # %entry | |
| addi sp, sp, -32 | |
| .cfi_def_cfa_offset 32 | |
| sd ra, 24(sp) | |
| sd s0, 16(sp) | |
| sd s1, 8(sp) | |
| .cfi_offset ra, -8 | |
| .cfi_offset s0, -16 | |
| .cfi_offset s1, -24 | |
| slli a2, a2, 32 | |
| srli a2, a2, 32 | |
| addi a3, zero, 3 | |
| bne a2, a3, .LBB24_49 | |
| # %bb.1: # %assert_end | |
| lwu t2, 8(a1) | |
| ld t5, 16(a0) | |
| lwu t3, 4(a1) | |
| ld a4, 8(a0) | |
| lwu t6, 0(a1) | |
| ld a5, 0(a0) | |
| ld t1, 24(a5) | |
| ld a1, 0(a5) | |
| ld a0, 32(a5) | |
| beqz a0, .LBB24_4 | |
| # %bb.2: # %if_then | |
| lw a2, 0(a0) | |
| addi s0, zero, 100 | |
| bne a2, s0, .LBB24_50 | |
| # %bb.3: # %if_then | |
| ld a0, 8(a0) | |
| slli a0, a0, 32 | |
| srli a0, a0, 32 | |
| addi a2, zero, 1 | |
| bne a0, a2, .LBB24_50 | |
| .LBB24_4: # %if_end | |
| ld t0, 24(a4) | |
| ld a2, 0(a4) | |
| lwu a6, 12(a5) | |
| lwu t4, 8(a5) | |
| ld a0, 32(a4) | |
| beqz a0, .LBB24_7 | |
| # %bb.5: # %if_then3 | |
| lw s0, 0(a0) | |
| addi a3, zero, 10 | |
| bne s0, a3, .LBB24_51 | |
| # %bb.6: # %if_then3 | |
| ld a0, 8(a0) | |
| slli a0, a0, 32 | |
| srli a0, a0, 32 | |
| addi a3, zero, 1 | |
| bne a0, a3, .LBB24_51 | |
| .LBB24_7: # %if_end4 | |
| ld a7, 24(t5) | |
| ld a0, 0(t5) | |
| ld s0, 32(t5) | |
| beqz s0, .LBB24_10 | |
| # %bb.8: # %if_then7 | |
| lw a3, 0(s0) | |
| addi s1, zero, 10 | |
| bne a3, s1, .LBB24_52 | |
| # %bb.9: # %if_then7 | |
| ld a3, 8(s0) | |
| slli a3, a3, 32 | |
| srli a3, a3, 32 | |
| addi s0, zero, 1 | |
| bne a3, s0, .LBB24_52 | |
| .LBB24_10: # %if_end8 | |
| addi a3, zero, 13 | |
| bltu a3, t6, .LBB24_43 | |
| # %bb.11: # %if_end8 | |
| addi a3, zero, 1 | |
| sll a3, a3, t6 | |
| lui s1, 2 | |
| addiw s1, s1, 152 | |
| and a3, a3, s1 | |
| beqz a3, .LBB24_43 | |
| # %bb.12: # %assert_end12 | |
| addi a3, zero, 13 | |
| bltu a3, t3, .LBB24_44 | |
| # %bb.13: # %assert_end12 | |
| addi a3, zero, 1 | |
| sll a3, a3, t3 | |
| lui s1, 2 | |
| addiw s1, s1, 152 | |
| and a3, a3, s1 | |
| beqz a3, .LBB24_44 | |
| # %bb.14: # %assert_end14 | |
| addi a3, zero, 13 | |
| bltu a3, t2, .LBB24_45 | |
| # %bb.15: # %assert_end14 | |
| addi a3, zero, 1 | |
| sll s1, a3, t2 | |
| lui s0, 2 | |
| addiw s0, s0, 152 | |
| and s1, s1, s0 | |
| beqz s1, .LBB24_45 | |
| # %bb.16: # %assert_end16 | |
| bne t4, a3, .LBB24_53 | |
| # %bb.17: # %assert_end18 | |
| lw a3, 16(a5) | |
| addi s1, zero, 2 | |
| bne a3, s1, .LBB24_54 | |
| # %bb.18: # %assert_end20 | |
| lhu a3, 22(a5) | |
| addi s0, zero, 1 | |
| bne a3, s0, .LBB24_55 | |
| # %bb.19: # %assert_end20 | |
| lbu a3, 21(a5) | |
| addi s1, zero, 32 | |
| bne a3, s1, .LBB24_55 | |
| # %bb.20: # %assert_end20 | |
| lbu a3, 20(a5) | |
| addi s1, zero, 2 | |
| bne a3, s1, .LBB24_55 | |
| # %bb.21: # %assert_end22 | |
| lw a3, 0(t1) | |
| addi s0, zero, 1 | |
| bne a3, s0, .LBB24_56 | |
| # %bb.22: # %assert_end24 | |
| lw a3, 8(t1) | |
| addi s1, zero, 100 | |
| bne a3, s1, .LBB24_57 | |
| # %bb.23: # %assert_end26 | |
| ld a3, 40(a5) | |
| bnez a3, .LBB24_58 | |
| # %bb.24: # %assert_end28 | |
| lw a3, 16(a4) | |
| addi a5, zero, 2 | |
| bne a3, a5, .LBB24_59 | |
| # %bb.25: # %assert_end30 | |
| lhu a3, 22(a4) | |
| addi s0, zero, 1 | |
| bne a3, s0, .LBB24_60 | |
| # %bb.26: # %assert_end30 | |
| lbu a3, 21(a4) | |
| addi a5, zero, 32 | |
| bne a3, a5, .LBB24_60 | |
| # %bb.27: # %assert_end30 | |
| lbu a3, 20(a4) | |
| addi a5, zero, 2 | |
| bne a3, a5, .LBB24_60 | |
| # %bb.28: # %assert_end32 | |
| lw a3, 0(t0) | |
| addi a5, zero, 100 | |
| bne a3, a5, .LBB24_61 | |
| # %bb.29: # %assert_end34 | |
| lw a3, 8(t0) | |
| addi a5, zero, 10 | |
| bne a3, a5, .LBB24_62 | |
| # %bb.30: # %assert_end36 | |
| ld a3, 40(a4) | |
| bnez a3, .LBB24_63 | |
| # %bb.31: # %assert_end38 | |
| lw a3, 8(a4) | |
| addi s0, zero, 1 | |
| bne a3, s0, .LBB24_64 | |
| # %bb.32: # %assert_end40 | |
| lw a4, 12(a4) | |
| sext.w a3, a6 | |
| bne a3, a4, .LBB24_65 | |
| # %bb.33: # %assert_end42 | |
| lw a4, 16(t5) | |
| addi a5, zero, 2 | |
| bne a4, a5, .LBB24_66 | |
| # %bb.34: # %assert_end44 | |
| lhu a4, 22(t5) | |
| addi s0, zero, 1 | |
| bne a4, s0, .LBB24_67 | |
| # %bb.35: # %assert_end44 | |
| lbu a4, 21(t5) | |
| addi a5, zero, 32 | |
| bne a4, a5, .LBB24_67 | |
| # %bb.36: # %assert_end44 | |
| lbu a4, 20(t5) | |
| addi a5, zero, 2 | |
| bne a4, a5, .LBB24_67 | |
| # %bb.37: # %assert_end46 | |
| lw a4, 0(a7) | |
| addi s0, zero, 1 | |
| bne a4, s0, .LBB24_68 | |
| # %bb.38: # %assert_end48 | |
| lw a4, 8(a7) | |
| addi a5, zero, 10 | |
| bne a4, a5, .LBB24_69 | |
| # %bb.39: # %assert_end50 | |
| ld a4, 40(t5) | |
| bnez a4, .LBB24_70 | |
| # %bb.40: # %assert_end52 | |
| lw a4, 8(t5) | |
| addi s0, zero, 1 | |
| bne a4, s0, .LBB24_71 | |
| # %bb.41: # %assert_end54 | |
| lw a4, 12(t5) | |
| bne a3, a4, .LBB24_73 | |
| # %bb.42: # %assert_end56 | |
| call fuse_matmul_1_compute_ | |
| mv a0, zero | |
| j .LBB24_48 | |
| .LBB24_43: # %assert_fail11 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.143) | |
| addi a0, a0, %lo(.L.str.143) | |
| j .LBB24_46 | |
| .LBB24_44: # %assert_fail13 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.144) | |
| addi a0, a0, %lo(.L.str.144) | |
| j .LBB24_46 | |
| .LBB24_45: # %assert_fail15 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.145) | |
| addi a0, a0, %lo(.L.str.145) | |
| .LBB24_46: # %assert_fail | |
| jalr a1 | |
| addi a0, zero, 1 | |
| slli a0, a0, 32 | |
| .LBB24_47: # %assert_fail21 | |
| addi a0, a0, -1 | |
| .LBB24_48: # %assert_fail21 | |
| ld s1, 8(sp) | |
| ld s0, 16(sp) | |
| ld ra, 24(sp) | |
| .cfi_restore ra | |
| .cfi_restore s0 | |
| .cfi_restore s1 | |
| addi sp, sp, 32 | |
| .cfi_def_cfa_offset 0 | |
| ret | |
| .LBB24_49: # %assert_fail | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.139) | |
| addi a0, a0, %lo(.L.str.139) | |
| j .LBB24_46 | |
| .LBB24_50: # %assert_fail1 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.140) | |
| addi a0, a0, %lo(.L.str.140) | |
| j .LBB24_46 | |
| .LBB24_51: # %assert_fail5 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.141) | |
| addi a0, a0, %lo(.L.str.141) | |
| j .LBB24_46 | |
| .LBB24_52: # %assert_fail9 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.142) | |
| addi a0, a0, %lo(.L.str.142) | |
| j .LBB24_46 | |
| .LBB24_53: # %assert_fail17 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.5) | |
| addi a0, a0, %lo(.L.str.5) | |
| j .LBB24_46 | |
| .LBB24_54: # %assert_fail19 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.6) | |
| addi a0, a0, %lo(.L.str.6) | |
| j .LBB24_46 | |
| .LBB24_55: # %assert_fail21 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.7) | |
| addi a0, a0, %lo(.L.str.7) | |
| j .LBB24_72 | |
| .LBB24_56: # %assert_fail23 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.8) | |
| addi a0, a0, %lo(.L.str.8) | |
| j .LBB24_72 | |
| .LBB24_57: # %assert_fail25 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.146) | |
| addi a0, a0, %lo(.L.str.146) | |
| j .LBB24_46 | |
| .LBB24_58: # %assert_fail27 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.10) | |
| addi a0, a0, %lo(.L.str.10) | |
| j .LBB24_46 | |
| .LBB24_59: # %assert_fail29 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.114) | |
| addi a0, a0, %lo(.L.str.114) | |
| j .LBB24_46 | |
| .LBB24_60: # %assert_fail31 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.12) | |
| addi a0, a0, %lo(.L.str.12) | |
| j .LBB24_72 | |
| .LBB24_61: # %assert_fail33 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.134) | |
| addi a0, a0, %lo(.L.str.134) | |
| j .LBB24_46 | |
| .LBB24_62: # %assert_fail35 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.147) | |
| addi a0, a0, %lo(.L.str.147) | |
| j .LBB24_46 | |
| .LBB24_63: # %assert_fail37 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.17) | |
| addi a0, a0, %lo(.L.str.17) | |
| j .LBB24_46 | |
| .LBB24_64: # %assert_fail39 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.18) | |
| addi a0, a0, %lo(.L.str.18) | |
| j .LBB24_72 | |
| .LBB24_65: # %assert_fail41 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.19) | |
| addi a0, a0, %lo(.L.str.19) | |
| j .LBB24_46 | |
| .LBB24_66: # %assert_fail43 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.126) | |
| addi a0, a0, %lo(.L.str.126) | |
| j .LBB24_46 | |
| .LBB24_67: # %assert_fail45 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.37) | |
| addi a0, a0, %lo(.L.str.37) | |
| j .LBB24_72 | |
| .LBB24_68: # %assert_fail47 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.127) | |
| addi a0, a0, %lo(.L.str.127) | |
| j .LBB24_72 | |
| .LBB24_69: # %assert_fail49 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.148) | |
| addi a0, a0, %lo(.L.str.148) | |
| j .LBB24_46 | |
| .LBB24_70: # %assert_fail51 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.39) | |
| addi a0, a0, %lo(.L.str.39) | |
| j .LBB24_46 | |
| .LBB24_71: # %assert_fail53 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.40) | |
| addi a0, a0, %lo(.L.str.40) | |
| .LBB24_72: # %assert_fail21 | |
| jalr a1 | |
| slli a0, s0, 32 | |
| j .LBB24_47 | |
| .LBB24_73: # %assert_fail55 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.41) | |
| addi a0, a0, %lo(.L.str.41) | |
| j .LBB24_46 | |
| .Lfunc_end24: | |
| .size fuse_matmul_1, .Lfunc_end24-fuse_matmul_1 | |
| .cfi_endproc | |
| # -- End function | |
| .section .sdata,"aw",@progbits | |
| .p2align 2 # -- Begin function fuse_matmul_1_compute_ | |
| .LCPI25_0: | |
| .word 0 # float 0 | |
| .text | |
| .globl fuse_matmul_1_compute_ | |
| .p2align 2 | |
| .type fuse_matmul_1_compute_,@function | |
| # fuse_matmul_1_compute_(a0 = out, a1 = lhs, a2 = rhs) | |
| # out[j] = sum over k of lhs[k] * rhs[k][j], for j = 0..9 and k = 0..99. | |
| # All elements are 4-byte single-precision values; consecutive k rows of | |
| # rhs are 40 bytes apart. Products are accumulated in ascending k order, | |
| # starting from the 0.0 constant at .LCPI25_0, with separate fmul.s/fadd.s. | |
| # Clobbers a3-a5, t0-t4, ft0-ft2; uses no stack. | |
| fuse_matmul_1_compute_: # @fuse_matmul_1_compute_ | |
| lui t0, %hi(.LCPI25_0) | |
| addi t0, t0, %lo(.LCPI25_0) # t0 = address of the 0.0 seed | |
| addi t1, zero, 400 # byte length of lhs (100 elements) | |
| addi t2, zero, 40 # byte length of out (10 elements) | |
| mv t3, zero # t3 = byte offset of the current output column | |
| .LBB25_column: # one pass per output element | |
| add t4, a0, t3 # t4 = address of out[j] | |
| sw zero, 0(t4) # clear the slot before accumulating | |
| flw ft0, 0(t0) # ft0 = running sum, reset to 0.0 | |
| add a3, a2, t3 # a3 = address of rhs[0][j] | |
| mv a5, zero # a5 = byte offset into lhs | |
| .LBB25_dot: # inner product over k | |
| add a4, a1, a5 | |
| flw ft1, 0(a4) # lhs[k] | |
| flw ft2, 0(a3) # rhs[k][j] | |
| fmul.s ft1, ft1, ft2 | |
| fadd.s ft0, ft1, ft0 | |
| addi a3, a3, 40 # next rhs row, same column | |
| addi a5, a5, 4 # next lhs element | |
| bne a5, t1, .LBB25_dot | |
| fsw ft0, 0(t4) # out[j] = accumulated sum | |
| addi t3, t3, 4 | |
| bne t3, t2, .LBB25_column | |
| ret | |
| .Lfunc_end25: | |
| .size fuse_matmul_1_compute_, .Lfunc_end25-fuse_matmul_1_compute_ | |
| # -- End function | |
| .globl fuse_elemwise_add_1 # -- Begin function fuse_elemwise_add_1 | |
| .p2align 2 | |
| .type fuse_elemwise_add_1,@function | |
| fuse_elemwise_add_1: # @fuse_elemwise_add_1 -- validates three call arguments, then runs fuse_elemwise_add_1_compute_; returns a0 = 0 on success and a0 = 0xFFFFFFFF after any failed check | |
| .cfi_startproc | |
| # %bb.0: # %entry -- in: a0 = array of 8-byte argument values, a1 = array of 4-byte type codes, a2 = argument count (only the low 32 bits are compared); saves ra/s0/s1 in a 32-byte frame and requires the count to be 3 | |
| addi sp, sp, -32 | |
| .cfi_def_cfa_offset 32 | |
| sd ra, 24(sp) | |
| sd s0, 16(sp) | |
| sd s1, 8(sp) | |
| .cfi_offset ra, -8 | |
| .cfi_offset s0, -16 | |
| .cfi_offset s1, -24 | |
| slli a2, a2, 32 | |
| srli a2, a2, 32 | |
| addi a3, zero, 3 | |
| bne a2, a3, .LBB26_43 | |
| # %bb.1: # %assert_end -- a3/t3/t2 = type codes 0/1/2; a5/a4/t5 = argument pointers 0/1/2 (called arg0/arg1/arg2 below); from arg0: t1 = pointer at +24, a1 = pointer at +0, a0 = pointer at +32 (presumably the DLTensor shape, data and strides fields -- confirm); a null +32 pointer skips the next check | |
| lwu t2, 8(a1) | |
| ld t5, 16(a0) | |
| lwu t3, 4(a1) | |
| ld a4, 8(a0) | |
| lwu a3, 0(a1) | |
| ld a5, 0(a0) | |
| ld t1, 24(a5) | |
| ld a1, 0(a5) | |
| ld a0, 32(a5) | |
| beqz a0, .LBB26_3 | |
| # %bb.2: # %if_then -- first 32-bit word behind arg0's +32 pointer must be 1; s0 = 1 is reused by the shared failure tail .LBB26_63 | |
| lw a0, 0(a0) | |
| addi s0, zero, 1 | |
| bne a0, s0, .LBB26_44 | |
| .LBB26_3: # %if_end -- same loads for arg1 (t0 = +24 pointer, a2 = +0 pointer); also a7 = arg0 word at +12 and t4 = arg0 word at +8, both checked later | |
| ld t0, 24(a4) | |
| ld a2, 0(a4) | |
| lwu a7, 12(a5) | |
| lwu t4, 8(a5) | |
| ld a0, 32(a4) | |
| beqz a0, .LBB26_5 | |
| # %bb.4: # %if_then3 -- first word behind arg1's +32 pointer must be 1 | |
| lw a0, 0(a0) | |
| addi s0, zero, 1 | |
| bne a0, s0, .LBB26_45 | |
| .LBB26_5: # %if_end4 -- same loads for arg2 (a6 = +24 pointer, a0 = +0 pointer, which stays in a0 until the compute call) | |
| ld a6, 24(t5) | |
| ld a0, 0(t5) | |
| ld s0, 32(t5) | |
| beqz s0, .LBB26_7 | |
| # %bb.6: # %if_then7 -- first word behind arg2's +32 pointer must be 1; the constant lives in s1 here, which is why .LBB26_46 has its own tail | |
| lw s0, 0(s0) | |
| addi s1, zero, 1 | |
| bne s0, s1, .LBB26_46 | |
| .LBB26_7: # %if_end8 -- type code 0 must be at most 13 (unsigned compare) | |
| addi s1, zero, 13 | |
| bltu s1, a3, .LBB26_37 | |
| # %bb.8: # %if_end8 -- bit test against mask 0x2098 (lui 2 + 152): only codes 3, 4, 7 and 13 pass | |
| addi s1, zero, 1 | |
| sll a3, s1, a3 | |
| lui s1, 2 | |
| addiw s1, s1, 152 | |
| and a3, a3, s1 | |
| beqz a3, .LBB26_37 | |
| # %bb.9: # %assert_end12 -- type code 1 must be at most 13 | |
| addi a3, zero, 13 | |
| bltu a3, t3, .LBB26_38 | |
| # %bb.10: # %assert_end12 -- type code 1 must be one of 3, 4, 7, 13 (same 0x2098 mask) | |
| addi a3, zero, 1 | |
| sll a3, a3, t3 | |
| lui s1, 2 | |
| addiw s1, s1, 152 | |
| and a3, a3, s1 | |
| beqz a3, .LBB26_38 | |
| # %bb.11: # %assert_end14 -- type code 2 must be at most 13 | |
| addi a3, zero, 13 | |
| bltu a3, t2, .LBB26_39 | |
| # %bb.12: # %assert_end14 -- type code 2 must be one of 3, 4, 7, 13; a3 is left holding 1 for the next compare | |
| addi a3, zero, 1 | |
| sll s1, a3, t2 | |
| lui s0, 2 | |
| addiw s0, s0, 152 | |
| and s1, s1, s0 | |
| beqz s1, .LBB26_39 | |
| # %bb.13: # %assert_end16 -- arg0 word at +8 (t4) must be 1; the failure message .L.str.5 names this value dev_type | |
| bne t4, a3, .LBB26_47 | |
| # %bb.14: # %assert_end18 -- arg0 word at +16 must be 1 (presumably ndim -- confirm against .L.str.56) | |
| lw a3, 16(a5) | |
| addi s0, zero, 1 | |
| bne a3, s0, .LBB26_48 | |
| # %bb.15: # %assert_end20 -- arg0 halfword at +22 must be 1 (s0 still holds 1) | |
| lhu a3, 22(a5) | |
| bne a3, s0, .LBB26_49 | |
| # %bb.16: # %assert_end20 -- arg0 byte at +21 must be 32 | |
| lbu a3, 21(a5) | |
| addi s1, zero, 32 | |
| bne a3, s1, .LBB26_49 | |
| # %bb.17: # %assert_end20 -- arg0 byte at +20 must be 2 (bytes 20..23 together presumably encode a 32-bit float, single-lane dtype -- confirm) | |
| lbu a3, 20(a5) | |
| addi s1, zero, 2 | |
| bne a3, s1, .LBB26_49 | |
| # %bb.18: # %assert_end22 -- first word behind arg0's +24 pointer must be 10 (presumably shape[0]) | |
| lw a3, 0(t1) | |
| addi s1, zero, 10 | |
| bne a3, s1, .LBB26_50 | |
| # %bb.19: # %assert_end24 -- arg0 doubleword at +40 must be 0 (presumably byte_offset -- confirm) | |
| ld a3, 40(a5) | |
| bnez a3, .LBB26_51 | |
| # %bb.20: # %assert_end26 -- arg1 word at +16 must be 1 | |
| lw a3, 16(a4) | |
| addi s0, zero, 1 | |
| bne a3, s0, .LBB26_52 | |
| # %bb.21: # %assert_end28 -- arg1 halfword at +22 must be 1 | |
| lhu a3, 22(a4) | |
| bne a3, s0, .LBB26_53 | |
| # %bb.22: # %assert_end28 -- arg1 byte at +21 must be 32; a5 (arg0) is no longer needed and is reused as scratch from here on | |
| lbu a3, 21(a4) | |
| addi a5, zero, 32 | |
| bne a3, a5, .LBB26_53 | |
| # %bb.23: # %assert_end28 -- arg1 byte at +20 must be 2 | |
| lbu a3, 20(a4) | |
| addi a5, zero, 2 | |
| bne a3, a5, .LBB26_53 | |
| # %bb.24: # %assert_end30 -- first word behind arg1's +24 pointer must be 10 | |
| lw a3, 0(t0) | |
| addi a5, zero, 10 | |
| bne a3, a5, .LBB26_54 | |
| # %bb.25: # %assert_end32 -- arg1 doubleword at +40 must be 0 | |
| ld a3, 40(a4) | |
| bnez a3, .LBB26_55 | |
| # %bb.26: # %assert_end34 -- arg1 word at +8 must be 1 | |
| lw a3, 8(a4) | |
| addi s0, zero, 1 | |
| bne a3, s0, .LBB26_56 | |
| # %bb.27: # %assert_end36 -- arg1 word at +12 must equal arg0's word at +12 (a7, sign-extended into a3 and kept for the arg2 comparison) | |
| lw a4, 12(a4) | |
| sext.w a3, a7 | |
| bne a3, a4, .LBB26_57 | |
| # %bb.28: # %assert_end38 -- arg2 word at +16 must be 1 | |
| lw a4, 16(t5) | |
| addi s0, zero, 1 | |
| bne a4, s0, .LBB26_58 | |
| # %bb.29: # %assert_end40 -- arg2 halfword at +22 must be 1 | |
| lhu a4, 22(t5) | |
| bne a4, s0, .LBB26_59 | |
| # %bb.30: # %assert_end40 -- arg2 byte at +21 must be 32 | |
| lbu a4, 21(t5) | |
| addi a5, zero, 32 | |
| bne a4, a5, .LBB26_59 | |
| # %bb.31: # %assert_end40 -- arg2 byte at +20 must be 2 | |
| lbu a4, 20(t5) | |
| addi a5, zero, 2 | |
| bne a4, a5, .LBB26_59 | |
| # %bb.32: # %assert_end42 -- first word behind arg2's +24 pointer must be 10 | |
| lw a4, 0(a6) | |
| addi a5, zero, 10 | |
| bne a4, a5, .LBB26_60 | |
| # %bb.33: # %assert_end44 -- arg2 doubleword at +40 must be 0 | |
| ld a4, 40(t5) | |
| bnez a4, .LBB26_61 | |
| # %bb.34: # %assert_end46 -- arg2 word at +8 must be 1 | |
| lw a4, 8(t5) | |
| addi s0, zero, 1 | |
| bne a4, s0, .LBB26_62 | |
| # %bb.35: # %assert_end48 -- arg2 word at +12 must equal arg0's word at +12 (still in a3) | |
| lw a4, 12(t5) | |
| bne a3, a4, .LBB26_64 | |
| # %bb.36: # %assert_end50 -- all checks passed: call the kernel with a0 = arg2 +0 pointer, a1 = arg0 +0 pointer, a2 = arg1 +0 pointer (loaded above), then return 0 | |
| call fuse_elemwise_add_1_compute_ | |
| mv a0, zero | |
| j .LBB26_42 | |
| .LBB26_37: # %assert_fail11 -- type code 0 rejected; every failure block loads the function pointer stored in __TVMAPISetLastError into a1 and the message address into a0 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.150) | |
| addi a0, a0, %lo(.L.str.150) | |
| j .LBB26_40 | |
| .LBB26_38: # %assert_fail13 -- type code 1 rejected | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.151) | |
| addi a0, a0, %lo(.L.str.151) | |
| j .LBB26_40 | |
| .LBB26_39: # %assert_fail15 -- type code 2 rejected; falls through into the shared tail | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.152) | |
| addi a0, a0, %lo(.L.str.152) | |
| .LBB26_40: # %assert_fail -- shared failure tail: call the handler through a1, then build 1 shifted left by 32 | |
| jalr a1 | |
| addi a0, zero, 1 | |
| slli a0, a0, 32 | |
| .LBB26_41: # %assert_fail1 -- subtract 1, so a0 = 0xFFFFFFFF (upper 32 bits clear) | |
| addi a0, a0, -1 | |
| .LBB26_42: # %assert_fail1 -- common epilogue for success and failure: restore s1/s0/ra, release the frame, return a0 | |
| ld s1, 8(sp) | |
| ld s0, 16(sp) | |
| ld ra, 24(sp) | |
| .cfi_restore ra | |
| .cfi_restore s0 | |
| .cfi_restore s1 | |
| addi sp, sp, 32 | |
| .cfi_def_cfa_offset 0 | |
| ret | |
| .LBB26_43: # %assert_fail -- argument count was not 3 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.149) | |
| addi a0, a0, %lo(.L.str.149) | |
| j .LBB26_40 | |
| .LBB26_44: # %assert_fail1 -- word behind arg0's +32 pointer was not 1; uses the tail that relies on s0 = 1 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.52) | |
| addi a0, a0, %lo(.L.str.52) | |
| j .LBB26_63 | |
| .LBB26_45: # %assert_fail5 -- word behind arg1's +32 pointer was not 1 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.53) | |
| addi a0, a0, %lo(.L.str.53) | |
| j .LBB26_63 | |
| .LBB26_46: # %assert_fail9 -- word behind arg2's +32 pointer was not 1; private tail because the constant 1 is in callee-saved s1, which survives the jalr | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.23) | |
| addi a0, a0, %lo(.L.str.23) | |
| jalr a1 | |
| slli a0, s1, 32 | |
| j .LBB26_41 | |
| .LBB26_47: # %assert_fail17 -- arg0 word at +8 was not 1 (message .L.str.5: dev_type) | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.5) | |
| addi a0, a0, %lo(.L.str.5) | |
| j .LBB26_40 | |
| .LBB26_48: # %assert_fail19 -- arg0 word at +16 was not 1 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.56) | |
| addi a0, a0, %lo(.L.str.56) | |
| j .LBB26_63 | |
| .LBB26_49: # %assert_fail21 -- arg0 bytes at +20..+23 did not match 2 / 32 / 1 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.7) | |
| addi a0, a0, %lo(.L.str.7) | |
| j .LBB26_40 | |
| .LBB26_50: # %assert_fail23 -- first word behind arg0's +24 pointer was not 10 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.153) | |
| addi a0, a0, %lo(.L.str.153) | |
| j .LBB26_40 | |
| .LBB26_51: # %assert_fail25 -- arg0 doubleword at +40 was not 0 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.10) | |
| addi a0, a0, %lo(.L.str.10) | |
| j .LBB26_40 | |
| .LBB26_52: # %assert_fail27 -- arg1 word at +16 was not 1 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.58) | |
| addi a0, a0, %lo(.L.str.58) | |
| j .LBB26_63 | |
| .LBB26_53: # %assert_fail29 -- arg1 bytes at +20..+23 did not match 2 / 32 / 1 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.12) | |
| addi a0, a0, %lo(.L.str.12) | |
| j .LBB26_40 | |
| .LBB26_54: # %assert_fail31 -- first word behind arg1's +24 pointer was not 10 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.154) | |
| addi a0, a0, %lo(.L.str.154) | |
| j .LBB26_40 | |
| .LBB26_55: # %assert_fail33 -- arg1 doubleword at +40 was not 0 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.17) | |
| addi a0, a0, %lo(.L.str.17) | |
| j .LBB26_40 | |
| .LBB26_56: # %assert_fail35 -- arg1 word at +8 was not 1 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.18) | |
| addi a0, a0, %lo(.L.str.18) | |
| j .LBB26_63 | |
| .LBB26_57: # %assert_fail37 -- arg1 word at +12 differed from arg0's word at +12 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.19) | |
| addi a0, a0, %lo(.L.str.19) | |
| j .LBB26_40 | |
| .LBB26_58: # %assert_fail39 -- arg2 word at +16 was not 1 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.36) | |
| addi a0, a0, %lo(.L.str.36) | |
| j .LBB26_63 | |
| .LBB26_59: # %assert_fail41 -- arg2 bytes at +20..+23 did not match 2 / 32 / 1 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.37) | |
| addi a0, a0, %lo(.L.str.37) | |
| j .LBB26_40 | |
| .LBB26_60: # %assert_fail43 -- first word behind arg2's +24 pointer was not 10 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.155) | |
| addi a0, a0, %lo(.L.str.155) | |
| j .LBB26_40 | |
| .LBB26_61: # %assert_fail45 -- arg2 doubleword at +40 was not 0 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.39) | |
| addi a0, a0, %lo(.L.str.39) | |
| j .LBB26_40 | |
| .LBB26_62: # %assert_fail47 -- arg2 word at +8 was not 1; falls through into the s0-based tail | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.40) | |
| addi a0, a0, %lo(.L.str.40) | |
| .LBB26_63: # %assert_fail1 -- alternate failure tail: every block that jumps here left s0 = 1, so s0 shifted left by 32 minus 1 (at .LBB26_41) gives the same 0xFFFFFFFF | |
| jalr a1 | |
| slli a0, s0, 32 | |
| j .LBB26_41 | |
| .LBB26_64: # %assert_fail49 -- arg2 word at +12 differed from arg0's word at +12 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.41) | |
| addi a0, a0, %lo(.L.str.41) | |
| j .LBB26_40 | |
| .Lfunc_end26: | |
| .size fuse_elemwise_add_1, .Lfunc_end26-fuse_elemwise_add_1 | |
| .cfi_endproc | |
| # -- End function | |
| .globl fuse_elemwise_add_1_compute_ # -- Begin function fuse_elemwise_add_1_compute_ | |
| .p2align 2 | |
| .type fuse_elemwise_add_1_compute_,@function | |
| # fuse_elemwise_add_1_compute_(a0 = out, a1 = x, a2 = y) | |
| # out[i] = y[i] + x[i] for the ten 4-byte single-precision elements at | |
| # byte offsets 0..36. Elements are processed in ascending order, each one | |
| # loaded from x, then y, added, and stored before the next is read. | |
| # Clobbers a3-a5, ft0, ft1; uses no stack. | |
| fuse_elemwise_add_1_compute_: # @fuse_elemwise_add_1_compute_ | |
| mv a3, zero # a3 = byte offset of the current element | |
| addi a4, zero, 40 # one past the last offset (10 elements) | |
| .LBB27_next: # per-element loop | |
| add a5, a1, a3 | |
| flw ft0, 0(a5) # x[i] | |
| add a5, a2, a3 | |
| flw ft1, 0(a5) # y[i] | |
| fadd.s ft0, ft1, ft0 | |
| add a5, a0, a3 | |
| fsw ft0, 0(a5) # out[i] | |
| addi a3, a3, 4 | |
| bne a3, a4, .LBB27_next | |
| ret | |
| .Lfunc_end27: | |
| .size fuse_elemwise_add_1_compute_, .Lfunc_end27-fuse_elemwise_add_1_compute_ | |
| # -- End function | |
| .globl fuse_softmax # -- Begin function fuse_softmax | |
| .p2align 2 | |
| .type fuse_softmax,@function | |
| fuse_softmax: # @fuse_softmax -- validates two call arguments, then runs fuse_softmax_compute_; returns a0 = 0 on success and a0 = 0xFFFFFFFF after any failed check | |
| .cfi_startproc | |
| # %bb.0: # %entry -- in: a0 = array of 8-byte argument values, a1 = array of 4-byte type codes, a2 = argument count (only the low 32 bits are compared); saves ra/s0 in a 16-byte frame and requires the count to be 2 | |
| addi sp, sp, -16 | |
| .cfi_def_cfa_offset 16 | |
| sd ra, 8(sp) | |
| sd s0, 0(sp) | |
| .cfi_offset ra, -8 | |
| .cfi_offset s0, -16 | |
| slli a2, a2, 32 | |
| srli a2, a2, 32 | |
| addi a3, zero, 2 | |
| bne a2, a3, .LBB28_34 | |
| # %bb.1: # %assert_end -- t3/t2 = type codes 0/1; a5/a2 = argument pointers 0/1 (called arg0/arg1 below); from arg0: t0 = pointer at +24, a0 = pointer at +0 (kept in a0 until the compute call), a1 = pointer at +32 (presumably the DLTensor shape, data and strides fields -- confirm); a null +32 pointer skips the next two checks | |
| lwu t2, 4(a1) | |
| ld a2, 8(a0) | |
| lwu t3, 0(a1) | |
| ld a5, 0(a0) | |
| ld t0, 24(a5) | |
| ld a0, 0(a5) | |
| ld a1, 32(a5) | |
| beqz a1, .LBB28_4 | |
| # %bb.2: # %if_then -- first 32-bit word behind arg0's +32 pointer must be 10 | |
| lw s0, 0(a1) | |
| addi a4, zero, 10 | |
| bne s0, a4, .LBB28_35 | |
| # %bb.3: # %if_then -- low 32 bits of the doubleword at +8 behind that pointer must be 1 | |
| ld a1, 8(a1) | |
| slli a1, a1, 32 | |
| srli a1, a1, 32 | |
| addi a4, zero, 1 | |
| bne a1, a4, .LBB28_35 | |
| .LBB28_4: # %if_end -- same loads for arg1 (a7 = +24 pointer, a1 = +0 pointer, kept until the compute call); also a6 = arg0 word at +12 and t1 = arg0 word at +8, both checked later | |
| ld a7, 24(a2) | |
| ld a1, 0(a2) | |
| lwu a6, 12(a5) | |
| lwu t1, 8(a5) | |
| ld s0, 32(a2) | |
| beqz s0, .LBB28_7 | |
| # %bb.5: # %if_then3 -- first word behind arg1's +32 pointer must be 10 | |
| lw a4, 0(s0) | |
| addi a3, zero, 10 | |
| bne a4, a3, .LBB28_36 | |
| # %bb.6: # %if_then3 -- low 32 bits of the doubleword at +8 behind that pointer must be 1 | |
| ld a3, 8(s0) | |
| slli a3, a3, 32 | |
| srli a3, a3, 32 | |
| addi a4, zero, 1 | |
| bne a3, a4, .LBB28_36 | |
| .LBB28_7: # %if_end4 -- type code 0 must be at most 13 (unsigned compare) | |
| addi a3, zero, 13 | |
| bltu a3, t3, .LBB28_29 | |
| # %bb.8: # %if_end4 -- bit test against mask 0x2098 (lui 2 + 152): only codes 3, 4, 7 and 13 pass | |
| addi a3, zero, 1 | |
| sll a3, a3, t3 | |
| lui a4, 2 | |
| addiw a4, a4, 152 | |
| and a3, a3, a4 | |
| beqz a3, .LBB28_29 | |
| # %bb.9: # %assert_end8 -- type code 1 must be at most 13 | |
| addi a3, zero, 13 | |
| bltu a3, t2, .LBB28_30 | |
| # %bb.10: # %assert_end8 -- type code 1 must be one of 3, 4, 7, 13; a3 is left holding 1 for the next compare | |
| addi a3, zero, 1 | |
| sll a4, a3, t2 | |
| lui s0, 2 | |
| addiw s0, s0, 152 | |
| and a4, a4, s0 | |
| beqz a4, .LBB28_30 | |
| # %bb.11: # %assert_end10 -- arg0 word at +8 (t1) must be 1; the failure message .L.str.5 names this value dev_type | |
| bne t1, a3, .LBB28_37 | |
| # %bb.12: # %assert_end12 -- arg0 word at +16 must be 2; the failure message .L.str.6 calls this arg0.ndim | |
| lw a3, 16(a5) | |
| addi a4, zero, 2 | |
| bne a3, a4, .LBB28_38 | |
| # %bb.13: # %assert_end14 -- arg0 halfword at +22 must be 1; s0 = 1 is reused by the shared failure tail .LBB28_49 | |
| lhu a3, 22(a5) | |
| addi s0, zero, 1 | |
| bne a3, s0, .LBB28_39 | |
| # %bb.14: # %assert_end14 -- arg0 byte at +21 must be 32 | |
| lbu a3, 21(a5) | |
| addi a4, zero, 32 | |
| bne a3, a4, .LBB28_39 | |
| # %bb.15: # %assert_end14 -- arg0 byte at +20 must be 2 (bytes 20..23 together presumably encode a 32-bit float, single-lane dtype -- confirm) | |
| lbu a3, 20(a5) | |
| addi a4, zero, 2 | |
| bne a3, a4, .LBB28_39 | |
| # %bb.16: # %assert_end16 -- word at +0 behind arg0's +24 pointer must be 1 (presumably shape[0]) | |
| lw a3, 0(t0) | |
| addi s0, zero, 1 | |
| bne a3, s0, .LBB28_40 | |
| # %bb.17: # %assert_end18 -- word at +8 behind arg0's +24 pointer must be 10 (presumably shape[1]) | |
| lw a3, 8(t0) | |
| addi a4, zero, 10 | |
| bne a3, a4, .LBB28_41 | |
| # %bb.18: # %assert_end20 -- arg0 doubleword at +40 must be 0 (presumably byte_offset -- confirm) | |
| ld a3, 40(a5) | |
| bnez a3, .LBB28_42 | |
| # %bb.19: # %assert_end22 -- arg1 word at +16 must be 2 | |
| lw a3, 16(a2) | |
| addi a4, zero, 2 | |
| bne a3, a4, .LBB28_43 | |
| # %bb.20: # %assert_end24 -- arg1 halfword at +22 must be 1 | |
| lhu a3, 22(a2) | |
| addi s0, zero, 1 | |
| bne a3, s0, .LBB28_44 | |
| # %bb.21: # %assert_end24 -- arg1 byte at +21 must be 32 | |
| lbu a3, 21(a2) | |
| addi a4, zero, 32 | |
| bne a3, a4, .LBB28_44 | |
| # %bb.22: # %assert_end24 -- arg1 byte at +20 must be 2 | |
| lbu a3, 20(a2) | |
| addi a4, zero, 2 | |
| bne a3, a4, .LBB28_44 | |
| # %bb.23: # %assert_end26 -- word at +0 behind arg1's +24 pointer must be 1 | |
| lw a3, 0(a7) | |
| addi s0, zero, 1 | |
| bne a3, s0, .LBB28_45 | |
| # %bb.24: # %assert_end28 -- word at +8 behind arg1's +24 pointer must be 10 | |
| lw a3, 8(a7) | |
| addi a4, zero, 10 | |
| bne a3, a4, .LBB28_46 | |
| # %bb.25: # %assert_end30 -- arg1 doubleword at +40 must be 0 | |
| ld a3, 40(a2) | |
| bnez a3, .LBB28_47 | |
| # %bb.26: # %assert_end32 -- arg1 word at +8 must be 1 | |
| lw a3, 8(a2) | |
| addi s0, zero, 1 | |
| bne a3, s0, .LBB28_48 | |
| # %bb.27: # %assert_end34 -- arg1 word at +12 must equal arg0's word at +12 (a6, sign-extended) | |
| lw a2, 12(a2) | |
| sext.w a3, a6 | |
| bne a3, a2, .LBB28_50 | |
| # %bb.28: # %assert_end36 -- all checks passed: call the kernel with a0 = arg0 +0 pointer and a1 = arg1 +0 pointer (loaded above), then return 0 | |
| call fuse_softmax_compute_ | |
| mv a0, zero | |
| j .LBB28_33 | |
| .LBB28_29: # %assert_fail7 -- type code 0 rejected; every failure block loads the function pointer stored in __TVMAPISetLastError into a1 and the message address into a0 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.158) | |
| addi a0, a0, %lo(.L.str.158) | |
| j .LBB28_31 | |
| .LBB28_30: # %assert_fail9 -- type code 1 rejected; falls through into the shared tail | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.159) | |
| addi a0, a0, %lo(.L.str.159) | |
| .LBB28_31: # %assert_fail -- shared failure tail: call the handler through a1, then build 1 shifted left by 32 | |
| jalr a1 | |
| addi a0, zero, 1 | |
| slli a0, a0, 32 | |
| .LBB28_32: # %assert_fail15 -- subtract 1, so a0 = 0xFFFFFFFF (upper 32 bits clear) | |
| addi a0, a0, -1 | |
| .LBB28_33: # %assert_fail15 -- common epilogue for success and failure: restore s0/ra, release the frame, return a0 | |
| ld s0, 0(sp) | |
| ld ra, 8(sp) | |
| .cfi_restore ra | |
| .cfi_restore s0 | |
| addi sp, sp, 16 | |
| .cfi_def_cfa_offset 0 | |
| ret | |
| .LBB28_34: # %assert_fail -- argument count was not 2 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.156) | |
| addi a0, a0, %lo(.L.str.156) | |
| j .LBB28_31 | |
| .LBB28_35: # %assert_fail1 -- values behind arg0's +32 pointer were not 10 and 1 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.157) | |
| addi a0, a0, %lo(.L.str.157) | |
| j .LBB28_31 | |
| .LBB28_36: # %assert_fail5 -- values behind arg1's +32 pointer were not 10 and 1 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.141) | |
| addi a0, a0, %lo(.L.str.141) | |
| j .LBB28_31 | |
| .LBB28_37: # %assert_fail11 -- arg0 word at +8 was not 1 (message .L.str.5: dev_type) | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.5) | |
| addi a0, a0, %lo(.L.str.5) | |
| j .LBB28_31 | |
| .LBB28_38: # %assert_fail13 -- arg0 word at +16 was not 2 (message .L.str.6: arg0.ndim) | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.6) | |
| addi a0, a0, %lo(.L.str.6) | |
| j .LBB28_31 | |
| .LBB28_39: # %assert_fail15 -- arg0 bytes at +20..+23 did not match 2 / 32 / 1; uses the tail that relies on s0 = 1 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.7) | |
| addi a0, a0, %lo(.L.str.7) | |
| j .LBB28_49 | |
| .LBB28_40: # %assert_fail17 -- word at +0 behind arg0's +24 pointer was not 1 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.8) | |
| addi a0, a0, %lo(.L.str.8) | |
| j .LBB28_49 | |
| .LBB28_41: # %assert_fail19 -- word at +8 behind arg0's +24 pointer was not 10 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.160) | |
| addi a0, a0, %lo(.L.str.160) | |
| j .LBB28_31 | |
| .LBB28_42: # %assert_fail21 -- arg0 doubleword at +40 was not 0 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.10) | |
| addi a0, a0, %lo(.L.str.10) | |
| j .LBB28_31 | |
| .LBB28_43: # %assert_fail23 -- arg1 word at +16 was not 2 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.114) | |
| addi a0, a0, %lo(.L.str.114) | |
| j .LBB28_31 | |
| .LBB28_44: # %assert_fail25 -- arg1 bytes at +20..+23 did not match 2 / 32 / 1 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.12) | |
| addi a0, a0, %lo(.L.str.12) | |
| j .LBB28_49 | |
| .LBB28_45: # %assert_fail27 -- word at +0 behind arg1's +24 pointer was not 1 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.13) | |
| addi a0, a0, %lo(.L.str.13) | |
| j .LBB28_49 | |
| .LBB28_46: # %assert_fail29 -- word at +8 behind arg1's +24 pointer was not 10 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.147) | |
| addi a0, a0, %lo(.L.str.147) | |
| j .LBB28_31 | |
| .LBB28_47: # %assert_fail31 -- arg1 doubleword at +40 was not 0 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.17) | |
| addi a0, a0, %lo(.L.str.17) | |
| j .LBB28_31 | |
| .LBB28_48: # %assert_fail33 -- arg1 word at +8 was not 1; falls through into the s0-based tail | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.18) | |
| addi a0, a0, %lo(.L.str.18) | |
| .LBB28_49: # %assert_fail15 -- alternate failure tail: every block that jumps here left s0 = 1, so s0 shifted left by 32 minus 1 (at .LBB28_32) gives the same 0xFFFFFFFF | |
| jalr a1 | |
| slli a0, s0, 32 | |
| j .LBB28_32 | |
| .LBB28_50: # %assert_fail35 -- arg1 word at +12 differed from arg0's word at +12 | |
| lui a0, %hi(__TVMAPISetLastError) | |
| ld a1, %lo(__TVMAPISetLastError)(a0) | |
| lui a0, %hi(.L.str.19) | |
| addi a0, a0, %lo(.L.str.19) | |
| j .LBB28_31 | |
| .Lfunc_end28: | |
| .size fuse_softmax, .Lfunc_end28-fuse_softmax | |
| .cfi_endproc | |
| # -- End function | |
| .section .sdata,"aw",@progbits | |
| .p2align 2 # -- Begin function fuse_softmax_compute_ | |
| .LCPI29_0: | |
| .word 4286578687 # float -3.40282347E+38 | |
| .LCPI29_1: | |
| .word 0 # float 0 | |
| .text | |
| .globl fuse_softmax_compute_ | |
| .p2align 2 | |
| .type fuse_softmax_compute_,@function | |
| # fuse_softmax_compute_(a0 = in, a1 = out) | |
| # Softmax over ten 4-byte single-precision values: | |
| # m = running maximum of in[0..9], seeded with the constant at .LCPI29_0 | |
| # e[i] = expf(in[i] - m), called for i = 0..9 in ascending order | |
| # s = 0.0 + e[0] + e[1] + ... + e[9], summed left to right | |
| # out[i] = e[i] / s, stored from i = 9 down to i = 0 | |
| # Every input is read before expf is first called, and every expf call | |
| # finishes before the first store to out. expf takes and returns its float | |
| # as raw bits in a0. | |
| # Frame (80 bytes): 0..39 = in[] copy, later overwritten with e[]; | |
| # 40 = m; 48 = s2; 56 = s1; 64 = s0; 72 = ra. | |
| fuse_softmax_compute_: # @fuse_softmax_compute_ | |
| addi sp, sp, -80 | |
| sd ra, 72(sp) | |
| sd s0, 64(sp) | |
| sd s1, 56(sp) | |
| sd s2, 48(sp) | |
| mv s0, a1 # s0 = out, live across the expf calls | |
| addi s2, zero, 40 # s2 = byte length of the vectors (loop bound) | |
| # Pass 1: copy the inputs to the stack and track the maximum. | |
| lui a1, %hi(.LCPI29_0) | |
| addi a1, a1, %lo(.LCPI29_0) | |
| flw ft1, 0(a1) # ft1 = running maximum | |
| mv a2, zero # a2 = byte offset | |
| .LBB29_scan: | |
| add a3, a0, a2 | |
| flw ft0, 0(a3) # in[i] | |
| add a3, sp, a2 | |
| fsw ft0, 0(a3) # keep a copy for pass 2 | |
| flt.s a1, ft0, ft1 # keep the old maximum only when in[i] compares less than it | |
| bnez a1, .LBB29_keep | |
| fmv.s ft1, ft0 | |
| .LBB29_keep: | |
| addi a2, a2, 4 | |
| bne a2, s2, .LBB29_scan | |
| fsw ft1, 40(sp) # spill m: FP temporaries do not survive a call | |
| # Pass 2: e[i] = expf(in[i] - m), written back over the copied input. | |
| mv s1, zero # s1 = byte offset, callee-saved across expf | |
| .LBB29_exp: | |
| add a1, sp, s1 | |
| flw ft0, 0(a1) | |
| flw ft1, 40(sp) | |
| fsub.s ft0, ft0, ft1 | |
| fmv.x.w a0, ft0 | |
| call expf | |
| add a1, sp, s1 | |
| sw a0, 0(a1) # store the returned float bits | |
| addi s1, s1, 4 | |
| bne s1, s2, .LBB29_exp | |
| # Pass 3: left-to-right sum of the exponentials, starting from 0.0. | |
| lui a0, %hi(.LCPI29_1) | |
| addi a0, a0, %lo(.LCPI29_1) | |
| flw ft4, 0(a0) # ft4 = running sum | |
| mv a1, zero | |
| .LBB29_sum: | |
| add a2, sp, a1 | |
| flw ft0, 0(a2) | |
| fadd.s ft4, ft4, ft0 | |
| addi a1, a1, 4 | |
| bne a1, s2, .LBB29_sum | |
| # Pass 4: normalise, storing the last element first. | |
| addi a1, zero, 36 # byte offset of element 9 | |
| .LBB29_div: | |
| add a2, sp, a1 | |
| flw ft0, 0(a2) | |
| fdiv.s ft0, ft0, ft4 | |
| add a2, s0, a1 | |
| fsw ft0, 0(a2) | |
| addi a1, a1, -4 | |
| bgez a1, .LBB29_div | |
| ld s2, 48(sp) | |
| ld s1, 56(sp) | |
| ld s0, 64(sp) | |
| ld ra, 72(sp) | |
| addi sp, sp, 80 | |
| ret | |
| .Lfunc_end29: | |
| .size fuse_softmax_compute_, .Lfunc_end29-fuse_softmax_compute_ | |
| # -- End function | |
| .type __TVMAPISetLastError,@object # @__TVMAPISetLastError: weak, zero-valued 8-byte object in .sbss, aligned to 2^3 bytes. NOTE(review): presumably a slot that receives a function address at load time - confirm against the runtime | |
| .section .sbss,"aw",@nobits | |
| .weak __TVMAPISetLastError | |
| .p2align 3 | |
| __TVMAPISetLastError: | |
| .quad 0 | |
| .size __TVMAPISetLastError, 8 | |
| .type .L.str,@object # @.str: first of a run of read-only, NUL-terminated assert messages (each .size is the text length plus the NUL). This one is the fuse_reshape argument-count text. Where each string is referenced is not visible in this part of the file | |
| .section .rodata,"a",@progbits | |
| .L.str: | |
| .asciz "Assert fail: (num_args == 2), fuse_reshape: num_args should be 2" | |
| .size .L.str, 65 | |
| .type .L.str.1,@object # @.str.1: text for the arg0 strides check (784, 1) | |
| .L.str.1: | |
| .asciz "Assert fail: ((1 == int32(arg0.strides[1])) && (784 == int32(arg0.strides[0]))), arg0.strides: expected to be compact array" | |
| .size .L.str.1, 124 | |
| .type .L.str.2,@object # @.str.2: text for the arg1 strides check (784, 784, 28, 1) | |
| .L.str.2: | |
| .asciz "Assert fail: ((((1 == int32(arg1.strides[3])) && (28 == int32(arg1.strides[2]))) && (784 == int32(arg1.strides[1]))) && (784 == int32(arg1.strides[0]))), arg1.strides: expected to be compact array" | |
| .size .L.str.2, 197 | |
| .type .L.str.3,@object # @.str.3: text for the fuse_reshape arg[0] type-code check (codes 3, 13, 7, 4 accepted) | |
| .L.str.3: | |
| .asciz "Assert fail: ((((arg0.code == 3) || (arg0.code == 13)) || (arg0.code == 7)) || (arg0.code == 4)), fuse_reshape: Expect arg[0] to be pointer" | |
| .size .L.str.3, 140 | |
| .type .L.str.4,@object # @.str.4: text for the fuse_reshape arg[1] type-code check | |
| .L.str.4: | |
| .asciz "Assert fail: ((((arg1.code == 3) || (arg1.code == 13)) || (arg1.code == 7)) || (arg1.code == 4)), fuse_reshape: Expect arg[1] to be pointer" | |
| .size .L.str.4, 140 | |
| .type .L.str.5,@object # @.str.5: text for the dev_type == 1 check (names no function) | |
| .L.str.5: | |
| .asciz "Assert fail: (dev_type == 1), device_type need to be 1" | |
| .size .L.str.5, 55 | |
| .type .L.str.6,@object # @.str.6: text for the arg0.ndim == 2 check | |
| .L.str.6: | |
| .asciz "Assert fail: (2 == tvm_struct_get(arg0, 0, 4)), arg0.ndim is expected to equal 2" | |
| .size .L.str.6, 81 | |
| .type .L.str.7,@object # @.str.7: text for the arg0 dtype check (message says float32 expected) | |
| .L.str.7: | |
| .asciz "Assert fail: (((tvm_struct_get(arg0, 0, 5) == (uint8)2) && (tvm_struct_get(arg0, 0, 6) == (uint8)32)) && (tvm_struct_get(arg0, 0, 7) == (uint16)1)), arg0.dtype is expected to be float32" | |
| .size .L.str.7, 186 | |
| .type .L.str.8,@object # @.str.8: text for the arg0.shape[0] == 1 check | |
| .L.str.8: | |
| .asciz "Assert fail: (int32(arg0.shape[0]) == 1), Argument arg0.shape[0] has an unsatisfied constraint" | |
| .size .L.str.8, 95 | |
| .type .L.str.9,@object # @.str.9: text for the arg0.shape[1] == 784 check | |
| .L.str.9: | |
| .asciz "Assert fail: (int32(arg0.shape[1]) == 784), Argument arg0.shape[1] has an unsatisfied constraint" | |
| .size .L.str.9, 97 | |
| .type .L.str.10,@object # @.str.10: text for the arg0.byte_offset == 0 check | |
| .L.str.10: | |
| .asciz "Assert fail: (tvm_struct_get(arg0, 0, 8) == (uint64)0), Argument arg0.byte_offset has an unsatisfied constraint" | |
| .size .L.str.10, 112 | |
| .type .L.str.11,@object # @.str.11: text for the arg1.ndim == 4 check | |
| .L.str.11: | |
| .asciz "Assert fail: (4 == tvm_struct_get(arg1, 0, 4)), arg1.ndim is expected to equal 4" | |
| .size .L.str.11, 81 | |
| .type .L.str.12,@object # @.str.12: text for the arg1 dtype check (message says float32 expected) | |
| .L.str.12: | |
| .asciz "Assert fail: (((tvm_struct_get(arg1, 0, 5) == (uint8)2) && (tvm_struct_get(arg1, 0, 6) == (uint8)32)) && (tvm_struct_get(arg1, 0, 7) == (uint16)1)), arg1.dtype is expected to be float32" | |
| .size .L.str.12, 186 | |
| .type .L.str.13,@object # @.str.13: text for the arg1.shape[0] == 1 check | |
| .L.str.13: | |
| .asciz "Assert fail: (int32(arg1.shape[0]) == 1), Argument arg1.shape[0] has an unsatisfied constraint" | |
| .size .L.str.13, 95 | |
| .type .L.str.14,@object # @.str.14: text for the arg1.shape[1] == 1 check | |
| .L.str.14: | |
| .asciz "Assert fail: (int32(arg1.shape[1]) == 1), Argument arg1.shape[1] has an unsatisfied constraint" | |
| .size .L.str.14, 95 | |
| .type .L.str.15,@object # @.str.15: text for the arg1.shape[2] == 28 check | |
| .L.str.15: | |
| .asciz "Assert fail: (int32(arg1.shape[2]) == 28), Argument arg1.shape[2] has an unsatisfied constraint" | |
| .size .L.str.15, 96 | |
| .type .L.str.16,@object # @.str.16: text for the arg1.shape[3] == 28 check | |
| .L.str.16: | |
| .asciz "Assert fail: (int32(arg1.shape[3]) == 28), Argument arg1.shape[3] has an unsatisfied constraint" | |
| .size .L.str.16, 96 | |
| .type .L.str.17,@object # @.str.17: text for the arg1.byte_offset == 0 check | |
| .L.str.17: | |
| .asciz "Assert fail: (tvm_struct_get(arg1, 0, 8) == (uint64)0), Argument arg1.byte_offset has an unsatisfied constraint" | |
| .size .L.str.17, 112 | |
| .type .L.str.18,@object # @.str.18: text for the arg1.device_type == 1 check | |
| .L.str.18: | |
| .asciz "Assert fail: (1 == tvm_struct_get(arg1, 0, 10)), Argument arg1.device_type has an unsatisfied constraint" | |
| .size .L.str.18, 105 | |
| .type .L.str.19,@object # @.str.19: text for the arg1.device_id == dev_id check | |
| .L.str.19: | |
| .asciz "Assert fail: (dev_id == tvm_struct_get(arg1, 0, 9)), Argument arg1.device_id has an unsatisfied constraint" | |
| .size .L.str.19, 107 | |
| .type .L.str.20,@object # @.str.20: opens the run of NUL-terminated assert messages that name fuse_conv2d. This one is the argument-count text (4 expected). Later strings in the run name no function and their users are not visible here | |
| .L.str.20: | |
| .asciz "Assert fail: (num_args == 4), fuse_conv2d: num_args should be 4" | |
| .size .L.str.20, 64 | |
| .type .L.str.21,@object # @.str.21: text for the arg0 strides check (784, 784, 28, 1) | |
| .L.str.21: | |
| .asciz "Assert fail: ((((1 == int32(arg0.strides[3])) && (28 == int32(arg0.strides[2]))) && (784 == int32(arg0.strides[1]))) && (784 == int32(arg0.strides[0]))), arg0.strides: expected to be compact array" | |
| .size .L.str.21, 197 | |
| .type .L.str.22,@object # @.str.22: text for the arg1 strides check (25, 25, 5, 1) | |
| .L.str.22: | |
| .asciz "Assert fail: ((((1 == int32(arg1.strides[3])) && (5 == int32(arg1.strides[2]))) && (25 == int32(arg1.strides[1]))) && (25 == int32(arg1.strides[0]))), arg1.strides: expected to be compact array" | |
| .size .L.str.22, 194 | |
| .type .L.str.23,@object # @.str.23: text for the arg2 strides check (single stride of 1) | |
| .L.str.23: | |
| .asciz "Assert fail: (1 == int32(arg2.strides[0])), arg2.strides: expected to be compact array" | |
| .size .L.str.23, 87 | |
| .type .L.str.24,@object # @.str.24: text for the arg3 strides check (25088, 784, 28, 1) | |
| .L.str.24: | |
| .asciz "Assert fail: ((((1 == int32(arg3.strides[3])) && (28 == int32(arg3.strides[2]))) && (784 == int32(arg3.strides[1]))) && (25088 == int32(arg3.strides[0]))), arg3.strides: expected to be compact array" | |
| .size .L.str.24, 199 | |
| .type .L.str.25,@object # @.str.25: text for the fuse_conv2d arg[0] type-code check | |
| .L.str.25: | |
| .asciz "Assert fail: ((((arg0.code == 3) || (arg0.code == 13)) || (arg0.code == 7)) || (arg0.code == 4)), fuse_conv2d: Expect arg[0] to be pointer" | |
| .size .L.str.25, 139 | |
| .type .L.str.26,@object # @.str.26: text for the fuse_conv2d arg[1] type-code check | |
| .L.str.26: | |
| .asciz "Assert fail: ((((arg1.code == 3) || (arg1.code == 13)) || (arg1.code == 7)) || (arg1.code == 4)), fuse_conv2d: Expect arg[1] to be pointer" | |
| .size .L.str.26, 139 | |
| .type .L.str.27,@object # @.str.27: text for the fuse_conv2d arg[2] type-code check | |
| .L.str.27: | |
| .asciz "Assert fail: ((((arg2.code == 3) || (arg2.code == 13)) || (arg2.code == 7)) || (arg2.code == 4)), fuse_conv2d: Expect arg[2] to be pointer" | |
| .size .L.str.27, 139 | |
| .type .L.str.28,@object # @.str.28: text for the fuse_conv2d arg[3] type-code check | |
| .L.str.28: | |
| .asciz "Assert fail: ((((arg3.code == 3) || (arg3.code == 13)) || (arg3.code == 7)) || (arg3.code == 4)), fuse_conv2d: Expect arg[3] to be pointer" | |
| .size .L.str.28, 139 | |
| .type .L.str.29,@object # @.str.29: text for the arg0.ndim == 4 check | |
| .L.str.29: | |
| .asciz "Assert fail: (4 == tvm_struct_get(arg0, 0, 4)), arg0.ndim is expected to equal 4" | |
| .size .L.str.29, 81 | |
| .type .L.str.30,@object # @.str.30: text for the arg0.shape[1] == 1 check | |
| .L.str.30: | |
| .asciz "Assert fail: (int32(arg0.shape[1]) == 1), Argument arg0.shape[1] has an unsatisfied constraint" | |
| .size .L.str.30, 95 | |
| .type .L.str.31,@object # @.str.31: text for the arg0.shape[2] == 28 check | |
| .L.str.31: | |
| .asciz "Assert fail: (int32(arg0.shape[2]) == 28), Argument arg0.shape[2] has an unsatisfied constraint" | |
| .size .L.str.31, 96 | |
| .type .L.str.32,@object # @.str.32: text for the arg0.shape[3] == 28 check | |
| .L.str.32: | |
| .asciz "Assert fail: (int32(arg0.shape[3]) == 28), Argument arg0.shape[3] has an unsatisfied constraint" | |
| .size .L.str.32, 96 | |
| .type .L.str.33,@object # @.str.33: text for the arg1.shape[0] == 32 check | |
| .L.str.33: | |
| .asciz "Assert fail: (int32(arg1.shape[0]) == 32), Argument arg1.shape[0] has an unsatisfied constraint" | |
| .size .L.str.33, 96 | |
| .type .L.str.34,@object # @.str.34: text for the arg1.shape[2] == 5 check | |
| .L.str.34: | |
| .asciz "Assert fail: (int32(arg1.shape[2]) == 5), Argument arg1.shape[2] has an unsatisfied constraint" | |
| .size .L.str.34, 95 | |
| .type .L.str.35,@object # @.str.35: text for the arg1.shape[3] == 5 check | |
| .L.str.35: | |
| .asciz "Assert fail: (int32(arg1.shape[3]) == 5), Argument arg1.shape[3] has an unsatisfied constraint" | |
| .size .L.str.35, 95 | |
| .type .L.str.36,@object # @.str.36: text for the arg2.ndim == 1 check | |
| .L.str.36: | |
| .asciz "Assert fail: (1 == tvm_struct_get(arg2, 0, 4)), arg2.ndim is expected to equal 1" | |
| .size .L.str.36, 81 | |
| .type .L.str.37,@object # @.str.37: text for the arg2 dtype check (message says float32 expected) | |
| .L.str.37: | |
| .asciz "Assert fail: (((tvm_struct_get(arg2, 0, 5) == (uint8)2) && (tvm_struct_get(arg2, 0, 6) == (uint8)32)) && (tvm_struct_get(arg2, 0, 7) == (uint16)1)), arg2.dtype is expected to be float32" | |
| .size .L.str.37, 186 | |
| .type .L.str.38,@object # @.str.38: text for the arg2.shape[0] == 32 check | |
| .L.str.38: | |
| .asciz "Assert fail: (int32(arg2.shape[0]) == 32), Argument arg2.shape[0] has an unsatisfied constraint" | |
| .size .L.str.38, 96 | |
| .type .L.str.39,@object # @.str.39: text for the arg2.byte_offset == 0 check | |
| .L.str.39: | |
| .asciz "Assert fail: (tvm_struct_get(arg2, 0, 8) == (uint64)0), Argument arg2.byte_offset has an unsatisfied constraint" | |
| .size .L.str.39, 112 | |
| .type .L.str.40,@object # @.str.40: text for the arg2.device_type == 1 check | |
| .L.str.40: | |
| .asciz "Assert fail: (1 == tvm_struct_get(arg2, 0, 10)), Argument arg2.device_type has an unsatisfied constraint" | |
| .size .L.str.40, 105 | |
| .type .L.str.41,@object # @.str.41: text for the arg2.device_id == dev_id check | |
| .L.str.41: | |
| .asciz "Assert fail: (dev_id == tvm_struct_get(arg2, 0, 9)), Argument arg2.device_id has an unsatisfied constraint" | |
| .size .L.str.41, 107 | |
| .type .L.str.42,@object # @.str.42: text for the arg3.ndim == 4 check | |
| .L.str.42: | |
| .asciz "Assert fail: (4 == tvm_struct_get(arg3, 0, 4)), arg3.ndim is expected to equal 4" | |
| .size .L.str.42, 81 | |
| .type .L.str.43,@object # @.str.43: text for the arg3 dtype check (message says float32 expected) | |
| .L.str.43: | |
| .asciz "Assert fail: (((tvm_struct_get(arg3, 0, 5) == (uint8)2) && (tvm_struct_get(arg3, 0, 6) == (uint8)32)) && (tvm_struct_get(arg3, 0, 7) == (uint16)1)), arg3.dtype is expected to be float32" | |
| .size .L.str.43, 186 | |
| .type .L.str.44,@object # @.str.44: text for the arg3.shape[0] == 1 check | |
| .L.str.44: | |
| .asciz "Assert fail: (int32(arg3.shape[0]) == 1), Argument arg3.shape[0] has an unsatisfied constraint" | |
| .size .L.str.44, 95 | |
| .type .L.str.45,@object # @.str.45: text for the arg3.shape[1] == 32 check | |
| .L.str.45: | |
| .asciz "Assert fail: (int32(arg3.shape[1]) == 32), Argument arg3.shape[1] has an unsatisfied constraint" | |
| .size .L.str.45, 96 | |
| .type .L.str.46,@object # @.str.46: text for the arg3.shape[2] == 28 check | |
| .L.str.46: | |
| .asciz "Assert fail: (int32(arg3.shape[2]) == 28), Argument arg3.shape[2] has an unsatisfied constraint" | |
| .size .L.str.46, 96 | |
| .type .L.str.47,@object # @.str.47: text for the arg3.shape[3] == 28 check | |
| .L.str.47: | |
| .asciz "Assert fail: (int32(arg3.shape[3]) == 28), Argument arg3.shape[3] has an unsatisfied constraint" | |
| .size .L.str.47, 96 | |
| .type .L.str.48,@object # @.str.48: text for the arg3.byte_offset == 0 check | |
| .L.str.48: | |
| .asciz "Assert fail: (tvm_struct_get(arg3, 0, 8) == (uint64)0), Argument arg3.byte_offset has an unsatisfied constraint" | |
| .size .L.str.48, 112 | |
| .type .L.str.49,@object # @.str.49: text for the arg3.device_type == 1 check | |
| .L.str.49: | |
| .asciz "Assert fail: (1 == tvm_struct_get(arg3, 0, 10)), Argument arg3.device_type has an unsatisfied constraint" | |
| .size .L.str.49, 105 | |
| .type .L.str.50,@object # @.str.50: text for the arg3.device_id == dev_id check | |
| .L.str.50: | |
| .asciz "Assert fail: (dev_id == tvm_struct_get(arg3, 0, 9)), Argument arg3.device_id has an unsatisfied constraint" | |
| .size .L.str.50, 107 | |
| .type __TVMBackendAllocWorkspace,@object # @__TVMBackendAllocWorkspace: weak, zero-valued 8-byte object in .sbss, aligned to 2^3 bytes. NOTE(review): presumably a slot that receives the allocator's address at load time - confirm against the runtime | |
| .section .sbss,"aw",@nobits | |
| .weak __TVMBackendAllocWorkspace | |
| .p2align 3 | |
| __TVMBackendAllocWorkspace: | |
| .quad 0 | |
| .size __TVMBackendAllocWorkspace, 8 | |
| .type __TVMBackendFreeWorkspace,@object # @__TVMBackendFreeWorkspace: weak, zero-valued 8-byte object aligned to 2^3 bytes, emitted in whatever section is current (no .section directive of its own). NOTE(review): presumably a slot that receives the deallocator's address at load time - confirm against the runtime | |
| .weak __TVMBackendFreeWorkspace | |
| .p2align 3 | |
| __TVMBackendFreeWorkspace: | |
| .quad 0 | |
| .size __TVMBackendFreeWorkspace, 8 | |
| .type .L.str.51,@object # @.str.51: opens the run of NUL-terminated assert messages that name fuse_relu, after switching back to .rodata. This one is the argument-count text (2 expected) | |
| .section .rodata,"a",@progbits | |
| .L.str.51: | |
| .asciz "Assert fail: (num_args == 2), fuse_relu: num_args should be 2" | |
| .size .L.str.51, 62 | |
| .type .L.str.52,@object # @.str.52: text for the arg0 strides check (single stride of 1) | |
| .L.str.52: | |
| .asciz "Assert fail: (1 == int32(arg0.strides[0])), arg0.strides: expected to be compact array" | |
| .size .L.str.52, 87 | |
| .type .L.str.53,@object # @.str.53: text for the arg1 strides check (single stride of 1) | |
| .L.str.53: | |
| .asciz "Assert fail: (1 == int32(arg1.strides[0])), arg1.strides: expected to be compact array" | |
| .size .L.str.53, 87 | |
| .type .L.str.54,@object # @.str.54: text for the fuse_relu arg[0] type-code check | |
| .L.str.54: | |
| .asciz "Assert fail: ((((arg0.code == 3) || (arg0.code == 13)) || (arg0.code == 7)) || (arg0.code == 4)), fuse_relu: Expect arg[0] to be pointer" | |
| .size .L.str.54, 137 | |
| .type .L.str.55,@object # @.str.55: text for the fuse_relu arg[1] type-code check | |
| .L.str.55: | |
| .asciz "Assert fail: ((((arg1.code == 3) || (arg1.code == 13)) || (arg1.code == 7)) || (arg1.code == 4)), fuse_relu: Expect arg[1] to be pointer" | |
| .size .L.str.55, 137 | |
| .type .L.str.56,@object # @.str.56: text for the arg0.ndim == 1 check | |
| .L.str.56: | |
| .asciz "Assert fail: (1 == tvm_struct_get(arg0, 0, 4)), arg0.ndim is expected to equal 1" | |
| .size .L.str.56, 81 | |
| .type .L.str.57,@object # @.str.57: text for the arg0.shape[0] == 25088 check | |
| .L.str.57: | |
| .asciz "Assert fail: (int32(arg0.shape[0]) == 25088), Argument arg0.shape[0] has an unsatisfied constraint" | |
| .size .L.str.57, 99 | |
| .type .L.str.58,@object # @.str.58: text for the arg1.ndim == 1 check | |
| .L.str.58: | |
| .asciz "Assert fail: (1 == tvm_struct_get(arg1, 0, 4)), arg1.ndim is expected to equal 1" | |
| .size .L.str.58, 81 | |
| .type .L.str.59,@object # @.str.59: text for the arg1.shape[0] == 25088 check | |
| .L.str.59: | |
| .asciz "Assert fail: (int32(arg1.shape[0]) == 25088), Argument arg1.shape[0] has an unsatisfied constraint" | |
| .size .L.str.59, 99 | |
| .type .L.str.60,@object # @.str.60: opens the run of NUL-terminated assert messages that name fuse_max_pool2d. This one is the argument-count text (2 expected) | |
| .L.str.60: | |
| .asciz "Assert fail: (num_args == 2), fuse_max_pool2d: num_args should be 2" | |
| .size .L.str.60, 68 | |
| .type .L.str.61,@object # @.str.61: text for the arg0 strides check (25088, 784, 28, 1) | |
| .L.str.61: | |
| .asciz "Assert fail: ((((1 == int32(arg0.strides[3])) && (28 == int32(arg0.strides[2]))) && (784 == int32(arg0.strides[1]))) && (25088 == int32(arg0.strides[0]))), arg0.strides: expected to be compact array" | |
| .size .L.str.61, 199 | |
| .type .L.str.62,@object # @.str.62: text for the arg1 strides check (6272, 196, 14, 1) | |
| .L.str.62: | |
| .asciz "Assert fail: ((((1 == int32(arg1.strides[3])) && (14 == int32(arg1.strides[2]))) && (196 == int32(arg1.strides[1]))) && (6272 == int32(arg1.strides[0]))), arg1.strides: expected to be compact array" | |
| .size .L.str.62, 198 | |
| .type .L.str.63,@object # @.str.63: text for the fuse_max_pool2d arg[0] type-code check | |
| .L.str.63: | |
| .asciz "Assert fail: ((((arg0.code == 3) || (arg0.code == 13)) || (arg0.code == 7)) || (arg0.code == 4)), fuse_max_pool2d: Expect arg[0] to be pointer" | |
| .size .L.str.63, 143 | |
| .type .L.str.64,@object # @.str.64: text for the fuse_max_pool2d arg[1] type-code check | |
| .L.str.64: | |
| .asciz "Assert fail: ((((arg1.code == 3) || (arg1.code == 13)) || (arg1.code == 7)) || (arg1.code == 4)), fuse_max_pool2d: Expect arg[1] to be pointer" | |
| .size .L.str.64, 143 | |
| .type .L.str.65,@object # @.str.65: text for the arg0.shape[1] == 32 check | |
| .L.str.65: | |
| .asciz "Assert fail: (int32(arg0.shape[1]) == 32), Argument arg0.shape[1] has an unsatisfied constraint" | |
| .size .L.str.65, 96 | |
| .type .L.str.66,@object # @.str.66: text for the arg1.shape[1] == 32 check | |
| .L.str.66: | |
| .asciz "Assert fail: (int32(arg1.shape[1]) == 32), Argument arg1.shape[1] has an unsatisfied constraint" | |
| .size .L.str.66, 96 | |
| .type .L.str.67,@object # @.str.67: text for the arg1.shape[2] == 14 check | |
| .L.str.67: | |
| .asciz "Assert fail: (int32(arg1.shape[2]) == 14), Argument arg1.shape[2] has an unsatisfied constraint" | |
| .size .L.str.67, 96 | |
| .type .L.str.68,@object # @.str.68: text for the arg1.shape[3] == 14 check | |
| .L.str.68: | |
| .asciz "Assert fail: (int32(arg1.shape[3]) == 14), Argument arg1.shape[3] has an unsatisfied constraint" | |
| .size .L.str.68, 96 | |
| .type .L.str.69,@object # @.str.69: opens the run of NUL-terminated assert messages that name fuse_conv2d_1. This one is the argument-count text (4 expected) | |
| .L.str.69: | |
| .asciz "Assert fail: (num_args == 4), fuse_conv2d_1: num_args should be 4" | |
| .size .L.str.69, 66 | |
| .type .L.str.70,@object # @.str.70: text for the arg0 strides check (6272, 196, 14, 1) | |
| .L.str.70: | |
| .asciz "Assert fail: ((((1 == int32(arg0.strides[3])) && (14 == int32(arg0.strides[2]))) && (196 == int32(arg0.strides[1]))) && (6272 == int32(arg0.strides[0]))), arg0.strides: expected to be compact array" | |
| .size .L.str.70, 198 | |
| .type .L.str.71,@object # @.str.71: text for the arg1 strides check (800, 25, 5, 1) | |
| .L.str.71: | |
| .asciz "Assert fail: ((((1 == int32(arg1.strides[3])) && (5 == int32(arg1.strides[2]))) && (25 == int32(arg1.strides[1]))) && (800 == int32(arg1.strides[0]))), arg1.strides: expected to be compact array" | |
| .size .L.str.71, 195 | |
| .type .L.str.72,@object # @.str.72: text for the arg3 strides check (12544, 196, 14, 1) | |
| .L.str.72: | |
| .asciz "Assert fail: ((((1 == int32(arg3.strides[3])) && (14 == int32(arg3.strides[2]))) && (196 == int32(arg3.strides[1]))) && (12544 == int32(arg3.strides[0]))), arg3.strides: expected to be compact array" | |
| .size .L.str.72, 199 | |
| .type .L.str.73,@object # @.str.73: text for the fuse_conv2d_1 arg[0] type-code check | |
| .L.str.73: | |
| .asciz "Assert fail: ((((arg0.code == 3) || (arg0.code == 13)) || (arg0.code == 7)) || (arg0.code == 4)), fuse_conv2d_1: Expect arg[0] to be pointer" | |
| .size .L.str.73, 141 | |
| .type .L.str.74,@object # @.str.74: text for the fuse_conv2d_1 arg[1] type-code check | |
| .L.str.74: | |
| .asciz "Assert fail: ((((arg1.code == 3) || (arg1.code == 13)) || (arg1.code == 7)) || (arg1.code == 4)), fuse_conv2d_1: Expect arg[1] to be pointer" | |
| .size .L.str.74, 141 | |
| .type .L.str.75,@object # @.str.75: text for the fuse_conv2d_1 arg[2] type-code check | |
| .L.str.75: | |
| .asciz "Assert fail: ((((arg2.code == 3) || (arg2.code == 13)) || (arg2.code == 7)) || (arg2.code == 4)), fuse_conv2d_1: Expect arg[2] to be pointer" | |
| .size .L.str.75, 141 | |
| .type .L.str.76,@object # @.str.76: text for the fuse_conv2d_1 arg[3] type-code check | |
| .L.str.76: | |
| .asciz "Assert fail: ((((arg3.code == 3) || (arg3.code == 13)) || (arg3.code == 7)) || (arg3.code == 4)), fuse_conv2d_1: Expect arg[3] to be pointer" | |
| .size .L.str.76, 141 | |
| .type .L.str.77,@object # @.str.77: text for the arg0.shape[2] == 14 check | |
| .L.str.77: | |
| .asciz "Assert fail: (int32(arg0.shape[2]) == 14), Argument arg0.shape[2] has an unsatisfied constraint" | |
| .size .L.str.77, 96 | |
| .type .L.str.78,@object # @.str.78: text for the arg0.shape[3] == 14 check | |
| .L.str.78: | |
| .asciz "Assert fail: (int32(arg0.shape[3]) == 14), Argument arg0.shape[3] has an unsatisfied constraint" | |
| .size .L.str.78, 96 | |
| .type .L.str.79,@object # @.str.79: text for the arg1.shape[0] == 64 check | |
| .L.str.79: | |
| .asciz "Assert fail: (int32(arg1.shape[0]) == 64), Argument arg1.shape[0] has an unsatisfied constraint" | |
| .size .L.str.79, 96 | |
| .type .L.str.80,@object # @.str.80: text for the arg2.shape[0] == 64 check | |
| .L.str.80: | |
| .asciz "Assert fail: (int32(arg2.shape[0]) == 64), Argument arg2.shape[0] has an unsatisfied constraint" | |
| .size .L.str.80, 96 | |
| .type .L.str.81,@object # @.str.81: text for the arg3.shape[1] == 64 check | |
| .L.str.81: | |
| .asciz "Assert fail: (int32(arg3.shape[1]) == 64), Argument arg3.shape[1] has an unsatisfied constraint" | |
| .size .L.str.81, 96 | |
| .type .L.str.82,@object # @.str.82: text for the arg3.shape[2] == 14 check | |
| .L.str.82: | |
| .asciz "Assert fail: (int32(arg3.shape[2]) == 14), Argument arg3.shape[2] has an unsatisfied constraint" | |
| .size .L.str.82, 96 | |
| .type .L.str.83,@object # @.str.83: text for the arg3.shape[3] == 14 check | |
| .L.str.83: | |
| .asciz "Assert fail: (int32(arg3.shape[3]) == 14), Argument arg3.shape[3] has an unsatisfied constraint" | |
| .size .L.str.83, 96 | |
| .type .L.str.84,@object # @.str.84: opens the run of NUL-terminated assert messages that name fuse_relu_1. This one is the argument-count text (2 expected) | |
| .L.str.84: | |
| .asciz "Assert fail: (num_args == 2), fuse_relu_1: num_args should be 2" | |
| .size .L.str.84, 64 | |
| .type .L.str.85,@object # @.str.85: text for the fuse_relu_1 arg[0] type-code check | |
| .L.str.85: | |
| .asciz "Assert fail: ((((arg0.code == 3) || (arg0.code == 13)) || (arg0.code == 7)) || (arg0.code == 4)), fuse_relu_1: Expect arg[0] to be pointer" | |
| .size .L.str.85, 139 | |
| .type .L.str.86,@object # @.str.86: text for the fuse_relu_1 arg[1] type-code check | |
| .L.str.86: | |
| .asciz "Assert fail: ((((arg1.code == 3) || (arg1.code == 13)) || (arg1.code == 7)) || (arg1.code == 4)), fuse_relu_1: Expect arg[1] to be pointer" | |
| .size .L.str.86, 139 | |
| .type .L.str.87,@object # @.str.87: text for the arg0.shape[0] == 12544 check | |
| .L.str.87: | |
| .asciz "Assert fail: (int32(arg0.shape[0]) == 12544), Argument arg0.shape[0] has an unsatisfied constraint" | |
| .size .L.str.87, 99 | |
| .type .L.str.88,@object # @.str.88: text for the arg1.shape[0] == 12544 check | |
| .L.str.88: | |
| .asciz "Assert fail: (int32(arg1.shape[0]) == 12544), Argument arg1.shape[0] has an unsatisfied constraint" | |
| .size .L.str.88, 99 | |
| .type .L.str.89,@object # @.str.89: opens the run of NUL-terminated assert messages that name fuse_max_pool2d_1. This one is the argument-count text (2 expected) | |
| .L.str.89: | |
| .asciz "Assert fail: (num_args == 2), fuse_max_pool2d_1: num_args should be 2" | |
| .size .L.str.89, 70 | |
| .type .L.str.90,@object # @.str.90: text for the arg0 strides check (12544, 196, 14, 1) | |
| .L.str.90: | |
| .asciz "Assert fail: ((((1 == int32(arg0.strides[3])) && (14 == int32(arg0.strides[2]))) && (196 == int32(arg0.strides[1]))) && (12544 == int32(arg0.strides[0]))), arg0.strides: expected to be compact array" | |
| .size .L.str.90, 199 | |
| .type .L.str.91,@object # @.str.91: text for the arg1 strides check (3136, 49, 7, 1) | |
| .L.str.91: | |
| .asciz "Assert fail: ((((1 == int32(arg1.strides[3])) && (7 == int32(arg1.strides[2]))) && (49 == int32(arg1.strides[1]))) && (3136 == int32(arg1.strides[0]))), arg1.strides: expected to be compact array" | |
| .size .L.str.91, 196 | |
| .type .L.str.92,@object # @.str.92: text for the fuse_max_pool2d_1 arg[0] type-code check | |
| .L.str.92: | |
| .asciz "Assert fail: ((((arg0.code == 3) || (arg0.code == 13)) || (arg0.code == 7)) || (arg0.code == 4)), fuse_max_pool2d_1: Expect arg[0] to be pointer" | |
| .size .L.str.92, 145 | |
| .type .L.str.93,@object # @.str.93: text for the fuse_max_pool2d_1 arg[1] type-code check | |
| .L.str.93: | |
| .asciz "Assert fail: ((((arg1.code == 3) || (arg1.code == 13)) || (arg1.code == 7)) || (arg1.code == 4)), fuse_max_pool2d_1: Expect arg[1] to be pointer" | |
| .size .L.str.93, 145 | |
| .type .L.str.94,@object # @.str.94: text for the arg0.shape[1] == 64 check | |
| .L.str.94: | |
| .asciz "Assert fail: (int32(arg0.shape[1]) == 64), Argument arg0.shape[1] has an unsatisfied constraint" | |
| .size .L.str.94, 96 | |
| .type .L.str.95,@object # @.str.95: text for the arg1.shape[1] == 64 check | |
| .L.str.95: | |
| .asciz "Assert fail: (int32(arg1.shape[1]) == 64), Argument arg1.shape[1] has an unsatisfied constraint" | |
| .size .L.str.95, 96 | |
| .type .L.str.96,@object # @.str.96: text for the arg1.shape[2] == 7 check | |
| .L.str.96: | |
| .asciz "Assert fail: (int32(arg1.shape[2]) == 7), Argument arg1.shape[2] has an unsatisfied constraint" | |
| .size .L.str.96, 95 | |
| .type .L.str.97,@object # @.str.97: text for the arg1.shape[3] == 7 check | |
| .L.str.97: | |
| .asciz "Assert fail: (int32(arg1.shape[3]) == 7), Argument arg1.shape[3] has an unsatisfied constraint" | |
| .size .L.str.97, 95 | |
| .type .L.str.98,@object # @.str.98: opens the run of NUL-terminated assert messages that name fuse_transpose. This one is the argument-count text (2 expected) | |
| .L.str.98: | |
| .asciz "Assert fail: (num_args == 2), fuse_transpose: num_args should be 2" | |
| .size .L.str.98, 67 | |
| .type .L.str.99,@object # @.str.99: text for the arg0 strides check (3136, 49, 7, 1) | |
| .L.str.99: | |
| .asciz "Assert fail: ((((1 == int32(arg0.strides[3])) && (7 == int32(arg0.strides[2]))) && (49 == int32(arg0.strides[1]))) && (3136 == int32(arg0.strides[0]))), arg0.strides: expected to be compact array" | |
| .size .L.str.99, 196 | |
| .type .L.str.100,@object # @.str.100: text for the arg1 strides check (3136, 448, 64, 1) | |
| .L.str.100: | |
| .asciz "Assert fail: ((((1 == int32(arg1.strides[3])) && (64 == int32(arg1.strides[2]))) && (448 == int32(arg1.strides[1]))) && (3136 == int32(arg1.strides[0]))), arg1.strides: expected to be compact array" | |
| .size .L.str.100, 198 | |
| .type .L.str.101,@object # @.str.101: text for the fuse_transpose arg[0] type-code check | |
| .L.str.101: | |
| .asciz "Assert fail: ((((arg0.code == 3) || (arg0.code == 13)) || (arg0.code == 7)) || (arg0.code == 4)), fuse_transpose: Expect arg[0] to be pointer" | |
| .size .L.str.101, 142 | |
| .type .L.str.102,@object # @.str.102: text for the fuse_transpose arg[1] type-code check | |
| .L.str.102: | |
| .asciz "Assert fail: ((((arg1.code == 3) || (arg1.code == 13)) || (arg1.code == 7)) || (arg1.code == 4)), fuse_transpose: Expect arg[1] to be pointer" | |
| .size .L.str.102, 142 | |
| .type .L.str.103,@object # @.str.103: text for the arg0.shape[2] == 7 check | |
| .L.str.103: | |
| .asciz "Assert fail: (int32(arg0.shape[2]) == 7), Argument arg0.shape[2] has an unsatisfied constraint" | |
| .size .L.str.103, 95 | |
| .type .L.str.104,@object # @.str.104: text for the arg0.shape[3] == 7 check | |
| .L.str.104: | |
| .asciz "Assert fail: (int32(arg0.shape[3]) == 7), Argument arg0.shape[3] has an unsatisfied constraint" | |
| .size .L.str.104, 95 | |
| .type .L.str.105,@object # @.str.105: text for the arg1.shape[1] == 7 check | |
| .L.str.105: | |
| .asciz "Assert fail: (int32(arg1.shape[1]) == 7), Argument arg1.shape[1] has an unsatisfied constraint" | |
| .size .L.str.105, 95 | |
| .type .L.str.106,@object # @.str.106: text for the arg1.shape[3] == 64 check | |
| .L.str.106: | |
| .asciz "Assert fail: (int32(arg1.shape[3]) == 64), Argument arg1.shape[3] has an unsatisfied constraint" | |
| .size .L.str.106, 96 | |
| .type .L.str.107,@object # @.str.107: opens the run of NUL-terminated assert messages that name fuse_reshape_1. This one is the argument-count text (2 expected) | |
| .L.str.107: | |
| .asciz "Assert fail: (num_args == 2), fuse_reshape_1: num_args should be 2" | |
| .size .L.str.107, 67 | |
| .type .L.str.108,@object # @.str.108: text for the arg0 strides check (3136, 448, 64, 1) | |
| .L.str.108: | |
| .asciz "Assert fail: ((((1 == int32(arg0.strides[3])) && (64 == int32(arg0.strides[2]))) && (448 == int32(arg0.strides[1]))) && (3136 == int32(arg0.strides[0]))), arg0.strides: expected to be compact array" | |
| .size .L.str.108, 198 | |
| .type .L.str.109,@object # @.str.109: text for the arg1 strides check (3136, 1) | |
| .L.str.109: | |
| .asciz "Assert fail: ((1 == int32(arg1.strides[1])) && (3136 == int32(arg1.strides[0]))), arg1.strides: expected to be compact array" | |
| .size .L.str.109, 125 | |
| .type .L.str.110,@object # @.str.110: text for the fuse_reshape_1 arg[0] type-code check | |
| .L.str.110: | |
| .asciz "Assert fail: ((((arg0.code == 3) || (arg0.code == 13)) || (arg0.code == 7)) || (arg0.code == 4)), fuse_reshape_1: Expect arg[0] to be pointer" | |
| .size .L.str.110, 142 | |
| .type .L.str.111,@object # @.str.111: text for the fuse_reshape_1 arg[1] type-code check | |
| .L.str.111: | |
| .asciz "Assert fail: ((((arg1.code == 3) || (arg1.code == 13)) || (arg1.code == 7)) || (arg1.code == 4)), fuse_reshape_1: Expect arg[1] to be pointer" | |
| .size .L.str.111, 142 | |
| .type .L.str.112,@object # @.str.112: text for the arg0.shape[1] == 7 check | |
| .L.str.112: | |
| .asciz "Assert fail: (int32(arg0.shape[1]) == 7), Argument arg0.shape[1] has an unsatisfied constraint" | |
| .size .L.str.112, 95 | |
| .type .L.str.113,@object # @.str.113: text for the arg0.shape[3] == 64 check | |
| .L.str.113: | |
| .asciz "Assert fail: (int32(arg0.shape[3]) == 64), Argument arg0.shape[3] has an unsatisfied constraint" | |
| .size .L.str.113, 96 | |
| .type .L.str.114,@object # @.str.114: text for the arg1.ndim == 2 check | |
| .L.str.114: | |
| .asciz "Assert fail: (2 == tvm_struct_get(arg1, 0, 4)), arg1.ndim is expected to equal 2" | |
| .size .L.str.114, 81 | |
| .type .L.str.115,@object # @.str.115: text for the arg1.shape[1] == 3136 check | |
| .L.str.115: | |
| .asciz "Assert fail: (int32(arg1.shape[1]) == 3136), Argument arg1.shape[1] has an unsatisfied constraint" | |
| .size .L.str.115, 98 | |
| .type .L.str.116,@object # @.str.116: opens the run of NUL-terminated assert messages that name fuse_matmul. This one is the argument-count text (3 expected) | |
| .L.str.116: | |
| .asciz "Assert fail: (num_args == 3), fuse_matmul: num_args should be 3" | |
| .size .L.str.116, 64 | |
| .type .L.str.117,@object # @.str.117: text for the arg0 strides check (3136, 1) | |
| .L.str.117: | |
| .asciz "Assert fail: ((1 == int32(arg0.strides[1])) && (3136 == int32(arg0.strides[0]))), arg0.strides: expected to be compact array" | |
| .size .L.str.117, 125 | |
| .type .L.str.118,@object # @.str.118: text for the arg1 strides check (100, 1) | |
| .L.str.118: | |
| .asciz "Assert fail: ((1 == int32(arg1.strides[1])) && (100 == int32(arg1.strides[0]))), arg1.strides: expected to be compact array" | |
| .size .L.str.118, 124 | |
| .type .L.str.119,@object # @.str.119: text for the arg2 strides check (100, 1) | |
| .L.str.119: | |
| .asciz "Assert fail: ((1 == int32(arg2.strides[1])) && (100 == int32(arg2.strides[0]))), arg2.strides: expected to be compact array" | |
| .size .L.str.119, 124 | |
| .type .L.str.120,@object # @.str.120: text for the fuse_matmul arg[0] type-code check | |
| .L.str.120: | |
| .asciz "Assert fail: ((((arg0.code == 3) || (arg0.code == 13)) || (arg0.code == 7)) || (arg0.code == 4)), fuse_matmul: Expect arg[0] to be pointer" | |
| .size .L.str.120, 139 | |
| .type .L.str.121,@object # @.str.121: text for the fuse_matmul arg[1] type-code check | |
| .L.str.121: | |
| .asciz "Assert fail: ((((arg1.code == 3) || (arg1.code == 13)) || (arg1.code == 7)) || (arg1.code == 4)), fuse_matmul: Expect arg[1] to be pointer" | |
| .size .L.str.121, 139 | |
| .type .L.str.122,@object # @.str.122: text for the fuse_matmul arg[2] type-code check | |
| .L.str.122: | |
| .asciz "Assert fail: ((((arg2.code == 3) || (arg2.code == 13)) || (arg2.code == 7)) || (arg2.code == 4)), fuse_matmul: Expect arg[2] to be pointer" | |
| .size .L.str.122, 139 | |
| .type .L.str.123,@object # @.str.123: text for the arg0.shape[1] == 3136 check | |
| .L.str.123: | |
| .asciz "Assert fail: (int32(arg0.shape[1]) == 3136), Argument arg0.shape[1] has an unsatisfied constraint" | |
| .size .L.str.123, 98 | |
| .type .L.str.124,@object # @.str.124: text for the arg1.shape[0] == 3136 check | |
| .L.str.124: | |
| .asciz "Assert fail: (int32(arg1.shape[0]) == 3136), Argument arg1.shape[0] has an unsatisfied constraint" | |
| .size .L.str.124, 98 | |
| .type .L.str.125,@object # @.str.125: text for the arg1.shape[1] == 100 check | |
| .L.str.125: | |
| .asciz "Assert fail: (int32(arg1.shape[1]) == 100), Argument arg1.shape[1] has an unsatisfied constraint" | |
| .size .L.str.125, 97 | |
| .type .L.str.126,@object # @.str.126: text for the arg2.ndim == 2 check | |
| .L.str.126: | |
| .asciz "Assert fail: (2 == tvm_struct_get(arg2, 0, 4)), arg2.ndim is expected to equal 2" | |
| .size .L.str.126, 81 | |
| .type .L.str.127,@object # @.str.127: text for the arg2.shape[0] == 1 check | |
| .L.str.127: | |
| .asciz "Assert fail: (int32(arg2.shape[0]) == 1), Argument arg2.shape[0] has an unsatisfied constraint" | |
| .size .L.str.127, 95 | |
| .type .L.str.128,@object # @.str.128: text for the arg2.shape[1] == 100 check | |
| .L.str.128: | |
| .asciz "Assert fail: (int32(arg2.shape[1]) == 100), Argument arg2.shape[1] has an unsatisfied constraint" | |
| .size .L.str.128, 97 | |
| .type .L.str.129,@object # @.str.129: opens the run of NUL-terminated assert messages that name fuse_elemwise_add. This one is the argument-count text (3 expected) | |
| .L.str.129: | |
| .asciz "Assert fail: (num_args == 3), fuse_elemwise_add: num_args should be 3" | |
| .size .L.str.129, 70 | |
| .type .L.str.130,@object # @.str.130: text for the fuse_elemwise_add arg[0] type-code check | |
| .L.str.130: | |
| .asciz "Assert fail: ((((arg0.code == 3) || (arg0.code == 13)) || (arg0.code == 7)) || (arg0.code == 4)), fuse_elemwise_add: Expect arg[0] to be pointer" | |
| .size .L.str.130, 145 | |
| .type .L.str.131,@object # @.str.131: text for the fuse_elemwise_add arg[1] type-code check | |
| .L.str.131: | |
| .asciz "Assert fail: ((((arg1.code == 3) || (arg1.code == 13)) || (arg1.code == 7)) || (arg1.code == 4)), fuse_elemwise_add: Expect arg[1] to be pointer" | |
| .size .L.str.131, 145 | |
| .type .L.str.132,@object # @.str.132: text for the fuse_elemwise_add arg[2] type-code check | |
| .L.str.132: | |
| .asciz "Assert fail: ((((arg2.code == 3) || (arg2.code == 13)) || (arg2.code == 7)) || (arg2.code == 4)), fuse_elemwise_add: Expect arg[2] to be pointer" | |
| .size .L.str.132, 145 | |
| .type .L.str.133,@object # @.str.133: text for the arg0.shape[0] == 100 check | |
| .L.str.133: | |
| .asciz "Assert fail: (int32(arg0.shape[0]) == 100), Argument arg0.shape[0] has an unsatisfied constraint" | |
| .size .L.str.133, 97 | |
| .type .L.str.134,@object # @.str.134: text for the arg1.shape[0] == 100 check | |
| .L.str.134: | |
| .asciz "Assert fail: (int32(arg1.shape[0]) == 100), Argument arg1.shape[0] has an unsatisfied constraint" | |
| .size .L.str.134, 97 | |
| .type .L.str.135,@object # @.str.135: text for the arg2.shape[0] == 100 check | |
| .L.str.135: | |
| .asciz "Assert fail: (int32(arg2.shape[0]) == 100), Argument arg2.shape[0] has an unsatisfied constraint" | |
| .size .L.str.135, 97 | |
| .type .L.str.136,@object # @.str.136: opens the run of NUL-terminated assert messages that name fuse_sigmoid. This one is the argument-count text (2 expected) | |
| .L.str.136: | |
| .asciz "Assert fail: (num_args == 2), fuse_sigmoid: num_args should be 2" | |
| .size .L.str.136, 65 | |
| .type .L.str.137,@object # @.str.137: text for the fuse_sigmoid arg[0] type-code check | |
| .L.str.137: | |
| .asciz "Assert fail: ((((arg0.code == 3) || (arg0.code == 13)) || (arg0.code == 7)) || (arg0.code == 4)), fuse_sigmoid: Expect arg[0] to be pointer" | |
| .size .L.str.137, 140 | |
| .type .L.str.138,@object # @.str.138: text for the fuse_sigmoid arg[1] type-code check | |
| .L.str.138: | |
| .asciz "Assert fail: ((((arg1.code == 3) || (arg1.code == 13)) || (arg1.code == 7)) || (arg1.code == 4)), fuse_sigmoid: Expect arg[1] to be pointer" | |
| .size .L.str.138, 140 | |
| .type .L.str.139,@object # @.str.139 | |
| .L.str.139: | |
| .asciz "Assert fail: (num_args == 3), fuse_matmul_1: num_args should be 3" | |
| .size .L.str.139, 66 | |
| .type .L.str.140,@object # @.str.140 | |
| .L.str.140: | |
| .asciz "Assert fail: ((1 == int32(arg0.strides[1])) && (100 == int32(arg0.strides[0]))), arg0.strides: expected to be compact array" | |
| .size .L.str.140, 124 | |
| .type .L.str.141,@object # @.str.141 | |
| .L.str.141: | |
| .asciz "Assert fail: ((1 == int32(arg1.strides[1])) && (10 == int32(arg1.strides[0]))), arg1.strides: expected to be compact array" | |
| .size .L.str.141, 123 | |
| .type .L.str.142,@object # @.str.142: NUL-terminated assert text for the arg2 compact-stride check (strides[0] == 10, strides[1] == 1); the message names no kernel | |
| .L.str.142: | |
| .asciz "Assert fail: ((1 == int32(arg2.strides[1])) && (10 == int32(arg2.strides[0]))), arg2.strides: expected to be compact array" | |
| .size .L.str.142, 123 | |
| .type .L.str.143,@object # @.str.143: NUL-terminated assert text for fuse_matmul_1's arg[0] type-code check (accepted codes per the text: 3, 13, 7, 4) | |
| .L.str.143: | |
| .asciz "Assert fail: ((((arg0.code == 3) || (arg0.code == 13)) || (arg0.code == 7)) || (arg0.code == 4)), fuse_matmul_1: Expect arg[0] to be pointer" | |
| .size .L.str.143, 141 | |
| .type .L.str.144,@object # @.str.144: NUL-terminated assert text for fuse_matmul_1's arg[1] type-code check (accepted codes per the text: 3, 13, 7, 4) | |
| .L.str.144: | |
| .asciz "Assert fail: ((((arg1.code == 3) || (arg1.code == 13)) || (arg1.code == 7)) || (arg1.code == 4)), fuse_matmul_1: Expect arg[1] to be pointer" | |
| .size .L.str.144, 141 | |
| .type .L.str.145,@object # @.str.145: NUL-terminated assert text for fuse_matmul_1's arg[2] type-code check (accepted codes per the text: 3, 13, 7, 4) | |
| .L.str.145: | |
| .asciz "Assert fail: ((((arg2.code == 3) || (arg2.code == 13)) || (arg2.code == 7)) || (arg2.code == 4)), fuse_matmul_1: Expect arg[2] to be pointer" | |
| .size .L.str.145, 141 | |
| .type .L.str.146,@object # @.str.146: NUL-terminated assert text for the arg0.shape[1] == 100 check; the message names no kernel and the referencing code is outside this chunk | |
| .L.str.146: | |
| .asciz "Assert fail: (int32(arg0.shape[1]) == 100), Argument arg0.shape[1] has an unsatisfied constraint" | |
| .size .L.str.146, 97 | |
| .type .L.str.147,@object # @.str.147: NUL-terminated assert text for the arg1.shape[1] == 10 check; the message names no kernel and the referencing code is outside this chunk | |
| .L.str.147: | |
| .asciz "Assert fail: (int32(arg1.shape[1]) == 10), Argument arg1.shape[1] has an unsatisfied constraint" | |
| .size .L.str.147, 96 | |
| .type .L.str.148,@object # @.str.148: NUL-terminated assert text for the arg2.shape[1] == 10 check; the message names no kernel and the referencing code is outside this chunk | |
| .L.str.148: | |
| .asciz "Assert fail: (int32(arg2.shape[1]) == 10), Argument arg2.shape[1] has an unsatisfied constraint" | |
| .size .L.str.148, 96 | |
| .type .L.str.149,@object # @.str.149: NUL-terminated assert text for fuse_elemwise_add_1's num_args == 3 check | |
| .L.str.149: | |
| .asciz "Assert fail: (num_args == 3), fuse_elemwise_add_1: num_args should be 3" | |
| .size .L.str.149, 72 | |
| .type .L.str.150,@object # @.str.150: NUL-terminated assert text for fuse_elemwise_add_1's arg[0] type-code check (accepted codes per the text: 3, 13, 7, 4) | |
| .L.str.150: | |
| .asciz "Assert fail: ((((arg0.code == 3) || (arg0.code == 13)) || (arg0.code == 7)) || (arg0.code == 4)), fuse_elemwise_add_1: Expect arg[0] to be pointer" | |
| .size .L.str.150, 147 | |
| .type .L.str.151,@object # @.str.151: NUL-terminated assert text for fuse_elemwise_add_1's arg[1] type-code check (accepted codes per the text: 3, 13, 7, 4) | |
| .L.str.151: | |
| .asciz "Assert fail: ((((arg1.code == 3) || (arg1.code == 13)) || (arg1.code == 7)) || (arg1.code == 4)), fuse_elemwise_add_1: Expect arg[1] to be pointer" | |
| .size .L.str.151, 147 | |
| .type .L.str.152,@object # @.str.152: NUL-terminated assert text for fuse_elemwise_add_1's arg[2] type-code check (accepted codes per the text: 3, 13, 7, 4) | |
| .L.str.152: | |
| .asciz "Assert fail: ((((arg2.code == 3) || (arg2.code == 13)) || (arg2.code == 7)) || (arg2.code == 4)), fuse_elemwise_add_1: Expect arg[2] to be pointer" | |
| .size .L.str.152, 147 | |
| .type .L.str.153,@object # @.str.153: NUL-terminated assert text for the arg0.shape[0] == 10 check; the message names no kernel and the referencing code is outside this chunk | |
| .L.str.153: | |
| .asciz "Assert fail: (int32(arg0.shape[0]) == 10), Argument arg0.shape[0] has an unsatisfied constraint" | |
| .size .L.str.153, 96 | |
| .type .L.str.154,@object # @.str.154: NUL-terminated assert text for the arg1.shape[0] == 10 check; the message names no kernel and the referencing code is outside this chunk | |
| .L.str.154: | |
| .asciz "Assert fail: (int32(arg1.shape[0]) == 10), Argument arg1.shape[0] has an unsatisfied constraint" | |
| .size .L.str.154, 96 | |
| .type .L.str.155,@object # @.str.155: NUL-terminated assert text for the arg2.shape[0] == 10 check; the message names no kernel and the referencing code is outside this chunk | |
| .L.str.155: | |
| .asciz "Assert fail: (int32(arg2.shape[0]) == 10), Argument arg2.shape[0] has an unsatisfied constraint" | |
| .size .L.str.155, 96 | |
| .type .L.str.156,@object # @.str.156: NUL-terminated assert text for fuse_softmax's num_args == 2 check | |
| .L.str.156: | |
| .asciz "Assert fail: (num_args == 2), fuse_softmax: num_args should be 2" | |
| .size .L.str.156, 65 | |
| .type .L.str.157,@object # @.str.157: NUL-terminated assert text for the arg0 compact-stride check (strides[0] == 10, strides[1] == 1); the message names no kernel | |
| .L.str.157: | |
| .asciz "Assert fail: ((1 == int32(arg0.strides[1])) && (10 == int32(arg0.strides[0]))), arg0.strides: expected to be compact array" | |
| .size .L.str.157, 123 | |
| .type .L.str.158,@object # @.str.158: NUL-terminated assert text for fuse_softmax's arg[0] type-code check (accepted codes per the text: 3, 13, 7, 4) | |
| .L.str.158: | |
| .asciz "Assert fail: ((((arg0.code == 3) || (arg0.code == 13)) || (arg0.code == 7)) || (arg0.code == 4)), fuse_softmax: Expect arg[0] to be pointer" | |
| .size .L.str.158, 140 | |
| .type .L.str.159,@object # @.str.159: NUL-terminated assert text for fuse_softmax's arg[1] type-code check (accepted codes per the text: 3, 13, 7, 4) | |
| .L.str.159: | |
| .asciz "Assert fail: ((((arg1.code == 3) || (arg1.code == 13)) || (arg1.code == 7)) || (arg1.code == 4)), fuse_softmax: Expect arg[1] to be pointer" | |
| .size .L.str.159, 140 | |
| .type .L.str.160,@object # @.str.160: NUL-terminated assert text for the arg0.shape[1] == 10 check; the message names no kernel and the referencing code is outside this chunk | |
| .L.str.160: | |
| .asciz "Assert fail: (int32(arg0.shape[1]) == 10), Argument arg0.shape[1] has an unsatisfied constraint" | |
| .size .L.str.160, 96 | |
| .type __tvm_main__,@object # @__tvm_main__: weak data object holding the NUL-terminated name "fuse_reshape" (12 chars + NUL = 13 bytes), the first function defined in this file; NOTE(review): presumably read by the TVM runtime to find the module's entry function - confirm | |
| .weak __tvm_main__ | |
| __tvm_main__: | |
| .asciz "fuse_reshape" | |
| .size __tvm_main__, 13 | |
| .section ".note.GNU-stack","",@progbits |
Sign up for free
to join this conversation on GitHub.
Already have an account?
Sign in to comment