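# Listing metadata: 239 lines, 3.3 KiB.
# The listing viewer labelled this file "ArmAsm"; the content is RISC-V (RV64)
# GNU-assembler source, as the `.attribute arch, "rv64i..."` line states.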
# Assembler preamble: source-file name, target attributes, and the section
# and symbol declarations for `main`.
        .file   "matmul2.sy"
        .option pic                             # generate position-independent code
        .attribute arch, "rv64i2p1_m2p0_a2p1_f2p2_d2p2_c2p0_zicsr2p0_zifencei2p0"
        .attribute unaligned_access, 0          # object is tagged as making no unaligned accesses
        .attribute stack_align, 16              # stack is kept 16-byte aligned
        .text
        .section        .text.startup,"ax",@progbits
        .align  1                               # power-of-two form: 2-byte alignment (arch includes "c")
        .globl  main
        .type   main, @function
#-----------------------------------------------------------------------
# int main(void)      compiler output for matmul2.sy (RV64, GNU as syntax)
#
# The three global matrices a, b, c are each addressed as 1000 rows of
# 1000 32-bit words (row stride 4000 bytes, 4000000 bytes in total).
#
# Phases, in order:
#   load      : getarray(row) for each of the 1000 rows of a; as soon as a
#               call returns something other than 1000, return that value.
#   start     : _sysy_starttime(24)
#   transpose : b[i][j] = a[j][i]                          (.L4 / .L5)
#   multiply  : c[i][j] = sum_k a[i][k] * b[k][j], 32-bit  (.L9 / .L11 / .L7)
#   row-min   : every word of row i of c = signed min of that row
#                                                          (.L10 / .L13 / .L14)
#   negate    : c[i][j] = -c[j][i], performed in place     (.L17 / .L16)
#   checksum  : s0 = 32-bit sum of every word of c         (.L18 / .L19)
#   finish    : _sysy_stoptime(93); putint(s0); return 0
#
# Constants that do not fit a 12-bit immediate are built as li + addi:
#   row stride      4000    = 4096    - 96
#   matrix size     4000000 = 4001792 - 1792
#   size + one row  4004000 = 4005888 - 1888
#
# Stack frame (48 bytes): ra@40  s0@32  s1@24  s2@16  s3@8  s4@0
# Callee-saved s0-s4 are saved because main keeps values in them across
# calls; they and ra are restored at .L2.
# NOTE(review): the arguments 24 and 93 to the timing calls look like source
# line numbers - confirm against the runtime library.
#-----------------------------------------------------------------------
main:
        addi    sp,sp,-48
        sd      s0,32(sp)
        sd      s3,8(sp)
        lla     s0,a                    # s0 = &a[0][0] (kept until the checksum phase)
        li      s3,4096
        sd      s1,24(sp)
        sd      s2,16(sp)
        sd      s4,0(sp)
        sd      ra,40(sp)
        lla     s1,a+4000000            # s1 = one past the last row of a
        mv      s2,s0                   # s2 = current row of a
        li      s4,1000                 # expected getarray() result
        addi    s3,s3,-96               # s3 = 4000 (row stride)
        j       .L3

        # ---- load: one getarray call per row of a --------------------
.L33:
        beq     s2,s1,.L32              # all rows read -> start the timed work
.L3:
        mv      a0,s2
        call    getarray@plt
        add     s2,s2,s3                # advance to the next row
        beq     a0,s4,.L33              # result == 1000 -> keep going
                                        # otherwise fall through and return a0 as is

        # ---- common epilogue: a0 already holds the return value ------
.L2:
        ld      ra,40(sp)
        ld      s0,32(sp)
        ld      s1,24(sp)
        ld      s2,16(sp)
        ld      s3,8(sp)
        ld      s4,0(sp)
        addi    sp,sp,48
        jr      ra

        # ---- start timer ---------------------------------------------
.L32:
        li      a0,24
        call    _sysy_starttime@plt

        # ---- transpose: b[i][j] = a[j][i] ----------------------------
        # s1 = a + 4000000 + 4*i : end sentinel for column i of a
        # a0 = start of row i of b
        lla     t1,b                    # t1 = &b[0][0] (reused by the multiply setup)
        li      a1,-4001792
        li      a2,4096
        lla     a6,a+4004000            # outer-loop end value for s1
        mv      a0,t1
        addi    a1,a1,1792              # a1 = -4000000
        addi    a2,a2,-96               # a2 = 4000
.L4:
        add     a5,s1,a1                # a5 = &a[0][i]
        mv      a4,a0                   # a4 = &b[i][0]
.L5:
        lw      a3,0(a5)
        add     a5,a5,a2                # down one row of a
        addi    a4,a4,4                 # along the row of b
        sw      a3,-4(a4)               # store to the slot a4 pointed at before the bump
        bne     a5,s1,.L5
        addi    s1,a5,4                 # sentinel for the next column
        add     a0,a0,a2                # next row of b
        bne     s1,a6,.L4

        # ---- multiply: c[i][j] = sum_k a[i][k] * b[k][j] -------------
        # t0 = i, t2 = row i of c, t4 = row i of a
        # a0 = b + 4000000 + 4*j : end sentinel for column j of b
        li      t6,4001792
        li      a5,4005888
        lla     t3,c                    # t3 = &c[0][0]
        addi    t6,t6,-1792             # 4000000
        addi    a5,a5,-1888             # 4004000
        li      a6,4096
        li      t5,-4001792
        add     t6,t1,t6                # t6 = b + 4000000 (sentinel for column 0)
        mv      t2,t3
        li      t0,0
        add     t1,t1,a5                # t1 = b + 4004000 (end value for a0)
        addi    a6,a6,-96               # a6 = 4000
        addi    t5,t5,1792              # t5 = -4000000
        li      s1,1000                 # row count
.L9:
        mul     t4,t0,a6
        mv      a0,t6
        mv      a7,t2                   # a7 = &c[i][0]
        add     t4,t4,s0                # t4 = &a[i][0]
.L11:
        add     a4,a0,t5                # a4 = &b[0][j]
        mv      a3,t4                   # a3 = &a[i][0]
        li      a2,0                    # running dot product
.L7:
        lw      a1,0(a3)
        lw      a5,0(a4)
        add     a4,a4,a6                # down column j of b
        addi    a3,a3,4                 # along row i of a
        mulw    a5,a5,a1                # 32-bit multiply
        addw    a2,a5,a2                # 32-bit accumulate
        bne     a4,a0,.L7
        sw      a2,0(a7)
        addi    a0,a4,4                 # sentinel for the next column
        addi    a7,a7,4
        bne     a0,t1,.L11
        addi    t0,t0,1
        add     t2,t2,a6                # next row of c
        bne     t0,s1,.L9

        # ---- row-min: fill each row of c with its signed minimum -----
        # a7 = row start, a1 = row end; a6 = c + 4000 is kept for the checksum
        add     a6,t3,a6                # a6 = c + 4000 (end of row 0)
        li      t5,-2147483648
        li      t4,-1
        li      a0,4096
        lla     t1,c+4004000            # end value for the row-end pointer
        mv      a1,a6
        lla     a7,c
        xori    t5,t5,-1                # t5 = 0x7fffffff, initial minimum
        srli    t4,t4,32                # t4 = 0x00000000ffffffff
        addi    a0,a0,-96               # a0 = 4000
.L10:
        mv      a5,a7
        mv      a2,t5
.L13:
        lw      a3,0(a5)
        addi    a5,a5,4
        mv      a4,a3                   # candidate = loaded word
        ble     a3,a2,.L12              # keep it when it is <= current minimum
        mv      a4,a2                   # otherwise keep the current minimum
.L12:
        sext.w  a2,a4
        bne     a5,a1,.L13
        slli    a3,a4,32
        and     a5,t4,a4
        or      a5,a5,a3                # a5 = minimum in both 32-bit halves
        mv      a4,a7
.L14:
        sd      a5,0(a4)                # write two words per store
        addi    a4,a4,8
        bne     a4,a1,.L14
        add     a1,a4,a0                # end of the next row
        add     a7,a7,a0                # start of the next row
        bne     a1,t1,.L10

        # ---- negate: c[i][j] = -c[j][i], in place --------------------
        # Reads column i of c while writing row i of c (t3 = row i).
        li      a0,-4001792
        li      a2,4096
        lla     a1,c+4000000            # sentinel for column 0
        addi    a0,a0,1792              # a0 = -4000000
        addi    a2,a2,-96               # a2 = 4000
.L17:
        add     a5,a1,a0                # a5 = &c[0][i]
        mv      a3,t3
.L16:
        lw      a4,0(a5)
        addi    a3,a3,4
        add     a5,a5,a2
        negw    a4,a4
        sw      a4,-4(a3)
        bne     a5,a1,.L16
        addi    a1,a5,4
        add     t3,t3,a2
        bne     a1,t1,.L17

        # ---- checksum: s0 = sum of all words of c (32-bit) -----------
        # a6 = end of the current row, t1 = c + 4004000
        li      a2,-4096
        li      a3,4096
        li      s0,0
        addi    a2,a2,96                # a2 = -4000
        addi    a3,a3,-96               # a3 = 4000
.L18:
        add     a5,a6,a2                # a5 = start of the current row
.L19:
        lw      a4,0(a5)
        addi    a5,a5,4
        addw    s0,a4,s0
        bne     a6,a5,.L19
        add     a6,a6,a3
        bne     a6,t1,.L18

        # ---- stop timer, print the checksum, return 0 ----------------
        li      a0,93
        call    _sysy_stoptime@plt
        mv      a0,s0
        call    putint@plt
        li      a0,0
        j       .L2
        .size   main, .-main
# Global data symbols exported by this object file.
# c, b and a are the matrices used by main; the _sysy_* symbols are not
# referenced by any instruction in this file.
        .globl  c
        .globl  b
        .globl  a
        .globl  _sysy_idx
        .globl  _sysy_us
        .globl  _sysy_s
        .globl  _sysy_m
        .globl  _sysy_h
        .globl  _sysy_l2
        .globl  _sysy_l1
        .globl  _sysy_end
        .globl  _sysy_start
# Zero-initialised storage for the three matrices, 4000000 bytes each.
# main addresses each one as 1000 rows of 1000 32-bit words (stride 4000).
# The 8-byte alignment matters: main fills rows of c with 8-byte `sd`
# stores, and both the base of c and the 4000-byte stride are multiples of 8.
        .bss
        .align  3                       # power-of-two form: 8-byte alignment
        .type   c, @object
        .size   c, 4000000
c:                                      # product / result matrix
        .zero   4000000
        .type   b, @object
        .size   b, 4000000
b:                                      # receives the transpose of a
        .zero   4000000
        .type   a, @object
        .size   a, 4000000
a:                                      # input matrix, filled row by row via getarray
        .zero   4000000
# Zero-initialised _sysy_* objects. Nothing in this file reads or writes them.
# NOTE(review): presumably bookkeeping for the _sysy_starttime/_sysy_stoptime
# runtime routines - confirm against the runtime library source.
        .type   _sysy_idx, @object
        .size   _sysy_idx, 4
_sysy_idx:
        .zero   4
        .zero   4                       # outside the symbol's declared size; presumably
                                        # padding to keep the next object 8-byte aligned
        .type   _sysy_us, @object
        .size   _sysy_us, 4096
_sysy_us:
        .zero   4096
        .type   _sysy_s, @object
        .size   _sysy_s, 4096
_sysy_s:
        .zero   4096
        .type   _sysy_m, @object
        .size   _sysy_m, 4096
_sysy_m:
        .zero   4096
        .type   _sysy_h, @object
        .size   _sysy_h, 4096
_sysy_h:
        .zero   4096
        .type   _sysy_l2, @object
        .size   _sysy_l2, 4096
_sysy_l2:
        .zero   4096
        .type   _sysy_l1, @object
        .size   _sysy_l1, 4096
_sysy_l1:
        .zero   4096
        .type   _sysy_end, @object
        .size   _sysy_end, 16
_sysy_end:
        .zero   16
        .type   _sysy_start, @object
        .size   _sysy_start, 16
_sysy_start:
        .zero   16
# Compiler identification string, followed by the empty .note.GNU-stack
# section (GNU toolchain marker that this object needs no executable stack).
        .ident  "GCC: (Debian 12.2.0-13) 12.2.0"
        .section        .note.GNU-stack,"",@progbits