1959 lines
83 KiB
Plaintext
1959 lines
83 KiB
Plaintext
|
|
vortex_test.elf: file format elf32-littleriscv
|
|
|
|
|
|
Disassembly of section .text:
|
|
|
|
# _start: program entry point.
# Writes 2 to CSR 0x20 and 2 to CSR 0x21 (the CSRs that vx_available_warps and
# vx_available_threads read back), writes zero to mhartid and misa, sets
# sp = 0x7ffff000, calls vx_before_main, calls main, then executes ecall.
# NOTE(review): mhartid is a read-only CSR in the standard RISC-V privileged
# spec; the write at 80000010 presumably relies on target-specific behaviour —
# confirm.
80000000 <_start>:
|
|
80000000: 00200513 li a0,2
|
|
80000004: 02051073 csrw 0x20,a0
|
|
80000008: 00200513 li a0,2
|
|
8000000c: 02151073 csrw 0x21,a0
|
|
80000010: f1401073 csrw mhartid,zero
|
|
80000014: 30101073 csrw misa,zero
|
|
# sp = 0x7ffff000
80000018: 7ffff137 lui sp,0x7ffff
|
|
8000001c: 1b0000ef jal ra,800001cc <vx_before_main>
|
|
80000020: 6a8010ef jal ra,800016c8 <main>
|
|
80000024: 00000073 ecall
|
|
|
|
# vx_createThreads
# In:  a0 = loop bound (copied to t2), a2 (copied to t6), a3 (copied to s7),
#      a4 (copied to s10); a1 is not read here.
# Saves sp in t5, then for a0 = 1 .. t2-1 lowers sp by 2048, copies a0 to t1
# and executes the undecoded word 0x3506b. After the loop it runs six nops,
# restores sp from t5, sets a0 = 0, copies t2 to s11, executes the undecoded
# word 0x1bfe0eb, loads a0 with the address of vx_reschedule_warps and executes
# the undecoded word 0x5406b.
# The three undecoded words all use major opcode 0x6b (a custom opcode objdump
# does not know); their exact semantics are not visible in this listing.
# Presumably they are the target's thread/warp control instructions — confirm
# against the ISA documentation.
# There is no ret: the block ends on the word at 80000088, which is directly
# followed in memory by vx_wspawn.
# s7, s10 and s11 are overwritten without being saved; vx_get_arg_struct reads
# s7 and vx_reschedule_warps reads s10.
80000028 <vx_createThreads>:
|
|
80000028: 00068b93 mv s7,a3
|
|
8000002c: 00070d13 mv s10,a4
|
|
80000030: 00010f13 mv t5,sp
|
|
80000034: 00050393 mv t2,a0
|
|
|
|
80000038 <loop_init>:
|
|
80000038: 00100513 li a0,1
|
|
|
|
8000003c <loop_cond>:
|
|
# signed compare: leave the loop once a0 >= t2
8000003c: 00755c63 bge a0,t2,80000054 <loop_done>
|
|
|
|
80000040 <loop_body>:
|
|
80000040: 80010113 addi sp,sp,-2048 # 7fffe800 <SIZE+0x7fffe7ce>
|
|
80000044: 00050313 mv t1,a0
|
|
# undecoded: opcode 0x6b, funct3 = 5, rs1 = t1, rd = x0
80000048: 0003506b 0x3506b
|
|
|
|
8000004c <loop_inc>:
|
|
8000004c: 00150513 addi a0,a0,1
|
|
80000050: fedff06f j 8000003c <loop_cond>
|
|
|
|
80000054 <loop_done>:
|
|
80000054: 00000013 nop
|
|
80000058: 00000013 nop
|
|
8000005c: 00000013 nop
|
|
80000060: 00000013 nop
|
|
80000064: 00000013 nop
|
|
80000068: 00000013 nop
|
|
8000006c: 000f0113 mv sp,t5
|
|
80000070: 00000513 li a0,0
|
|
80000074: 00060f93 mv t6,a2
|
|
80000078: 00038d93 mv s11,t2
|
|
# undecoded: opcode 0x6b, funct3 = 6, rs1 = t6, rs2 = s11, rd = ra
8000007c: 01bfe0eb 0x1bfe0eb
|
|
80000080: 00000517 auipc a0,0x0
|
|
80000084: 1b050513 addi a0,a0,432 # 80000230 <vx_reschedule_warps>
|
|
# undecoded: opcode 0x6b, funct3 = 4, rs1 = a0, rd = x0
80000088: 0005406b 0x5406b
|
|
|
|
# vx_wspawn
# Loads t1 with the address of vx_createThreads, executes the undecoded word
# 0x3006b (opcode 0x6b, funct3 = 0, rs1 = t1, rd = x0) and returns.
# Argument registers a0-a4 are not touched here.
# Presumably the custom instruction starts another warp at the address in t1 —
# confirm against the target ISA documentation.
8000008c <vx_wspawn>:
|
|
8000008c: 00000317 auipc t1,0x0
|
|
80000090: f9c30313 addi t1,t1,-100 # 80000028 <vx_createThreads>
|
|
80000094: 0003006b 0x3006b
|
|
80000098: 00008067 ret
|
|
|
|
# vx_save_context
# Stores all 32 integer registers into the 128-byte area at 0x8100029c
# (<context>), register xN at byte offset 4*N, then sets tp = 1 and returns.
# tp is used as the base pointer, so the caller's tp is lost: the value stored
# in the tp slot (offset 16) is the context address itself.
# Out: tp = 1 (vx_load_context finishes with tp = 0, and vx_schedule_warps tests
#      tp after calling this routine).
# The "# N <A_WARPS...>" / "<SIZE...>" annotations below are objdump's guesses
# from treating tp as zero; they are not the real store addresses.
8000009c <vx_save_context>:
|
|
8000009c: 01000217 auipc tp,0x1000
|
|
800000a0: 20020213 addi tp,tp,512 # 8100029c <context>
|
|
800000a4: 00022023 sw zero,0(tp) # 0 <A_WARPS-0x7>
|
|
800000a8: 00122223 sw ra,4(tp) # 4 <A_WARPS-0x3>
|
|
800000ac: 00222423 sw sp,8(tp) # 8 <A_WARPS+0x1>
|
|
800000b0: 00322623 sw gp,12(tp) # c <A_WARPS+0x5>
|
|
# stores the context address (current tp), not the caller's tp
800000b4: 00422823 sw tp,16(tp) # 10 <A_WARPS+0x9>
|
|
800000b8: 00522a23 sw t0,20(tp) # 14 <A_WARPS+0xd>
|
|
800000bc: 00622c23 sw t1,24(tp) # 18 <A_WARPS+0x11>
|
|
800000c0: 00722e23 sw t2,28(tp) # 1c <A_WARPS+0x15>
|
|
800000c4: 02822023 sw s0,32(tp) # 20 <A_WARPS+0x19>
|
|
800000c8: 02922223 sw s1,36(tp) # 24 <A_WARPS+0x1d>
|
|
800000cc: 02a22423 sw a0,40(tp) # 28 <A_WARPS+0x21>
|
|
800000d0: 02b22623 sw a1,44(tp) # 2c <A_WARPS+0x25>
|
|
800000d4: 02c22823 sw a2,48(tp) # 30 <A_WARPS+0x29>
|
|
800000d8: 02d22a23 sw a3,52(tp) # 34 <SIZE+0x2>
|
|
800000dc: 02e22c23 sw a4,56(tp) # 38 <SIZE+0x6>
|
|
800000e0: 02f22e23 sw a5,60(tp) # 3c <SIZE+0xa>
|
|
800000e4: 05022023 sw a6,64(tp) # 40 <SIZE+0xe>
|
|
800000e8: 05122223 sw a7,68(tp) # 44 <SIZE+0x12>
|
|
800000ec: 05222423 sw s2,72(tp) # 48 <SIZE+0x16>
|
|
800000f0: 05322623 sw s3,76(tp) # 4c <SIZE+0x1a>
|
|
800000f4: 05422823 sw s4,80(tp) # 50 <SIZE+0x1e>
|
|
800000f8: 05522a23 sw s5,84(tp) # 54 <SIZE+0x22>
|
|
800000fc: 05622c23 sw s6,88(tp) # 58 <SIZE+0x26>
|
|
80000100: 05722e23 sw s7,92(tp) # 5c <SIZE+0x2a>
|
|
80000104: 07822023 sw s8,96(tp) # 60 <SIZE+0x2e>
|
|
80000108: 07922223 sw s9,100(tp) # 64 <SIZE+0x32>
|
|
8000010c: 07a22423 sw s10,104(tp) # 68 <SIZE+0x36>
|
|
80000110: 07b22623 sw s11,108(tp) # 6c <SIZE+0x3a>
|
|
80000114: 07c22823 sw t3,112(tp) # 70 <SIZE+0x3e>
|
|
80000118: 07d22a23 sw t4,116(tp) # 74 <SIZE+0x42>
|
|
8000011c: 07e22c23 sw t5,120(tp) # 78 <SIZE+0x46>
|
|
80000120: 07f22e23 sw t6,124(tp) # 7c <SIZE+0x4a>
|
|
80000124: 00100213 li tp,1
|
|
80000128: 00008067 ret
|
|
|
|
# vx_load_context
# Reloads the integer registers from the 128-byte area at 0x8100029c
# (<context>), register xN from byte offset 4*N, then sets tp = 0 and returns.
# Because ra is reloaded from the context before the final ret, the ret jumps
# to the return address that was stored in the context, not to the caller of
# this routine.
# NOTE(review): the base register tp is itself reloaded at 80000144 and every
# later load uses the reloaded value as base. This only works when slot 16
# contains the context address, which is what vx_save_context stores there.
# The "# N <A_WARPS...>" / "<SIZE...>" annotations below are objdump's guesses
# from treating tp as zero; they are not the real load addresses.
8000012c <vx_load_context>:
|
|
8000012c: 01000217 auipc tp,0x1000
|
|
80000130: 17020213 addi tp,tp,368 # 8100029c <context>
|
|
80000134: 00022003 lw zero,0(tp) # 0 <A_WARPS-0x7>
|
|
80000138: 00422083 lw ra,4(tp) # 4 <A_WARPS-0x3>
|
|
8000013c: 00822103 lw sp,8(tp) # 8 <A_WARPS+0x1>
|
|
80000140: 00c22183 lw gp,12(tp) # c <A_WARPS+0x5>
|
|
# base register replaced by the saved tp slot from here on
80000144: 01022203 lw tp,16(tp) # 10 <A_WARPS+0x9>
|
|
80000148: 01422283 lw t0,20(tp) # 14 <A_WARPS+0xd>
|
|
8000014c: 01822303 lw t1,24(tp) # 18 <A_WARPS+0x11>
|
|
80000150: 01c22383 lw t2,28(tp) # 1c <A_WARPS+0x15>
|
|
80000154: 02022403 lw s0,32(tp) # 20 <A_WARPS+0x19>
|
|
80000158: 02422483 lw s1,36(tp) # 24 <A_WARPS+0x1d>
|
|
8000015c: 02822503 lw a0,40(tp) # 28 <A_WARPS+0x21>
|
|
80000160: 02c22583 lw a1,44(tp) # 2c <A_WARPS+0x25>
|
|
80000164: 03022603 lw a2,48(tp) # 30 <A_WARPS+0x29>
|
|
80000168: 03422683 lw a3,52(tp) # 34 <SIZE+0x2>
|
|
8000016c: 03822703 lw a4,56(tp) # 38 <SIZE+0x6>
|
|
80000170: 03c22783 lw a5,60(tp) # 3c <SIZE+0xa>
|
|
80000174: 04022803 lw a6,64(tp) # 40 <SIZE+0xe>
|
|
80000178: 04422883 lw a7,68(tp) # 44 <SIZE+0x12>
|
|
8000017c: 04822903 lw s2,72(tp) # 48 <SIZE+0x16>
|
|
80000180: 04c22983 lw s3,76(tp) # 4c <SIZE+0x1a>
|
|
80000184: 05022a03 lw s4,80(tp) # 50 <SIZE+0x1e>
|
|
80000188: 05422a83 lw s5,84(tp) # 54 <SIZE+0x22>
|
|
8000018c: 05822b03 lw s6,88(tp) # 58 <SIZE+0x26>
|
|
80000190: 05c22b83 lw s7,92(tp) # 5c <SIZE+0x2a>
|
|
80000194: 06022c03 lw s8,96(tp) # 60 <SIZE+0x2e>
|
|
80000198: 06422c83 lw s9,100(tp) # 64 <SIZE+0x32>
|
|
8000019c: 06822d03 lw s10,104(tp) # 68 <SIZE+0x36>
|
|
800001a0: 06c22d83 lw s11,108(tp) # 6c <SIZE+0x3a>
|
|
800001a4: 07022e03 lw t3,112(tp) # 70 <SIZE+0x3e>
|
|
800001a8: 07422e83 lw t4,116(tp) # 74 <SIZE+0x42>
|
|
800001ac: 07822f03 lw t5,120(tp) # 78 <SIZE+0x46>
|
|
800001b0: 07c22f83 lw t6,124(tp) # 7c <SIZE+0x4a>
|
|
800001b4: 00000213 li tp,0
|
|
800001b8: 00008067 ret
|
|
|
|
# vx_available_warps
# Out: a0 = current value of CSR 0x20 (the CSR _start initialises to 2).
800001bc <vx_available_warps>:
|
|
800001bc: 02002573 csrr a0,0x20
|
|
800001c0: 00008067 ret
|
|
|
|
# vx_available_threads
# Out: a0 = current value of CSR 0x21 (the CSR _start initialises to 2).
800001c4 <vx_available_threads>:
|
|
800001c4: 02102573 csrr a0,0x21
|
|
800001c8: 00008067 ret
|
|
|
|
# vx_before_main
# Calls queue_initialize on eight queue records: for i = 0 .. 7 the argument is
# 0x8100031c + i * 1220.
# Frame: 32 bytes; ra at 28(sp), s0 at 24(sp), loop counter i at -20(s0).
# Takes no arguments and returns no value.
800001cc <vx_before_main>:
|
|
800001cc: fe010113 addi sp,sp,-32
|
|
800001d0: 00112e23 sw ra,28(sp)
|
|
800001d4: 00812c23 sw s0,24(sp)
|
|
800001d8: 02010413 addi s0,sp,32
|
|
# i = 0
800001dc: fe042623 sw zero,-20(s0)
|
|
800001e0: 0300006f j 80000210 <vx_before_main+0x44>
|
|
# loop body: a0 = 0x8100031c + i * 1220
800001e4: fec42703 lw a4,-20(s0)
|
|
800001e8: 4c400793 li a5,1220
|
|
800001ec: 02f70733 mul a4,a4,a5
|
|
800001f0: 810007b7 lui a5,0x81000
|
|
800001f4: 31c78793 addi a5,a5,796 # 8100031c <main_sp+0xffffa960>
|
|
800001f8: 00f707b3 add a5,a4,a5
|
|
800001fc: 00078513 mv a0,a5
|
|
80000200: 404000ef jal ra,80000604 <queue_initialize>
|
|
# i++
80000204: fec42783 lw a5,-20(s0)
|
|
80000208: 00178793 addi a5,a5,1
|
|
8000020c: fef42623 sw a5,-20(s0)
|
|
# loop condition: continue while i <= 7 (signed)
80000210: fec42703 lw a4,-20(s0)
|
|
80000214: 00700793 li a5,7
|
|
80000218: fce7d6e3 bge a5,a4,800001e4 <vx_before_main+0x18>
|
|
8000021c: 00000013 nop
|
|
80000220: 01c12083 lw ra,28(sp)
|
|
80000224: 01812403 lw s0,24(sp)
|
|
80000228: 02010113 addi sp,sp,32
|
|
8000022c: 00008067 ret
|
|
|
|
# vx_reschedule_warps
# In: s10 = queue index (set by vx_createThreads from its a4).
# Let q = 0x8100031c + s10 * 1220.
#  - If queue_isEmpty(q) returns non-zero: stores 1 to the word at
#    0x8100027c + 4*s10 (the array polled by vx_wait_for_warps). Then, if
#    s10 == 0, calls vx_load_context; otherwise executes ecall.
#  - Otherwise: dequeues a 6-word record from q into the local buffer at
#    -40(s0), sets sp = word 2, a0 = word 1, a1 = word 0, a2 = word 3,
#    a3 = word 4, a4 = word 5, calls vx_createThreads, then executes ecall.
# Frame: 48 bytes; ra at 44(sp), s0 at 40(sp), s10 at 36(sp).
# NOTE(review): vx_load_context reloads ra and sp from the saved context before
# its ret, so the "j 800002ec" after that call is presumably never reached —
# confirm.
80000230 <vx_reschedule_warps>:
|
|
80000230: fd010113 addi sp,sp,-48
|
|
80000234: 02112623 sw ra,44(sp)
|
|
80000238: 02812423 sw s0,40(sp)
|
|
8000023c: 03a12223 sw s10,36(sp)
|
|
80000240: 03010413 addi s0,sp,48
|
|
# a0 = 0x8100031c + s10 * 1220
80000244: 000d0713 mv a4,s10
|
|
80000248: 4c400793 li a5,1220
|
|
8000024c: 02f70733 mul a4,a4,a5
|
|
80000250: 810007b7 lui a5,0x81000
|
|
80000254: 31c78793 addi a5,a5,796 # 8100031c <main_sp+0xffffa960>
|
|
80000258: 00f707b3 add a5,a4,a5
|
|
8000025c: 00078513 mv a0,a5
|
|
80000260: 4b8000ef jal ra,80000718 <queue_isEmpty>
|
|
80000264: 00050793 mv a5,a0
|
|
# queue not empty -> go dequeue the next record
80000268: 02078a63 beqz a5,8000029c <vx_reschedule_warps+0x6c>
|
|
# queue empty: word at 0x8100027c + 4*s10 = 1
8000026c: 000d0713 mv a4,s10
|
|
80000270: 810007b7 lui a5,0x81000
|
|
80000274: 00271713 slli a4,a4,0x2
|
|
80000278: 27c78793 addi a5,a5,636 # 8100027c <main_sp+0xffffa8c0>
|
|
8000027c: 00f707b3 add a5,a4,a5
|
|
80000280: 00100713 li a4,1
|
|
80000284: 00e7a023 sw a4,0(a5)
|
|
80000288: 000d0793 mv a5,s10
|
|
8000028c: 00079663 bnez a5,80000298 <vx_reschedule_warps+0x68>
|
|
80000290: e9dff0ef jal ra,8000012c <vx_load_context>
|
|
80000294: 0580006f j 800002ec <vx_reschedule_warps+0xbc>
|
|
80000298: 00000073 ecall
|
|
# dequeue path: a0 = queue address, a1 = local record buffer at -40(s0)
8000029c: 000d0713 mv a4,s10
|
|
800002a0: 4c400793 li a5,1220
|
|
800002a4: 02f70733 mul a4,a4,a5
|
|
800002a8: 810007b7 lui a5,0x81000
|
|
800002ac: 31c78793 addi a5,a5,796 # 8100031c <main_sp+0xffffa960>
|
|
800002b0: 00f707b3 add a5,a4,a5
|
|
800002b4: fd840713 addi a4,s0,-40
|
|
800002b8: 00070593 mv a1,a4
|
|
800002bc: 00078513 mv a0,a5
|
|
800002c0: 3d0000ef jal ra,80000690 <queue_dequeue>
|
|
# sp = record word 2
800002c4: fe042783 lw a5,-32(s0)
|
|
800002c8: 00078113 mv sp,a5
|
|
800002cc: fdc42783 lw a5,-36(s0)
|
|
800002d0: fd842583 lw a1,-40(s0)
|
|
800002d4: fe442603 lw a2,-28(s0)
|
|
800002d8: fe842683 lw a3,-24(s0)
|
|
800002dc: fec42703 lw a4,-20(s0)
|
|
800002e0: 00078513 mv a0,a5
|
|
800002e4: d45ff0ef jal ra,80000028 <vx_createThreads>
|
|
800002e8: 00000073 ecall
|
|
800002ec: 02c12083 lw ra,44(sp)
|
|
800002f0: 02812403 lw s0,40(sp)
|
|
800002f4: 02412d03 lw s10,36(sp)
|
|
800002f8: 03010113 addi sp,sp,48
|
|
800002fc: 00008067 ret
|
|
|
|
# vx_schedule_warps
# 1. n = vx_available_warps(); the current sp is kept in s3.
# 2. For i = 1 .. n-1 (unsigned compare): if the queue at
#    0x8100031c + i * 1220 is not empty, dequeues one 6-word record into the
#    local buffer at -48(s0), sets sp = word 2, a0 = word 1, a1 = word 0,
#    a2 = word 3, a3 = word 4, a4 = word 5 and calls vx_wspawn.
# 3. Restores sp from s3 and calls vx_save_context.
# 4. If tp != 0 afterwards and the queue at 0x8100031c (index 0) is not empty,
#    dequeues one record into the buffer at -72(s0), loads sp/a0-a4 from it in
#    the same layout and calls vx_createThreads.
# Frame: 80 bytes; ra at 76(sp), s0 at 72(sp); i at -20(s0), n at -24(s0).
# NOTE(review): s3 is overwritten without being saved or restored, although it
# is a callee-saved register in the standard RISC-V calling convention.
80000300 <vx_schedule_warps>:
|
|
80000300: fb010113 addi sp,sp,-80
|
|
80000304: 04112623 sw ra,76(sp)
|
|
80000308: 04812423 sw s0,72(sp)
|
|
8000030c: 05010413 addi s0,sp,80
|
|
80000310: eadff0ef jal ra,800001bc <vx_available_warps>
|
|
80000314: fea42423 sw a0,-24(s0)
|
|
# remember this frame's sp; the loop below replaces sp per record
80000318: 00010993 mv s3,sp
|
|
# i = 1
8000031c: 00100793 li a5,1
|
|
80000320: fef42623 sw a5,-20(s0)
|
|
80000324: 0840006f j 800003a8 <vx_schedule_warps+0xa8>
|
|
# loop body: a0 = 0x8100031c + i * 1220
80000328: fec42703 lw a4,-20(s0)
|
|
8000032c: 4c400793 li a5,1220
|
|
80000330: 02f70733 mul a4,a4,a5
|
|
80000334: 810007b7 lui a5,0x81000
|
|
80000338: 31c78793 addi a5,a5,796 # 8100031c <main_sp+0xffffa960>
|
|
8000033c: 00f707b3 add a5,a4,a5
|
|
80000340: 00078513 mv a0,a5
|
|
80000344: 3d4000ef jal ra,80000718 <queue_isEmpty>
|
|
80000348: 00050793 mv a5,a0
|
|
# skip this queue when it is empty
8000034c: 04079863 bnez a5,8000039c <vx_schedule_warps+0x9c>
|
|
80000350: fec42703 lw a4,-20(s0)
|
|
80000354: 4c400793 li a5,1220
|
|
80000358: 02f70733 mul a4,a4,a5
|
|
8000035c: 810007b7 lui a5,0x81000
|
|
80000360: 31c78793 addi a5,a5,796 # 8100031c <main_sp+0xffffa960>
|
|
80000364: 00f707b3 add a5,a4,a5
|
|
80000368: fd040713 addi a4,s0,-48
|
|
8000036c: 00070593 mv a1,a4
|
|
80000370: 00078513 mv a0,a5
|
|
80000374: 31c000ef jal ra,80000690 <queue_dequeue>
|
|
# sp = record word 2
80000378: fd842783 lw a5,-40(s0)
|
|
8000037c: 00078113 mv sp,a5
|
|
80000380: fd442783 lw a5,-44(s0)
|
|
80000384: fd042583 lw a1,-48(s0)
|
|
80000388: fdc42603 lw a2,-36(s0)
|
|
8000038c: fe042683 lw a3,-32(s0)
|
|
80000390: fe442703 lw a4,-28(s0)
|
|
80000394: 00078513 mv a0,a5
|
|
80000398: cf5ff0ef jal ra,8000008c <vx_wspawn>
|
|
# i++
8000039c: fec42783 lw a5,-20(s0)
|
|
800003a0: 00178793 addi a5,a5,1
|
|
800003a4: fef42623 sw a5,-20(s0)
|
|
# loop condition: continue while i < n (unsigned)
800003a8: fec42783 lw a5,-20(s0)
|
|
800003ac: fe842703 lw a4,-24(s0)
|
|
800003b0: f6e7ece3 bltu a5,a4,80000328 <vx_schedule_warps+0x28>
|
|
800003b4: 00098113 mv sp,s3
|
|
800003b8: ce5ff0ef jal ra,8000009c <vx_save_context>
|
|
# tp is 1 right after vx_save_context and 0 after vx_load_context
800003bc: 00020793 mv a5,tp
|
|
800003c0: 04078863 beqz a5,80000410 <vx_schedule_warps+0x110>
|
|
800003c4: 810007b7 lui a5,0x81000
|
|
800003c8: 31c78513 addi a0,a5,796 # 8100031c <main_sp+0xffffa960>
|
|
800003cc: 34c000ef jal ra,80000718 <queue_isEmpty>
|
|
800003d0: 00050793 mv a5,a0
|
|
800003d4: 02079e63 bnez a5,80000410 <vx_schedule_warps+0x110>
|
|
800003d8: fb840793 addi a5,s0,-72
|
|
800003dc: 00078593 mv a1,a5
|
|
800003e0: 810007b7 lui a5,0x81000
|
|
800003e4: 31c78513 addi a0,a5,796 # 8100031c <main_sp+0xffffa960>
|
|
800003e8: 2a8000ef jal ra,80000690 <queue_dequeue>
|
|
# sp = record word 2
800003ec: fc042783 lw a5,-64(s0)
|
|
800003f0: 00078113 mv sp,a5
|
|
800003f4: fbc42783 lw a5,-68(s0)
|
|
800003f8: fb842583 lw a1,-72(s0)
|
|
800003fc: fc442603 lw a2,-60(s0)
|
|
80000400: fc842683 lw a3,-56(s0)
|
|
80000404: fcc42703 lw a4,-52(s0)
|
|
80000408: 00078513 mv a0,a5
|
|
8000040c: c1dff0ef jal ra,80000028 <vx_createThreads>
|
|
80000410: 00000013 nop
|
|
80000414: 04c12083 lw ra,76(sp)
|
|
80000418: 04812403 lw s0,72(sp)
|
|
8000041c: 05010113 addi sp,sp,80
|
|
80000420: 00008067 ret
|
|
|
|
# vx_spawnWarps
# In:  a0 = number of records to enqueue, a1, a2, a3 = values copied into each
#      record (the callers visible in this listing pass a thread count, a
#      function address and an argument-block address respectively).
# 1. Calls vx_before_main (re-initialises the eight queues) and reads
#    n = vx_available_warps().
# 2. For i = 0 .. a0-1 (unsigned): lowers sp by 0x10000, builds a 6-word record
#    at -52(s0) = { i, a1, sp, a2, a3, q } and enqueues it on the queue at
#    0x8100031c + q * 1220. q starts at 0, is incremented after each enqueue
#    and reset to 0 once it is no longer below n (round-robin).
# 3. Restores sp from s2 and calls vx_schedule_warps.
# Frame: 80 bytes; ra at 76(sp), s0 at 72(sp); q at -20(s0), i at -24(s0),
#        n at -28(s0); a0..a3 spilled at -68, -72, -76, -80(s0).
# NOTE(review): s2 and s3 are overwritten without being saved or restored,
# although they are callee-saved in the standard RISC-V calling convention.
# NOTE(review): queue_isFull is not consulted before queue_enqueue.
80000424 <vx_spawnWarps>:
|
|
80000424: fb010113 addi sp,sp,-80
|
|
80000428: 04112623 sw ra,76(sp)
|
|
8000042c: 04812423 sw s0,72(sp)
|
|
80000430: 05010413 addi s0,sp,80
|
|
80000434: faa42e23 sw a0,-68(s0)
|
|
80000438: fab42c23 sw a1,-72(s0)
|
|
8000043c: fac42a23 sw a2,-76(s0)
|
|
80000440: fad42823 sw a3,-80(s0)
|
|
80000444: d89ff0ef jal ra,800001cc <vx_before_main>
|
|
80000448: d75ff0ef jal ra,800001bc <vx_available_warps>
|
|
8000044c: fea42223 sw a0,-28(s0)
|
|
# remember this frame's sp; the loop below keeps lowering sp
80000450: 00010913 mv s2,sp
|
|
# q = 0, i = 0
80000454: fe042623 sw zero,-20(s0)
|
|
80000458: fe042423 sw zero,-24(s0)
|
|
8000045c: 08c0006f j 800004e8 <vx_spawnWarps+0xc4>
|
|
# loop body: sp -= 0x10000 (adds 0xffff0000)
80000460: ffff09b7 lui s3,0xffff0
|
|
80000464: 01310133 add sp,sp,s3
|
|
# record word 0 = i
80000468: fe842783 lw a5,-24(s0)
|
|
8000046c: fcf42623 sw a5,-52(s0)
|
|
# record word 1 = a1
80000470: fb842783 lw a5,-72(s0)
|
|
80000474: fcf42823 sw a5,-48(s0)
|
|
# record word 2 = the lowered sp
80000478: 00010793 mv a5,sp
|
|
8000047c: fcf42a23 sw a5,-44(s0)
|
|
# record word 3 = a2
80000480: fb442783 lw a5,-76(s0)
|
|
80000484: fcf42c23 sw a5,-40(s0)
|
|
# record word 4 = a3
80000488: fb042783 lw a5,-80(s0)
|
|
8000048c: fcf42e23 sw a5,-36(s0)
|
|
# record word 5 = q
80000490: fec42783 lw a5,-20(s0)
|
|
80000494: fef42023 sw a5,-32(s0)
|
|
# a0 = 0x8100031c + q * 1220, a1 = &record
80000498: fec42703 lw a4,-20(s0)
|
|
8000049c: 4c400793 li a5,1220
|
|
800004a0: 02f70733 mul a4,a4,a5
|
|
800004a4: 810007b7 lui a5,0x81000
|
|
800004a8: 31c78793 addi a5,a5,796 # 8100031c <main_sp+0xffffa960>
|
|
800004ac: 00f707b3 add a5,a4,a5
|
|
800004b0: fcc40713 addi a4,s0,-52
|
|
800004b4: 00070593 mv a1,a4
|
|
800004b8: 00078513 mv a0,a5
|
|
800004bc: 16c000ef jal ra,80000628 <queue_enqueue>
|
|
# q++, wrapping to 0 once q >= n (unsigned)
800004c0: fec42783 lw a5,-20(s0)
|
|
800004c4: 00178793 addi a5,a5,1
|
|
800004c8: fef42623 sw a5,-20(s0)
|
|
800004cc: fec42783 lw a5,-20(s0)
|
|
800004d0: fe442703 lw a4,-28(s0)
|
|
800004d4: 00e7e463 bltu a5,a4,800004dc <vx_spawnWarps+0xb8>
|
|
800004d8: fe042623 sw zero,-20(s0)
|
|
# i++
800004dc: fe842783 lw a5,-24(s0)
|
|
800004e0: 00178793 addi a5,a5,1
|
|
800004e4: fef42423 sw a5,-24(s0)
|
|
# loop condition: continue while i < a0 (unsigned)
800004e8: fe842703 lw a4,-24(s0)
|
|
800004ec: fbc42783 lw a5,-68(s0)
|
|
800004f0: f6f768e3 bltu a4,a5,80000460 <vx_spawnWarps+0x3c>
|
|
800004f4: 00090113 mv sp,s2
|
|
800004f8: e09ff0ef jal ra,80000300 <vx_schedule_warps>
|
|
800004fc: 00000013 nop
|
|
80000500: 04c12083 lw ra,76(sp)
|
|
80000504: 04812403 lw s0,72(sp)
|
|
80000508: 05010113 addi sp,sp,80
|
|
8000050c: 00008067 ret
|
|
|
|
# vx_wait_for_warps
# In: a0 = target count.
# Reads n = vx_available_warps(), then repeatedly counts how many of the n
# words starting at 0x8100027c equal 1 (vx_reschedule_warps writes 1 there)
# until the count equals the target; this is a busy-wait with no timeout.
# Afterwards it clears all n words to 0 and returns.
# Frame: 48 bytes; ra at 44(sp), s0 at 40(sp); count at -20(s0), scan index at
#        -24(s0), clear index at -28(s0), n at -32(s0), target at -36(s0).
# NOTE(review): the exit test is "count == target", so a target larger than n
# can never be satisfied — confirm callers always pass at most n.
80000510 <vx_wait_for_warps>:
|
|
80000510: fd010113 addi sp,sp,-48
|
|
80000514: 02112623 sw ra,44(sp)
|
|
80000518: 02812423 sw s0,40(sp)
|
|
8000051c: 03010413 addi s0,sp,48
|
|
80000520: fca42e23 sw a0,-36(s0)
|
|
80000524: c99ff0ef jal ra,800001bc <vx_available_warps>
|
|
80000528: fea42023 sw a0,-32(s0)
|
|
8000052c: fe042623 sw zero,-20(s0)
|
|
80000530: 0540006f j 80000584 <vx_wait_for_warps+0x74>
|
|
# start of one polling pass: count = 0, scan index = 0
80000534: fe042623 sw zero,-20(s0)
|
|
80000538: fe042423 sw zero,-24(s0)
|
|
8000053c: 03c0006f j 80000578 <vx_wait_for_warps+0x68>
|
|
# a4 = word at 0x8100027c + 4 * scan index
80000540: 810007b7 lui a5,0x81000
|
|
80000544: fe842703 lw a4,-24(s0)
|
|
80000548: 00271713 slli a4,a4,0x2
|
|
8000054c: 27c78793 addi a5,a5,636 # 8100027c <main_sp+0xffffa8c0>
|
|
80000550: 00f707b3 add a5,a4,a5
|
|
80000554: 0007a703 lw a4,0(a5)
|
|
80000558: 00100793 li a5,1
|
|
8000055c: 00f71863 bne a4,a5,8000056c <vx_wait_for_warps+0x5c>
|
|
# word == 1: count++
80000560: fec42783 lw a5,-20(s0)
|
|
80000564: 00178793 addi a5,a5,1
|
|
80000568: fef42623 sw a5,-20(s0)
|
|
8000056c: fe842783 lw a5,-24(s0)
|
|
80000570: 00178793 addi a5,a5,1
|
|
80000574: fef42423 sw a5,-24(s0)
|
|
# inner condition: continue while scan index < n (unsigned)
80000578: fe842783 lw a5,-24(s0)
|
|
8000057c: fe042703 lw a4,-32(s0)
|
|
80000580: fce7e0e3 bltu a5,a4,80000540 <vx_wait_for_warps+0x30>
|
|
# outer condition: poll again while count != target
80000584: fec42703 lw a4,-20(s0)
|
|
80000588: fdc42783 lw a5,-36(s0)
|
|
8000058c: faf714e3 bne a4,a5,80000534 <vx_wait_for_warps+0x24>
|
|
# clear loop: zero the n words starting at 0x8100027c
80000590: fe042223 sw zero,-28(s0)
|
|
80000594: 0280006f j 800005bc <vx_wait_for_warps+0xac>
|
|
80000598: 810007b7 lui a5,0x81000
|
|
8000059c: fe442703 lw a4,-28(s0)
|
|
800005a0: 00271713 slli a4,a4,0x2
|
|
800005a4: 27c78793 addi a5,a5,636 # 8100027c <main_sp+0xffffa8c0>
|
|
800005a8: 00f707b3 add a5,a4,a5
|
|
800005ac: 0007a023 sw zero,0(a5)
|
|
800005b0: fe442783 lw a5,-28(s0)
|
|
800005b4: 00178793 addi a5,a5,1
|
|
800005b8: fef42223 sw a5,-28(s0)
|
|
800005bc: fe442783 lw a5,-28(s0)
|
|
800005c0: fe042703 lw a4,-32(s0)
|
|
800005c4: fce7eae3 bltu a5,a4,80000598 <vx_wait_for_warps+0x88>
|
|
800005c8: 00000013 nop
|
|
800005cc: 02c12083 lw ra,44(sp)
|
|
800005d0: 02812403 lw s0,40(sp)
|
|
800005d4: 03010113 addi sp,sp,48
|
|
800005d8: 00008067 ret
|
|
|
|
# vx_get_arg_struct
# Out: a0 = current value of s7 (vx_createThreads copies its a3 into s7).
# Frame: 16 bytes; s0 at 12(sp), s7 at 8(sp); both are restored before return.
800005dc <vx_get_arg_struct>:
|
|
800005dc: ff010113 addi sp,sp,-16
|
|
800005e0: 00812623 sw s0,12(sp)
|
|
800005e4: 01712423 sw s7,8(sp)
|
|
800005e8: 01010413 addi s0,sp,16
|
|
800005ec: 000b8793 mv a5,s7
|
|
800005f0: 00078513 mv a0,a5
|
|
800005f4: 00c12403 lw s0,12(sp)
|
|
800005f8: 00812b83 lw s7,8(sp)
|
|
800005fc: 01010113 addi sp,sp,16
|
|
80000600: 00008067 ret
|
|
|
|
# queue_initialize
# In: a0 = address of a queue record.
# Writes the five header words: +0 = 0, +4 = 0, +8 = 0, +12 = 7, +16 = 0.
# In the other queue_* routines +0 is the dequeue index, +4 the enqueue index
# and +8 the element count; +12 and +16 are only read by queue_availableWarps.
# Clobbers t0, t1, t2.
80000604 <queue_initialize>:
|
|
80000604: 00050293 mv t0,a0
|
|
80000608: 00000313 li t1,0
|
|
8000060c: 00700393 li t2,7
|
|
80000610: 0062a023 sw t1,0(t0)
|
|
80000614: 0062a223 sw t1,4(t0)
|
|
80000618: 0062a423 sw t1,8(t0)
|
|
8000061c: 0072a623 sw t2,12(t0)
|
|
80000620: 0062a823 sw t1,16(t0)
|
|
80000624: 00008067 ret
|
|
|
|
# queue_enqueue
# In: a0 = address of a queue record, a1 = address of a 6-word element.
# Increments the count at +8, copies the six words at a1 into the slot at
# a0 + 20 + 32 * (enqueue index from +4), then advances the enqueue index,
# wrapping it to 0 when it reaches 50, and stores it back to +4.
# Clobbers t0, t1, t2, t3, t4, t5. No fullness check is made here.
# NOTE(review): slots are 32 bytes apart and the index wraps at 50, i.e. up to
# 20 + 50*32 = 1620 bytes per queue, but the callers in this listing place
# consecutive queues only 1220 bytes apart (= 20 + 50*24). Slots with index 37
# or higher would therefore overlap the next queue — confirm the intended slot
# size.
80000628 <queue_enqueue>:
|
|
80000628: 00050293 mv t0,a0
|
|
# count++
8000062c: 0082a303 lw t1,8(t0)
|
|
80000630: 00130313 addi t1,t1,1
|
|
80000634: 0062a423 sw t1,8(t0)
|
|
# t1 = a0 + 20 + (enqueue index << 5)
80000638: 01428313 addi t1,t0,20
|
|
8000063c: 0042ae83 lw t4,4(t0)
|
|
80000640: 005e9393 slli t2,t4,0x5
|
|
80000644: 00730333 add t1,t1,t2
|
|
80000648: 0005ae03 lw t3,0(a1)
|
|
8000064c: 01c32023 sw t3,0(t1)
|
|
80000650: 0045ae03 lw t3,4(a1)
|
|
80000654: 01c32223 sw t3,4(t1)
|
|
80000658: 0085ae03 lw t3,8(a1)
|
|
8000065c: 01c32423 sw t3,8(t1)
|
|
80000660: 00c5ae03 lw t3,12(a1)
|
|
80000664: 01c32623 sw t3,12(t1)
|
|
80000668: 0105ae03 lw t3,16(a1)
|
|
8000066c: 01c32823 sw t3,16(t1)
|
|
80000670: 0145ae03 lw t3,20(a1)
|
|
80000674: 01c32a23 sw t3,20(t1)
|
|
# enqueue index++, wrap to 0 at 50
80000678: 001e8e93 addi t4,t4,1
|
|
8000067c: 03200f13 li t5,50
|
|
80000680: 01ee9463 bne t4,t5,80000688 <ec>
|
|
80000684: 00000e93 li t4,0
|
|
|
|
80000688 <ec>:
|
|
80000688: 01d2a223 sw t4,4(t0)
|
|
8000068c: 00008067 ret
|
|
|
|
# queue_dequeue
# In: a0 = address of a queue record, a1 = address of a 6-word output buffer.
# Decrements the count at +8, reads the dequeue index from +0, stores the
# advanced index (wrapping to 0 at 50) back to +0, then copies the six words of
# the slot at a0 + 20 + 32 * (old index) into the buffer at a1.
# Clobbers t0, t1, t2, t3, t4, t5, t6. No emptiness check is made here; callers
# in this listing call queue_isEmpty first.
# NOTE(review): same 32-byte slot stride as queue_enqueue, which does not fit
# the 1220-byte spacing between queues used by the callers — confirm.
80000690 <queue_dequeue>:
|
|
80000690: 00050293 mv t0,a0
|
|
# count--
80000694: 0082a303 lw t1,8(t0)
|
|
80000698: fff30313 addi t1,t1,-1
|
|
8000069c: 0062a423 sw t1,8(t0)
|
|
800006a0: 01428313 addi t1,t0,20
|
|
# t4 = old dequeue index, t5 = next index (wraps to 0 at 50)
800006a4: 0002ae83 lw t4,0(t0)
|
|
800006a8: 03200f93 li t6,50
|
|
800006ac: 000e8f13 mv t5,t4
|
|
800006b0: 001f0f13 addi t5,t5,1
|
|
800006b4: 01ff1463 bne t5,t6,800006bc <dc>
|
|
800006b8: 00000f13 li t5,0
|
|
|
|
800006bc <dc>:
|
|
800006bc: 01e2a023 sw t5,0(t0)
|
|
# t1 = a0 + 20 + (old index << 5)
800006c0: 005e9393 slli t2,t4,0x5
|
|
800006c4: 00730333 add t1,t1,t2
|
|
800006c8: 00032e03 lw t3,0(t1)
|
|
800006cc: 01c5a023 sw t3,0(a1)
|
|
800006d0: 00432e03 lw t3,4(t1)
|
|
800006d4: 01c5a223 sw t3,4(a1)
|
|
800006d8: 00832e03 lw t3,8(t1)
|
|
800006dc: 01c5a423 sw t3,8(a1)
|
|
800006e0: 00c32e03 lw t3,12(t1)
|
|
800006e4: 01c5a623 sw t3,12(a1)
|
|
800006e8: 01032e03 lw t3,16(t1)
|
|
800006ec: 01c5a823 sw t3,16(a1)
|
|
800006f0: 01432e03 lw t3,20(t1)
|
|
800006f4: 01c5aa23 sw t3,20(a1)
|
|
800006f8: 00008067 ret
|
|
|
|
# queue_isFull
# In:  a0 = address of a queue record.
# Out: a0 = 1 if the count word at +8 equals 50, otherwise 0.
# Clobbers t0, t1, t3.
800006fc <queue_isFull>:
|
|
800006fc: 00050293 mv t0,a0
|
|
80000700: 0082a303 lw t1,8(t0)
|
|
80000704: 00000513 li a0,0
|
|
80000708: 03200e13 li t3,50
|
|
8000070c: 006e1463 bne t3,t1,80000714 <qf>
|
|
80000710: 00150513 addi a0,a0,1
|
|
|
|
80000714 <qf>:
|
|
80000714: 00008067 ret
|
|
|
|
# queue_isEmpty
# In:  a0 = address of a queue record.
# Out: a0 = 1 if the count word at +8 equals 0, otherwise 0.
# Clobbers t0, t1, t3.
80000718 <queue_isEmpty>:
|
|
80000718: 00050293 mv t0,a0
|
|
8000071c: 0082a303 lw t1,8(t0)
|
|
80000720: 00000513 li a0,0
|
|
80000724: 00000e13 li t3,0
|
|
80000728: 006e1463 bne t3,t1,80000730 <qe>
|
|
8000072c: 00150513 addi a0,a0,1
|
|
|
|
80000730 <qe>:
|
|
80000730: 00008067 ret
|
|
|
|
# queue_availableWarps
# In:  a0 = address of a queue record.
# Out: a0 = 1 if the word at +16 is below the word at +12 (unsigned compare),
#      otherwise 0. queue_initialize sets +12 to 7 and +16 to 0; nothing else in
#      the visible part of this listing writes those two words.
# Clobbers t0, t1, t2.
80000734 <queue_availableWarps>:
|
|
80000734: 00050293 mv t0,a0
|
|
80000738: 00c2a303 lw t1,12(t0)
|
|
8000073c: 0102a383 lw t2,16(t0)
|
|
80000740: 0063b533 sltu a0,t2,t1
|
|
80000744: 00008067 ret
|
|
|
|
# vx_print_str
# In: a0 = address of a zero-terminated byte string.
# For every byte up to (not including) the terminating zero, loads the byte
# into a1 and calls vx_printc. ra and the caller's a1 are saved on the stack
# and restored; a0 is left pointing at the terminating zero byte on return.
# Relies on vx_printc leaving a0 unchanged (it only writes a7).
# NOTE(review): the 12-byte frame leaves sp not 16-byte aligned, which the
# standard RISC-V calling convention requires at calls — confirm whether this
# target depends on that alignment.
80000748 <vx_print_str>:
|
|
80000748: ff410113 addi sp,sp,-12
|
|
8000074c: 00112023 sw ra,0(sp)
|
|
80000750: 00b12223 sw a1,4(sp)
|
|
|
|
80000754 <bl>:
|
|
80000754: 00054583 lbu a1,0(a0)
|
|
# stop at the terminating zero byte
80000758: 00058863 beqz a1,80000768 <be>
|
|
8000075c: 01c000ef jal ra,80000778 <vx_printc>
|
|
80000760: 00150513 addi a0,a0,1
|
|
80000764: ff1ff06f j 80000754 <bl>
|
|
|
|
80000768 <be>:
|
|
80000768: 00012083 lw ra,0(sp)
|
|
8000076c: 00412583 lw a1,4(sp)
|
|
80000770: 00c10113 addi sp,sp,12
|
|
80000774: 00008067 ret
|
|
|
|
# vx_printc
# In: a1 = value to emit (vx_print_str passes one zero-extended byte).
# Stores the full 32-bit a1 to address 0x00010000 and returns.
# Clobbers a7. Presumably 0x10000 is a memory-mapped output port — confirm
# against the platform memory map.
80000778 <vx_printc>:
|
|
80000778: 000108b7 lui a7,0x10
|
|
8000077c: 00b8a023 sw a1,0(a7) # 10000 <SIZE+0xffce>
|
|
80000780: 00008067 ret
|
|
|
|
# vx_print_hex
# In: a0 = 32-bit value to print.
# Uses the table of 16 word-sized string addresses at 0x810001bc, indexed by
# nibble value, and prints through vx_print_str.
#  - If a0 <= 15 (unsigned) prints table[a0] and returns.
#  - Otherwise walks the eight nibbles from most to least significant
#    (shift = 28, 24, ..., 0) and prints table[nibble] for each one, skipping
#    leading zero nibbles by means of a "started" flag.
# Frame: 48 bytes; ra at 44(sp), s0 at 40(sp); value at -36(s0), bit position at
#        -20(s0), started flag (byte) at -21(s0), current nibble at -28(s0).
80000784 <vx_print_hex>:
|
|
80000784: fd010113 addi sp,sp,-48
|
|
80000788: 02112623 sw ra,44(sp)
|
|
8000078c: 02812423 sw s0,40(sp)
|
|
80000790: 03010413 addi s0,sp,48
|
|
80000794: fca42e23 sw a0,-36(s0)
|
|
80000798: fdc42703 lw a4,-36(s0)
|
|
8000079c: 00f00793 li a5,15
|
|
# values above 15 take the multi-digit path
800007a0: 02e7e463 bltu a5,a4,800007c8 <vx_print_hex+0x44>
|
|
# single digit: a0 = word at 0x810001bc + 4 * value
800007a4: 810007b7 lui a5,0x81000
|
|
800007a8: fdc42703 lw a4,-36(s0)
|
|
800007ac: 00271713 slli a4,a4,0x2
|
|
800007b0: 1bc78793 addi a5,a5,444 # 810001bc <main_sp+0xffffa800>
|
|
800007b4: 00f707b3 add a5,a4,a5
|
|
800007b8: 0007a783 lw a5,0(a5)
|
|
800007bc: 00078513 mv a0,a5
|
|
800007c0: f89ff0ef jal ra,80000748 <vx_print_str>
|
|
800007c4: 0740006f j 80000838 <vx_print_hex+0xb4>
|
|
# multi-digit path: bit position = 32, started = 0
800007c8: 02000793 li a5,32
|
|
800007cc: fef42623 sw a5,-20(s0)
|
|
800007d0: fe0405a3 sb zero,-21(s0)
|
|
# nibble = (value >> (bit position - 4)) & 15
800007d4: fec42783 lw a5,-20(s0)
|
|
800007d8: ffc78793 addi a5,a5,-4
|
|
800007dc: fdc42703 lw a4,-36(s0)
|
|
800007e0: 00f757b3 srl a5,a4,a5
|
|
800007e4: 00f7f793 andi a5,a5,15
|
|
800007e8: fef42223 sw a5,-28(s0)
|
|
800007ec: fe442783 lw a5,-28(s0)
|
|
800007f0: 00078663 beqz a5,800007fc <vx_print_hex+0x78>
|
|
# first non-zero nibble seen: started = 1
800007f4: 00100793 li a5,1
|
|
800007f8: fef405a3 sb a5,-21(s0)
|
|
800007fc: feb44783 lbu a5,-21(s0)
|
|
# leading zero nibbles are not printed
80000800: 02078263 beqz a5,80000824 <vx_print_hex+0xa0>
|
|
80000804: 810007b7 lui a5,0x81000
|
|
80000808: fe442703 lw a4,-28(s0)
|
|
8000080c: 00271713 slli a4,a4,0x2
|
|
80000810: 1bc78793 addi a5,a5,444 # 810001bc <main_sp+0xffffa800>
|
|
80000814: 00f707b3 add a5,a4,a5
|
|
80000818: 0007a783 lw a5,0(a5)
|
|
8000081c: 00078513 mv a0,a5
|
|
80000820: f29ff0ef jal ra,80000748 <vx_print_str>
|
|
# bit position -= 4; loop while it is still > 0 (signed)
80000824: fec42783 lw a5,-20(s0)
|
|
80000828: ffc78793 addi a5,a5,-4
|
|
8000082c: fef42623 sw a5,-20(s0)
|
|
80000830: fec42783 lw a5,-20(s0)
|
|
80000834: faf040e3 bgtz a5,800007d4 <vx_print_hex+0x50>
|
|
80000838: 02c12083 lw ra,44(sp)
|
|
8000083c: 02812403 lw s0,40(sp)
|
|
80000840: 03010113 addi sp,sp,48
|
|
80000844: 00008067 ret
|
|
|
|
# vx_printf
# In: a0 = address of a zero-terminated string, a1 = 32-bit value.
# Prints the string with vx_print_str, then the value with vx_print_hex, then
# the string at 0x81000080 with vx_print_str. No format-string parsing is done.
# Presumably the string at 0x81000080 is a line terminator — its contents are
# not visible in this listing.
# Frame: 32 bytes; ra at 28(sp), s0 at 24(sp); a0 at -20(s0), a1 at -24(s0).
80000848 <vx_printf>:
|
|
80000848: fe010113 addi sp,sp,-32
|
|
8000084c: 00112e23 sw ra,28(sp)
|
|
80000850: 00812c23 sw s0,24(sp)
|
|
80000854: 02010413 addi s0,sp,32
|
|
80000858: fea42623 sw a0,-20(s0)
|
|
8000085c: feb42423 sw a1,-24(s0)
|
|
80000860: fec42503 lw a0,-20(s0)
|
|
80000864: ee5ff0ef jal ra,80000748 <vx_print_str>
|
|
80000868: fe842503 lw a0,-24(s0)
|
|
8000086c: f19ff0ef jal ra,80000784 <vx_print_hex>
|
|
80000870: 810007b7 lui a5,0x81000
|
|
80000874: 08078513 addi a0,a5,128 # 81000080 <main_sp+0xffffa6c4>
|
|
80000878: ed1ff0ef jal ra,80000748 <vx_print_str>
|
|
8000087c: 00000013 nop
|
|
80000880: 01c12083 lw ra,28(sp)
|
|
80000884: 01812403 lw s0,24(sp)
|
|
80000888: 02010113 addi sp,sp,32
|
|
8000088c: 00008067 ret
|
|
|
|
# vx_sq_mat_mult
# In: a0, a1, a2 = three word-sized values stored into the argument block
#     (_vx_mat_mult uses them as the two input arrays and the output array),
#     a3 = dimension d.
# 1. Fills the argument block at 0x8100295c: +0 = a0, +4 = a1, +8 = a2, +12 = d.
# 2. t = vx_available_threads(); per = ceil(d / t) (divu/remu, rounded up);
#    prints per via vx_printf with the string at 0x810000c4 and stores it at
#    +16 of the argument block.
# 3. Calls vx_spawnWarps(d, min(d, t), 0x800009c4 = _vx_mat_mult, 0x8100295c).
# 4. w = vx_available_warps(); calls vx_wait_for_warps(min(d, w)).
# Frame: 48 bytes; ra at 44(sp), s0 at 40(sp); per at -20(s0), t at -24(s0),
#        w at -28(s0); a0..a3 spilled at -36, -40, -44, -48(s0).
# NOTE(review): the argument block lives at a fixed address, so this routine
# does not look reentrant — confirm.
80000890 <vx_sq_mat_mult>:
|
|
80000890: fd010113 addi sp,sp,-48
|
|
80000894: 02112623 sw ra,44(sp)
|
|
80000898: 02812423 sw s0,40(sp)
|
|
8000089c: 03010413 addi s0,sp,48
|
|
800008a0: fca42e23 sw a0,-36(s0)
|
|
800008a4: fcb42c23 sw a1,-40(s0)
|
|
800008a8: fcc42a23 sw a2,-44(s0)
|
|
800008ac: fcd42823 sw a3,-48(s0)
|
|
# argument block +0 = a0
800008b0: 810037b7 lui a5,0x81003
|
|
800008b4: fdc42703 lw a4,-36(s0)
|
|
800008b8: 94e7ae23 sw a4,-1700(a5) # 8100295c <main_sp+0xffffcfa0>
|
|
# argument block +4 = a1
800008bc: 810037b7 lui a5,0x81003
|
|
800008c0: 95c78793 addi a5,a5,-1700 # 8100295c <main_sp+0xffffcfa0>
|
|
800008c4: fd842703 lw a4,-40(s0)
|
|
800008c8: 00e7a223 sw a4,4(a5)
|
|
# argument block +8 = a2
800008cc: 810037b7 lui a5,0x81003
|
|
800008d0: 95c78793 addi a5,a5,-1700 # 8100295c <main_sp+0xffffcfa0>
|
|
800008d4: fd442703 lw a4,-44(s0)
|
|
800008d8: 00e7a423 sw a4,8(a5)
|
|
# argument block +12 = d
800008dc: 810037b7 lui a5,0x81003
|
|
800008e0: 95c78793 addi a5,a5,-1700 # 8100295c <main_sp+0xffffcfa0>
|
|
800008e4: fd042703 lw a4,-48(s0)
|
|
800008e8: 00e7a623 sw a4,12(a5)
|
|
800008ec: 8d9ff0ef jal ra,800001c4 <vx_available_threads>
|
|
800008f0: fea42423 sw a0,-24(s0)
|
|
# per = d / t (unsigned)
800008f4: fd042703 lw a4,-48(s0)
|
|
800008f8: fe842783 lw a5,-24(s0)
|
|
800008fc: 02f757b3 divu a5,a4,a5
|
|
80000900: fef42623 sw a5,-20(s0)
|
|
# round up when d is not a multiple of t
80000904: fd042703 lw a4,-48(s0)
|
|
80000908: fe842783 lw a5,-24(s0)
|
|
8000090c: 02f777b3 remu a5,a4,a5
|
|
80000910: 00078863 beqz a5,80000920 <vx_sq_mat_mult+0x90>
|
|
80000914: fec42783 lw a5,-20(s0)
|
|
80000918: 00178793 addi a5,a5,1
|
|
8000091c: fef42623 sw a5,-20(s0)
|
|
80000920: fec42583 lw a1,-20(s0)
|
|
80000924: 810007b7 lui a5,0x81000
|
|
80000928: 0c478513 addi a0,a5,196 # 810000c4 <main_sp+0xffffa708>
|
|
8000092c: f1dff0ef jal ra,80000848 <vx_printf>
|
|
# argument block +16 = per
80000930: 810037b7 lui a5,0x81003
|
|
80000934: 95c78793 addi a5,a5,-1700 # 8100295c <main_sp+0xffffcfa0>
|
|
80000938: fec42703 lw a4,-20(s0)
|
|
8000093c: 00e7a823 sw a4,16(a5)
|
|
80000940: fd042703 lw a4,-48(s0)
|
|
80000944: fe842783 lw a5,-24(s0)
|
|
# d < t: pass d as the second argument instead of t
80000948: 02f76263 bltu a4,a5,8000096c <vx_sq_mat_mult+0xdc>
|
|
# vx_spawnWarps(d, t, _vx_mat_mult, argument block)
8000094c: 810037b7 lui a5,0x81003
|
|
80000950: 95c78693 addi a3,a5,-1700 # 8100295c <main_sp+0xffffcfa0>
|
|
80000954: 800017b7 lui a5,0x80001
|
|
80000958: 9c478613 addi a2,a5,-1596 # 800009c4 <main_sp+0xfeffb008>
|
|
8000095c: fe842583 lw a1,-24(s0)
|
|
80000960: fd042503 lw a0,-48(s0)
|
|
80000964: ac1ff0ef jal ra,80000424 <vx_spawnWarps>
|
|
80000968: 0200006f j 80000988 <vx_sq_mat_mult+0xf8>
|
|
# vx_spawnWarps(d, d, _vx_mat_mult, argument block)
8000096c: 810037b7 lui a5,0x81003
|
|
80000970: 95c78693 addi a3,a5,-1700 # 8100295c <main_sp+0xffffcfa0>
|
|
80000974: 800017b7 lui a5,0x80001
|
|
80000978: 9c478613 addi a2,a5,-1596 # 800009c4 <main_sp+0xfeffb008>
|
|
8000097c: fd042583 lw a1,-48(s0)
|
|
80000980: fd042503 lw a0,-48(s0)
|
|
80000984: aa1ff0ef jal ra,80000424 <vx_spawnWarps>
|
|
80000988: 835ff0ef jal ra,800001bc <vx_available_warps>
|
|
8000098c: fea42223 sw a0,-28(s0)
|
|
80000990: fd042703 lw a4,-48(s0)
|
|
80000994: fe442783 lw a5,-28(s0)
|
|
# w >= d: wait for d; otherwise wait for w
80000998: 00e7f863 bgeu a5,a4,800009a8 <vx_sq_mat_mult+0x118>
|
|
8000099c: fe442503 lw a0,-28(s0)
|
|
800009a0: b71ff0ef jal ra,80000510 <vx_wait_for_warps>
|
|
800009a4: 00c0006f j 800009b0 <vx_sq_mat_mult+0x120>
|
|
800009a8: fd042503 lw a0,-48(s0)
|
|
800009ac: b65ff0ef jal ra,80000510 <vx_wait_for_warps>
|
|
800009b0: 00000013 nop
|
|
800009b4: 02c12083 lw ra,44(sp)
|
|
800009b8: 02812403 lw s0,40(sp)
|
|
800009bc: 03010113 addi sp,sp,48
|
|
800009c0: 00008067 ret
|
|
|
|
# _vx_mat_mult
# In: a0 and a1 = two indices (spilled at -84(s0) and -88(s0)); the argument
#     block address is obtained from vx_get_arg_struct (register s7).
# Argument block layout as read here: +0 = A, +4 = B, +8 = C (base addresses of
# arrays of 32-bit words), +12 = n, +16 = per.
# Computes, with col starting at per * a0 (or at a0 with per forced to 1 when
# per == 0), for each of the per iterations:
#     C[a1 * n + col] = sum over j in 0 .. n-1 of A[a1 * n + j] * B[n * j + col]
# and then increments col.
# Presumably a0 is the thread index and a1 the row / job index supplied by the
# spawning code — confirm against vx_createThreads and the custom instructions.
# Frame: 96 bytes; ra at 92(sp), s0 at 88(sp). Locals: per -20, col -24,
#        iteration counter -28, sum -32, j -36, argument block -40, A -44,
#        B -48, C -52, n -56 (all relative to s0).
800009c4 <_vx_mat_mult>:
|
|
800009c4: fa010113 addi sp,sp,-96
|
|
800009c8: 04112e23 sw ra,92(sp)
|
|
800009cc: 04812c23 sw s0,88(sp)
|
|
800009d0: 06010413 addi s0,sp,96
|
|
800009d4: faa42623 sw a0,-84(s0)
|
|
800009d8: fab42423 sw a1,-88(s0)
|
|
800009dc: c01ff0ef jal ra,800005dc <vx_get_arg_struct>
|
|
800009e0: fca42c23 sw a0,-40(s0)
|
|
# A = block[+0]
800009e4: fd842783 lw a5,-40(s0)
|
|
800009e8: 0007a783 lw a5,0(a5)
|
|
800009ec: fcf42a23 sw a5,-44(s0)
|
|
# B = block[+4]
800009f0: fd842783 lw a5,-40(s0)
|
|
800009f4: 0047a783 lw a5,4(a5)
|
|
800009f8: fcf42823 sw a5,-48(s0)
|
|
# C = block[+8]
800009fc: fd842783 lw a5,-40(s0)
|
|
80000a00: 0087a783 lw a5,8(a5)
|
|
80000a04: fcf42623 sw a5,-52(s0)
|
|
# per = block[+16]
80000a08: fd842783 lw a5,-40(s0)
|
|
80000a0c: 0107a783 lw a5,16(a5)
|
|
80000a10: fef42623 sw a5,-20(s0)
|
|
# col = per * a0
80000a14: fec42703 lw a4,-20(s0)
|
|
80000a18: fac42783 lw a5,-84(s0)
|
|
80000a1c: 02f707b3 mul a5,a4,a5
|
|
80000a20: fef42423 sw a5,-24(s0)
|
|
80000a24: fec42783 lw a5,-20(s0)
|
|
80000a28: 00079a63 bnez a5,80000a3c <_vx_mat_mult+0x78>
|
|
# per == 0: use per = 1 and col = a0
80000a2c: 00100793 li a5,1
|
|
80000a30: fef42623 sw a5,-20(s0)
|
|
80000a34: fac42783 lw a5,-84(s0)
|
|
80000a38: fef42423 sw a5,-24(s0)
|
|
# n = block[+12]
80000a3c: fd842783 lw a5,-40(s0)
|
|
80000a40: 00c7a783 lw a5,12(a5)
|
|
80000a44: fcf42423 sw a5,-56(s0)
|
|
# iteration counter = 0
80000a48: fe042223 sw zero,-28(s0)
|
|
80000a4c: 0d80006f j 80000b24 <_vx_mat_mult+0x160>
|
|
# outer body: sum = 0, j = 0
80000a50: fe042023 sw zero,-32(s0)
|
|
80000a54: fc042e23 sw zero,-36(s0)
|
|
80000a58: 0780006f j 80000ad0 <_vx_mat_mult+0x10c>
|
|
# index into A = a1 * n + j
80000a5c: fa842703 lw a4,-88(s0)
|
|
80000a60: fc842783 lw a5,-56(s0)
|
|
80000a64: 02f707b3 mul a5,a4,a5
|
|
80000a68: fdc42703 lw a4,-36(s0)
|
|
80000a6c: 00f707b3 add a5,a4,a5
|
|
80000a70: fcf42223 sw a5,-60(s0)
|
|
# index into B = n * j + col
80000a74: fc842703 lw a4,-56(s0)
|
|
80000a78: fdc42783 lw a5,-36(s0)
|
|
80000a7c: 02f707b3 mul a5,a4,a5
|
|
80000a80: fe842703 lw a4,-24(s0)
|
|
80000a84: 00f707b3 add a5,a4,a5
|
|
80000a88: fcf42023 sw a5,-64(s0)
|
|
# sum += A[index into A] * B[index into B] (4-byte elements)
80000a8c: fc442783 lw a5,-60(s0)
|
|
80000a90: 00279793 slli a5,a5,0x2
|
|
80000a94: fd442703 lw a4,-44(s0)
|
|
80000a98: 00f707b3 add a5,a4,a5
|
|
80000a9c: 0007a703 lw a4,0(a5)
|
|
80000aa0: fc042783 lw a5,-64(s0)
|
|
80000aa4: 00279793 slli a5,a5,0x2
|
|
80000aa8: fd042683 lw a3,-48(s0)
|
|
80000aac: 00f687b3 add a5,a3,a5
|
|
80000ab0: 0007a783 lw a5,0(a5)
|
|
80000ab4: 02f707b3 mul a5,a4,a5
|
|
80000ab8: fe042703 lw a4,-32(s0)
|
|
80000abc: 00f707b3 add a5,a4,a5
|
|
80000ac0: fef42023 sw a5,-32(s0)
|
|
# j++
80000ac4: fdc42783 lw a5,-36(s0)
|
|
80000ac8: 00178793 addi a5,a5,1
|
|
80000acc: fcf42e23 sw a5,-36(s0)
|
|
# inner condition: continue while j < n (unsigned)
80000ad0: fdc42703 lw a4,-36(s0)
|
|
80000ad4: fc842783 lw a5,-56(s0)
|
|
80000ad8: f8f762e3 bltu a4,a5,80000a5c <_vx_mat_mult+0x98>
|
|
# C[a1 * n + col] = sum
80000adc: fa842703 lw a4,-88(s0)
|
|
80000ae0: fc842783 lw a5,-56(s0)
|
|
80000ae4: 02f70733 mul a4,a4,a5
|
|
80000ae8: fe842783 lw a5,-24(s0)
|
|
80000aec: 00f707b3 add a5,a4,a5
|
|
80000af0: faf42e23 sw a5,-68(s0)
|
|
80000af4: fbc42783 lw a5,-68(s0)
|
|
80000af8: 00279793 slli a5,a5,0x2
|
|
80000afc: fcc42703 lw a4,-52(s0)
|
|
80000b00: 00f707b3 add a5,a4,a5
|
|
80000b04: fe042703 lw a4,-32(s0)
|
|
80000b08: 00e7a023 sw a4,0(a5)
|
|
# col++
80000b0c: fe842783 lw a5,-24(s0)
|
|
80000b10: 00178793 addi a5,a5,1
|
|
80000b14: fef42423 sw a5,-24(s0)
|
|
# iteration counter++
80000b18: fe442783 lw a5,-28(s0)
|
|
80000b1c: 00178793 addi a5,a5,1
|
|
80000b20: fef42223 sw a5,-28(s0)
|
|
# outer condition: continue while iteration counter < per (unsigned)
80000b24: fe442783 lw a5,-28(s0)
|
|
80000b28: fec42703 lw a4,-20(s0)
|
|
80000b2c: f2e7e2e3 bltu a5,a4,80000a50 <_vx_mat_mult+0x8c>
|
|
80000b30: 00000013 nop
|
|
80000b34: 05c12083 lw ra,92(sp)
|
|
80000b38: 05812403 lw s0,88(sp)
|
|
80000b3c: 06010113 addi sp,sp,96
|
|
80000b40: 00008067 ret
|
|
|
|
# vx_mat_add: launcher for the _vx_mat_add worker (0x80000c7c).
# Copies its five arguments and a per-thread iteration count into the argument
# block at 0x81002970, calls vx_spawnWarps, then calls vx_wait_for_warps.
#   a0 -> block+0, a1 -> block+4   (read as word arrays by _vx_mat_add)
#   a2 -> block+8                  (written as a word array by _vx_mat_add)
#   a3 -> block+16, also the first argument of vx_spawnWarps
#   a4 -> block+12, divided by the vx_available_threads result below
# Stack slots: -20(s0) iterations per thread, -24(s0) available threads,
#              -28(s0) available warps, -36..-52(s0) spilled a0..a4.
80000b44 <vx_mat_add>:
|
|
80000b44: fc010113 addi sp,sp,-64 # allocate a 64-byte frame
|
|
80000b48: 02112e23 sw ra,60(sp)
|
|
80000b4c: 02812c23 sw s0,56(sp)
|
|
80000b50: 04010413 addi s0,sp,64 # s0 = frame pointer (sp on entry)
|
|
80000b54: fca42e23 sw a0,-36(s0) # spill a0..a4 to the frame
|
|
80000b58: fcb42c23 sw a1,-40(s0)
|
|
80000b5c: fcc42a23 sw a2,-44(s0)
|
|
80000b60: fcd42823 sw a3,-48(s0)
|
|
80000b64: fce42623 sw a4,-52(s0)
|
|
80000b68: 810037b7 lui a5,0x81003
|
|
80000b6c: fdc42703 lw a4,-36(s0)
|
|
80000b70: 96e7a823 sw a4,-1680(a5) # 81002970 <main_sp+0xffffcfb4> -- block+0 = a0
|
|
80000b74: 810037b7 lui a5,0x81003
|
|
80000b78: 97078793 addi a5,a5,-1680 # 81002970 <main_sp+0xffffcfb4>
|
|
80000b7c: fd842703 lw a4,-40(s0)
|
|
80000b80: 00e7a223 sw a4,4(a5) # block+4 = a1
|
|
80000b84: 810037b7 lui a5,0x81003
|
|
80000b88: 97078793 addi a5,a5,-1680 # 81002970 <main_sp+0xffffcfb4>
|
|
80000b8c: fd442703 lw a4,-44(s0)
|
|
80000b90: 00e7a423 sw a4,8(a5) # block+8 = a2
|
|
80000b94: 810037b7 lui a5,0x81003
|
|
80000b98: 97078793 addi a5,a5,-1680 # 81002970 <main_sp+0xffffcfb4>
|
|
80000b9c: fcc42703 lw a4,-52(s0)
|
|
80000ba0: 00e7a623 sw a4,12(a5) # block+12 = a4
|
|
80000ba4: 810037b7 lui a5,0x81003
|
|
80000ba8: 97078793 addi a5,a5,-1680 # 81002970 <main_sp+0xffffcfb4>
|
|
80000bac: fd042703 lw a4,-48(s0)
|
|
80000bb0: 00e7a823 sw a4,16(a5) # block+16 = a3
|
|
80000bb4: e10ff0ef jal ra,800001c4 <vx_available_threads>
|
|
80000bb8: fea42423 sw a0,-24(s0) # -24(s0) = available threads
|
|
80000bbc: fcc42703 lw a4,-52(s0)
|
|
80000bc0: fe842783 lw a5,-24(s0)
|
|
80000bc4: 02f757b3 divu a5,a4,a5 # a4 / threads (unsigned); no zero check on the divisor is visible here
|
|
80000bc8: fef42623 sw a5,-20(s0) # -20(s0) = quotient
|
|
80000bcc: fcc42703 lw a4,-52(s0)
|
|
80000bd0: fe842783 lw a5,-24(s0)
|
|
80000bd4: 02f777b3 remu a5,a4,a5
|
|
80000bd8: 00078863 beqz a5,80000be8 <vx_mat_add+0xa4> # exact division: keep the quotient
|
|
80000bdc: fec42783 lw a5,-20(s0)
|
|
80000be0: 00178793 addi a5,a5,1 # non-zero remainder: round the quotient up
|
|
80000be4: fef42623 sw a5,-20(s0)
|
|
80000be8: 810037b7 lui a5,0x81003
|
|
80000bec: 97078793 addi a5,a5,-1680 # 81002970 <main_sp+0xffffcfb4>
|
|
80000bf0: fec42703 lw a4,-20(s0)
|
|
80000bf4: 00e7aa23 sw a4,20(a5) # block+20 = iterations per thread
|
|
80000bf8: fcc42703 lw a4,-52(s0)
|
|
80000bfc: fe842783 lw a5,-24(s0)
|
|
80000c00: 02f76263 bltu a4,a5,80000c24 <vx_mat_add+0xe0> # a4 < threads: spawn with a1 = a4 instead
|
|
80000c04: 810037b7 lui a5,0x81003
|
|
80000c08: 97078693 addi a3,a5,-1680 # 81002970 <main_sp+0xffffcfb4> -- a3 = &block
|
|
80000c0c: 800017b7 lui a5,0x80001
|
|
80000c10: c7c78613 addi a2,a5,-900 # 80000c7c <main_sp+0xfeffb2c0> -- a2 = 0x80000c7c, the address labelled _vx_mat_add
|
|
80000c14: fe842583 lw a1,-24(s0) # a1 = available threads
|
|
80000c18: fd042503 lw a0,-48(s0) # a0 = original a3
|
|
80000c1c: 809ff0ef jal ra,80000424 <vx_spawnWarps>
|
|
80000c20: 0200006f j 80000c40 <vx_mat_add+0xfc>
|
|
80000c24: 810037b7 lui a5,0x81003
|
|
80000c28: 97078693 addi a3,a5,-1680 # 81002970 <main_sp+0xffffcfb4> -- a3 = &block
|
|
80000c2c: 800017b7 lui a5,0x80001
|
|
80000c30: c7c78613 addi a2,a5,-900 # 80000c7c <main_sp+0xfeffb2c0> -- a2 = 0x80000c7c, the address labelled _vx_mat_add
|
|
80000c34: fcc42583 lw a1,-52(s0) # a1 = original a4
|
|
80000c38: fd042503 lw a0,-48(s0) # a0 = original a3
|
|
80000c3c: fe8ff0ef jal ra,80000424 <vx_spawnWarps>
|
|
80000c40: d7cff0ef jal ra,800001bc <vx_available_warps>
|
|
80000c44: fea42223 sw a0,-28(s0) # -28(s0) = available warps
|
|
80000c48: fd042703 lw a4,-48(s0)
|
|
80000c4c: fe442783 lw a5,-28(s0)
|
|
80000c50: 00e7f863 bgeu a5,a4,80000c60 <vx_mat_add+0x11c> # warps >= a3: wait on a3
|
|
80000c54: fe442503 lw a0,-28(s0) # otherwise wait on the available-warp count
|
|
80000c58: 8b9ff0ef jal ra,80000510 <vx_wait_for_warps>
|
|
80000c5c: 00c0006f j 80000c68 <vx_mat_add+0x124>
|
|
80000c60: fd042503 lw a0,-48(s0)
|
|
80000c64: 8adff0ef jal ra,80000510 <vx_wait_for_warps>
|
|
80000c68: 00000013 nop
|
|
80000c6c: 03c12083 lw ra,60(sp) # restore ra/s0 and release the frame
|
|
80000c70: 03812403 lw s0,56(sp)
|
|
80000c74: 04010113 addi sp,sp,64
|
|
80000c78: 00008067 ret
|
|
|
|
# _vx_mat_add: worker whose address vx_mat_add passes to vx_spawnWarps.
# Fetches the argument block via vx_get_arg_struct and, for each iteration,
# stores src0[idx] + src1[idx] into dst[idx] (32-bit words), where
#   idx = a1 * (block+12) + pos, and pos starts at a0 * (block+20).
#   a0 -> -68(s0), a1 -> -72(s0)
#   NOTE(review): a0/a1 are presumably thread id and warp id -- confirm against vx_spawnWarps.
# Stack slots: -20 iteration count, -24 pos, -28 loop counter, -32 block pointer,
#              -36 src0, -40 src1, -44 dst, -48 block+12, -52 idx, -56/-57 bounds flags.
80000c7c <_vx_mat_add>:
|
|
80000c7c: fb010113 addi sp,sp,-80 # allocate an 80-byte frame
|
|
80000c80: 04112623 sw ra,76(sp)
|
|
80000c84: 04812423 sw s0,72(sp)
|
|
80000c88: 05010413 addi s0,sp,80
|
|
80000c8c: faa42e23 sw a0,-68(s0)
|
|
80000c90: fab42c23 sw a1,-72(s0)
|
|
80000c94: 949ff0ef jal ra,800005dc <vx_get_arg_struct>
|
|
80000c98: fea42023 sw a0,-32(s0) # -32(s0) = argument block pointer
|
|
80000c9c: fe042783 lw a5,-32(s0)
|
|
80000ca0: 0007a783 lw a5,0(a5)
|
|
80000ca4: fcf42e23 sw a5,-36(s0) # src0 = block+0
|
|
80000ca8: fe042783 lw a5,-32(s0)
|
|
80000cac: 0047a783 lw a5,4(a5)
|
|
80000cb0: fcf42c23 sw a5,-40(s0) # src1 = block+4
|
|
80000cb4: fe042783 lw a5,-32(s0)
|
|
80000cb8: 0087a783 lw a5,8(a5)
|
|
80000cbc: fcf42a23 sw a5,-44(s0) # dst = block+8
|
|
80000cc0: fe042783 lw a5,-32(s0)
|
|
80000cc4: 0147a783 lw a5,20(a5)
|
|
80000cc8: fef42623 sw a5,-20(s0) # iteration count = block+20
|
|
80000ccc: fec42703 lw a4,-20(s0)
|
|
80000cd0: fbc42783 lw a5,-68(s0)
|
|
80000cd4: 02f707b3 mul a5,a4,a5
|
|
80000cd8: fef42423 sw a5,-24(s0) # pos = count * a0
|
|
80000cdc: fec42783 lw a5,-20(s0)
|
|
80000ce0: 00079a63 bnez a5,80000cf4 <_vx_mat_add+0x78>
|
|
80000ce4: 00100793 li a5,1 # count == 0: run one iteration
|
|
80000ce8: fef42623 sw a5,-20(s0)
|
|
80000cec: fbc42783 lw a5,-68(s0)
|
|
80000cf0: fef42423 sw a5,-24(s0) # ... starting at pos = a0
|
|
80000cf4: fe042783 lw a5,-32(s0)
|
|
80000cf8: 00c7a783 lw a5,12(a5)
|
|
80000cfc: fcf42823 sw a5,-48(s0) # -48(s0) = block+12
|
|
80000d00: fe042223 sw zero,-28(s0) # loop counter = 0
|
|
80000d04: 0c00006f j 80000dc4 <_vx_mat_add+0x148> # enter at the loop condition
|
|
80000d08: fb842703 lw a4,-72(s0) # --- loop body ---
|
|
80000d0c: fd042783 lw a5,-48(s0)
|
|
80000d10: 02f70733 mul a4,a4,a5
|
|
80000d14: fe842783 lw a5,-24(s0)
|
|
80000d18: 00f707b3 add a5,a4,a5
|
|
80000d1c: fcf42623 sw a5,-52(s0) # idx = a1 * (block+12) + pos
|
|
80000d20: fe842703 lw a4,-24(s0)
|
|
80000d24: fd042783 lw a5,-48(s0)
|
|
80000d28: 00f737b3 sltu a5,a4,a5 # 1 when pos < block+12 (unsigned)
|
|
80000d2c: 0ff7f793 andi a5,a5,255
|
|
80000d30: fcf42423 sw a5,-56(s0)
|
|
80000d34: fc842783 lw a5,-56(s0)
|
|
80000d38: 0017b793 seqz a5,a5 # invert: 1 when pos >= block+12
|
|
80000d3c: fcf403a3 sb a5,-57(s0)
|
|
80000d40: fc744783 lbu a5,-57(s0)
|
|
80000d44: 00078f13 mv t5,a5 # t5 = out-of-range flag
|
|
80000d48: 800017b7 lui a5,0x80001
|
|
80000d4c: db078f93 addi t6,a5,-592 # 80000db0 <main_sp+0xfeffb3f4> -- t6 = 0x80000db0, the nop below
|
|
80000d50: 000f206b 0xf206b # word not decoded by objdump; NOTE(review): presumably a Vortex split on t5 -- confirm against the Vortex ISA
|
|
80000d54: 01ff707b 0x1ff707b # word not decoded by objdump; NOTE(review): presumably a predicated jump using t5/t6 -- confirm
|
|
80000d58: fcc42783 lw a5,-52(s0)
|
|
80000d5c: 00279793 slli a5,a5,0x2 # idx * 4: word offset
|
|
80000d60: fdc42703 lw a4,-36(s0)
|
|
80000d64: 00f707b3 add a5,a4,a5
|
|
80000d68: 0007a683 lw a3,0(a5) # a3 = src0[idx]
|
|
80000d6c: fcc42783 lw a5,-52(s0)
|
|
80000d70: 00279793 slli a5,a5,0x2
|
|
80000d74: fd842703 lw a4,-40(s0)
|
|
80000d78: 00f707b3 add a5,a4,a5
|
|
80000d7c: 0007a703 lw a4,0(a5) # a4 = src1[idx]
|
|
80000d80: fcc42783 lw a5,-52(s0)
|
|
80000d84: 00279793 slli a5,a5,0x2
|
|
80000d88: fd442603 lw a2,-44(s0)
|
|
80000d8c: 00f607b3 add a5,a2,a5 # a5 = &dst[idx]
|
|
80000d90: 00e68733 add a4,a3,a4
|
|
80000d94: 00e7a023 sw a4,0(a5) # dst[idx] = src0[idx] + src1[idx]
|
|
80000d98: fe842783 lw a5,-24(s0)
|
|
80000d9c: 00178793 addi a5,a5,1
|
|
80000da0: fef42423 sw a5,-24(s0) # pos++
|
|
80000da4: 800017b7 lui a5,0x80001
|
|
80000da8: db478e13 addi t3,a5,-588 # 80000db4 <main_sp+0xfeffb3f8> -- t3 = 0x80000db4
|
|
80000dac: 000e0067 jr t3 # jump past the nop at 0x80000db0
|
|
80000db0: 00000013 nop # address that was loaded into t6 above
|
|
80000db4: 0000306b 0x306b # word not decoded by objdump; NOTE(review): presumably the Vortex join matching the split -- confirm
|
|
80000db8: fe442783 lw a5,-28(s0)
|
|
80000dbc: 00178793 addi a5,a5,1
|
|
80000dc0: fef42223 sw a5,-28(s0) # loop counter++
|
|
80000dc4: fe442783 lw a5,-28(s0) # --- loop condition ---
|
|
80000dc8: fec42703 lw a4,-20(s0)
|
|
80000dcc: f2e7eee3 bltu a5,a4,80000d08 <_vx_mat_add+0x8c> # repeat while counter < count (unsigned)
|
|
80000dd0: 00000013 nop
|
|
80000dd4: 04c12083 lw ra,76(sp) # restore ra/s0 and release the frame
|
|
80000dd8: 04812403 lw s0,72(sp)
|
|
80000ddc: 05010113 addi sp,sp,80
|
|
80000de0: 00008067 ret
|
|
|
|
# vx_mat_sub: launcher for the _vx_mat_sub worker (0x80000f1c).
# Same instruction sequence as vx_mat_add apart from the worker address; it uses
# the same argument block at 0x81002970.
#   a0 -> block+0, a1 -> block+4   (read as word arrays by _vx_mat_sub)
#   a2 -> block+8                  (written as a word array by _vx_mat_sub)
#   a3 -> block+16, also the first argument of vx_spawnWarps
#   a4 -> block+12, divided by the vx_available_threads result below
# Stack slots: -20(s0) iterations per thread, -24(s0) available threads,
#              -28(s0) available warps, -36..-52(s0) spilled a0..a4.
80000de4 <vx_mat_sub>:
|
|
80000de4: fc010113 addi sp,sp,-64 # allocate a 64-byte frame
|
|
80000de8: 02112e23 sw ra,60(sp)
|
|
80000dec: 02812c23 sw s0,56(sp)
|
|
80000df0: 04010413 addi s0,sp,64 # s0 = frame pointer (sp on entry)
|
|
80000df4: fca42e23 sw a0,-36(s0) # spill a0..a4 to the frame
|
|
80000df8: fcb42c23 sw a1,-40(s0)
|
|
80000dfc: fcc42a23 sw a2,-44(s0)
|
|
80000e00: fcd42823 sw a3,-48(s0)
|
|
80000e04: fce42623 sw a4,-52(s0)
|
|
80000e08: 810037b7 lui a5,0x81003
|
|
80000e0c: fdc42703 lw a4,-36(s0)
|
|
80000e10: 96e7a823 sw a4,-1680(a5) # 81002970 <main_sp+0xffffcfb4> -- block+0 = a0
|
|
80000e14: 810037b7 lui a5,0x81003
|
|
80000e18: 97078793 addi a5,a5,-1680 # 81002970 <main_sp+0xffffcfb4>
|
|
80000e1c: fd842703 lw a4,-40(s0)
|
|
80000e20: 00e7a223 sw a4,4(a5) # block+4 = a1
|
|
80000e24: 810037b7 lui a5,0x81003
|
|
80000e28: 97078793 addi a5,a5,-1680 # 81002970 <main_sp+0xffffcfb4>
|
|
80000e2c: fd442703 lw a4,-44(s0)
|
|
80000e30: 00e7a423 sw a4,8(a5) # block+8 = a2
|
|
80000e34: 810037b7 lui a5,0x81003
|
|
80000e38: 97078793 addi a5,a5,-1680 # 81002970 <main_sp+0xffffcfb4>
|
|
80000e3c: fcc42703 lw a4,-52(s0)
|
|
80000e40: 00e7a623 sw a4,12(a5) # block+12 = a4
|
|
80000e44: 810037b7 lui a5,0x81003
|
|
80000e48: 97078793 addi a5,a5,-1680 # 81002970 <main_sp+0xffffcfb4>
|
|
80000e4c: fd042703 lw a4,-48(s0)
|
|
80000e50: 00e7a823 sw a4,16(a5) # block+16 = a3
|
|
80000e54: b70ff0ef jal ra,800001c4 <vx_available_threads>
|
|
80000e58: fea42423 sw a0,-24(s0) # -24(s0) = available threads
|
|
80000e5c: fcc42703 lw a4,-52(s0)
|
|
80000e60: fe842783 lw a5,-24(s0)
|
|
80000e64: 02f757b3 divu a5,a4,a5 # a4 / threads (unsigned); no zero check on the divisor is visible here
|
|
80000e68: fef42623 sw a5,-20(s0) # -20(s0) = quotient
|
|
80000e6c: fcc42703 lw a4,-52(s0)
|
|
80000e70: fe842783 lw a5,-24(s0)
|
|
80000e74: 02f777b3 remu a5,a4,a5
|
|
80000e78: 00078863 beqz a5,80000e88 <vx_mat_sub+0xa4> # exact division: keep the quotient
|
|
80000e7c: fec42783 lw a5,-20(s0)
|
|
80000e80: 00178793 addi a5,a5,1 # non-zero remainder: round the quotient up
|
|
80000e84: fef42623 sw a5,-20(s0)
|
|
80000e88: 810037b7 lui a5,0x81003
|
|
80000e8c: 97078793 addi a5,a5,-1680 # 81002970 <main_sp+0xffffcfb4>
|
|
80000e90: fec42703 lw a4,-20(s0)
|
|
80000e94: 00e7aa23 sw a4,20(a5) # block+20 = iterations per thread
|
|
80000e98: fcc42703 lw a4,-52(s0)
|
|
80000e9c: fe842783 lw a5,-24(s0)
|
|
80000ea0: 02f76263 bltu a4,a5,80000ec4 <vx_mat_sub+0xe0> # a4 < threads: spawn with a1 = a4 instead
|
|
80000ea4: 810037b7 lui a5,0x81003
|
|
80000ea8: 97078693 addi a3,a5,-1680 # 81002970 <main_sp+0xffffcfb4> -- a3 = &block
|
|
80000eac: 800017b7 lui a5,0x80001
|
|
80000eb0: f1c78613 addi a2,a5,-228 # 80000f1c <main_sp+0xfeffb560> -- a2 = 0x80000f1c, the address labelled _vx_mat_sub
|
|
80000eb4: fe842583 lw a1,-24(s0) # a1 = available threads
|
|
80000eb8: fd042503 lw a0,-48(s0) # a0 = original a3
|
|
80000ebc: d68ff0ef jal ra,80000424 <vx_spawnWarps>
|
|
80000ec0: 0200006f j 80000ee0 <vx_mat_sub+0xfc>
|
|
80000ec4: 810037b7 lui a5,0x81003
|
|
80000ec8: 97078693 addi a3,a5,-1680 # 81002970 <main_sp+0xffffcfb4> -- a3 = &block
|
|
80000ecc: 800017b7 lui a5,0x80001
|
|
80000ed0: f1c78613 addi a2,a5,-228 # 80000f1c <main_sp+0xfeffb560> -- a2 = 0x80000f1c, the address labelled _vx_mat_sub
|
|
80000ed4: fcc42583 lw a1,-52(s0) # a1 = original a4
|
|
80000ed8: fd042503 lw a0,-48(s0) # a0 = original a3
|
|
80000edc: d48ff0ef jal ra,80000424 <vx_spawnWarps>
|
|
80000ee0: adcff0ef jal ra,800001bc <vx_available_warps>
|
|
80000ee4: fea42223 sw a0,-28(s0) # -28(s0) = available warps
|
|
80000ee8: fd042703 lw a4,-48(s0)
|
|
80000eec: fe442783 lw a5,-28(s0)
|
|
80000ef0: 00e7f863 bgeu a5,a4,80000f00 <vx_mat_sub+0x11c> # warps >= a3: wait on a3
|
|
80000ef4: fe442503 lw a0,-28(s0) # otherwise wait on the available-warp count
|
|
80000ef8: e18ff0ef jal ra,80000510 <vx_wait_for_warps>
|
|
80000efc: 00c0006f j 80000f08 <vx_mat_sub+0x124>
|
|
80000f00: fd042503 lw a0,-48(s0)
|
|
80000f04: e0cff0ef jal ra,80000510 <vx_wait_for_warps>
|
|
80000f08: 00000013 nop
|
|
80000f0c: 03c12083 lw ra,60(sp) # restore ra/s0 and release the frame
|
|
80000f10: 03812403 lw s0,56(sp)
|
|
80000f14: 04010113 addi sp,sp,64
|
|
80000f18: 00008067 ret
|
|
|
|
# _vx_mat_sub: worker whose address vx_mat_sub passes to vx_spawnWarps.
# Fetches the argument block via vx_get_arg_struct and, for each iteration,
# stores src0[idx] - src1[idx] into dst[idx] (32-bit words), where
#   idx = a1 * (block+12) + pos, and pos starts at a0 * (block+20).
#   a0 -> -68(s0), a1 -> -72(s0)
#   NOTE(review): a0/a1 are presumably thread id and warp id -- confirm against vx_spawnWarps.
# Stack slots: -20 iteration count, -24 pos, -28 loop counter, -32 block pointer,
#              -36 src0, -40 src1, -44 dst, -48 block+12, -52 idx, -56/-57 bounds flags.
80000f1c <_vx_mat_sub>:
|
|
80000f1c: fb010113 addi sp,sp,-80 # allocate an 80-byte frame
|
|
80000f20: 04112623 sw ra,76(sp)
|
|
80000f24: 04812423 sw s0,72(sp)
|
|
80000f28: 05010413 addi s0,sp,80
|
|
80000f2c: faa42e23 sw a0,-68(s0)
|
|
80000f30: fab42c23 sw a1,-72(s0)
|
|
80000f34: ea8ff0ef jal ra,800005dc <vx_get_arg_struct>
|
|
80000f38: fea42023 sw a0,-32(s0) # -32(s0) = argument block pointer
|
|
80000f3c: fe042783 lw a5,-32(s0)
|
|
80000f40: 0007a783 lw a5,0(a5)
|
|
80000f44: fcf42e23 sw a5,-36(s0) # src0 = block+0
|
|
80000f48: fe042783 lw a5,-32(s0)
|
|
80000f4c: 0047a783 lw a5,4(a5)
|
|
80000f50: fcf42c23 sw a5,-40(s0) # src1 = block+4
|
|
80000f54: fe042783 lw a5,-32(s0)
|
|
80000f58: 0087a783 lw a5,8(a5)
|
|
80000f5c: fcf42a23 sw a5,-44(s0) # dst = block+8
|
|
80000f60: fe042783 lw a5,-32(s0)
|
|
80000f64: 0147a783 lw a5,20(a5)
|
|
80000f68: fef42623 sw a5,-20(s0) # iteration count = block+20
|
|
80000f6c: fec42703 lw a4,-20(s0)
|
|
80000f70: fbc42783 lw a5,-68(s0)
|
|
80000f74: 02f707b3 mul a5,a4,a5
|
|
80000f78: fef42423 sw a5,-24(s0) # pos = count * a0
|
|
80000f7c: fec42783 lw a5,-20(s0)
|
|
80000f80: 00079a63 bnez a5,80000f94 <_vx_mat_sub+0x78>
|
|
80000f84: 00100793 li a5,1 # count == 0: run one iteration
|
|
80000f88: fef42623 sw a5,-20(s0)
|
|
80000f8c: fbc42783 lw a5,-68(s0)
|
|
80000f90: fef42423 sw a5,-24(s0) # ... starting at pos = a0
|
|
80000f94: fe042783 lw a5,-32(s0)
|
|
80000f98: 00c7a783 lw a5,12(a5)
|
|
80000f9c: fcf42823 sw a5,-48(s0) # -48(s0) = block+12
|
|
80000fa0: fe042223 sw zero,-28(s0) # loop counter = 0
|
|
80000fa4: 0c00006f j 80001064 <_vx_mat_sub+0x148> # enter at the loop condition
|
|
80000fa8: fb842703 lw a4,-72(s0) # --- loop body ---
|
|
80000fac: fd042783 lw a5,-48(s0)
|
|
80000fb0: 02f70733 mul a4,a4,a5
|
|
80000fb4: fe842783 lw a5,-24(s0)
|
|
80000fb8: 00f707b3 add a5,a4,a5
|
|
80000fbc: fcf42623 sw a5,-52(s0) # idx = a1 * (block+12) + pos
|
|
80000fc0: fe842703 lw a4,-24(s0)
|
|
80000fc4: fd042783 lw a5,-48(s0)
|
|
80000fc8: 00f737b3 sltu a5,a4,a5 # 1 when pos < block+12 (unsigned)
|
|
80000fcc: 0ff7f793 andi a5,a5,255
|
|
80000fd0: fcf42423 sw a5,-56(s0)
|
|
80000fd4: fc842783 lw a5,-56(s0)
|
|
80000fd8: 0017b793 seqz a5,a5 # invert: 1 when pos >= block+12
|
|
80000fdc: fcf403a3 sb a5,-57(s0)
|
|
80000fe0: fc744783 lbu a5,-57(s0)
|
|
80000fe4: 00078f13 mv t5,a5 # t5 = out-of-range flag
|
|
80000fe8: 800017b7 lui a5,0x80001
|
|
80000fec: 05078f93 addi t6,a5,80 # 80001050 <main_sp+0xfeffb694> -- t6 = 0x80001050, the nop below
|
|
80000ff0: 000f206b 0xf206b # word not decoded by objdump; NOTE(review): presumably a Vortex split on t5 -- confirm against the Vortex ISA
|
|
80000ff4: 01ff707b 0x1ff707b # word not decoded by objdump; NOTE(review): presumably a predicated jump using t5/t6 -- confirm
|
|
80000ff8: fcc42783 lw a5,-52(s0)
|
|
80000ffc: 00279793 slli a5,a5,0x2 # idx * 4: word offset
|
|
80001000: fdc42703 lw a4,-36(s0)
|
|
80001004: 00f707b3 add a5,a4,a5
|
|
80001008: 0007a683 lw a3,0(a5) # a3 = src0[idx]
|
|
8000100c: fcc42783 lw a5,-52(s0)
|
|
80001010: 00279793 slli a5,a5,0x2
|
|
80001014: fd842703 lw a4,-40(s0)
|
|
80001018: 00f707b3 add a5,a4,a5
|
|
8000101c: 0007a703 lw a4,0(a5) # a4 = src1[idx]
|
|
80001020: fcc42783 lw a5,-52(s0)
|
|
80001024: 00279793 slli a5,a5,0x2
|
|
80001028: fd442603 lw a2,-44(s0)
|
|
8000102c: 00f607b3 add a5,a2,a5 # a5 = &dst[idx]
|
|
80001030: 40e68733 sub a4,a3,a4
|
|
80001034: 00e7a023 sw a4,0(a5) # dst[idx] = src0[idx] - src1[idx]
|
|
80001038: fe842783 lw a5,-24(s0)
|
|
8000103c: 00178793 addi a5,a5,1
|
|
80001040: fef42423 sw a5,-24(s0) # pos++
|
|
80001044: 800017b7 lui a5,0x80001
|
|
80001048: 05478e13 addi t3,a5,84 # 80001054 <main_sp+0xfeffb698> -- t3 = 0x80001054
|
|
8000104c: 000e0067 jr t3 # jump past the nop at 0x80001050
|
|
80001050: 00000013 nop # address that was loaded into t6 above
|
|
80001054: 0000306b 0x306b # word not decoded by objdump; NOTE(review): presumably the Vortex join matching the split -- confirm
|
|
80001058: fe442783 lw a5,-28(s0)
|
|
8000105c: 00178793 addi a5,a5,1
|
|
80001060: fef42223 sw a5,-28(s0) # loop counter++
|
|
80001064: fe442783 lw a5,-28(s0) # --- loop condition ---
|
|
80001068: fec42703 lw a4,-20(s0)
|
|
8000106c: f2e7eee3 bltu a5,a4,80000fa8 <_vx_mat_sub+0x8c> # repeat while counter < count (unsigned)
|
|
80001070: 00000013 nop
|
|
80001074: 04c12083 lw ra,76(sp) # restore ra/s0 and release the frame
|
|
80001078: 04812403 lw s0,72(sp)
|
|
8000107c: 05010113 addi sp,sp,80
|
|
80001080: 00008067 ret
|
|
|
|
# vx_e_mat_add: launcher for the _vx_e_mat_add worker (0x800011bc).
# Same shape as vx_mat_add, but it uses the argument block at 0x81002988.
#   a0 -> block+0   (read as a word array by _vx_e_mat_add)
#   a1 -> block+4   (dereferenced once by _vx_e_mat_add, i.e. a pointer to one word)
#   a2 -> block+8   (written as a word array by _vx_e_mat_add)
#   a3 -> block+16, also the first argument of vx_spawnWarps
#   a4 -> block+12, divided by the vx_available_threads result below
# Stack slots: -20(s0) iterations per thread, -24(s0) available threads,
#              -28(s0) available warps, -36..-52(s0) spilled a0..a4.
80001084 <vx_e_mat_add>:
|
|
80001084: fc010113 addi sp,sp,-64 # allocate a 64-byte frame
|
|
80001088: 02112e23 sw ra,60(sp)
|
|
8000108c: 02812c23 sw s0,56(sp)
|
|
80001090: 04010413 addi s0,sp,64 # s0 = frame pointer (sp on entry)
|
|
80001094: fca42e23 sw a0,-36(s0) # spill a0..a4 to the frame
|
|
80001098: fcb42c23 sw a1,-40(s0)
|
|
8000109c: fcc42a23 sw a2,-44(s0)
|
|
800010a0: fcd42823 sw a3,-48(s0)
|
|
800010a4: fce42623 sw a4,-52(s0)
|
|
800010a8: 810037b7 lui a5,0x81003
|
|
800010ac: fdc42703 lw a4,-36(s0)
|
|
800010b0: 98e7a423 sw a4,-1656(a5) # 81002988 <main_sp+0xffffcfcc> -- block+0 = a0
|
|
800010b4: 810037b7 lui a5,0x81003
|
|
800010b8: 98878793 addi a5,a5,-1656 # 81002988 <main_sp+0xffffcfcc>
|
|
800010bc: fd842703 lw a4,-40(s0)
|
|
800010c0: 00e7a223 sw a4,4(a5) # block+4 = a1
|
|
800010c4: 810037b7 lui a5,0x81003
|
|
800010c8: 98878793 addi a5,a5,-1656 # 81002988 <main_sp+0xffffcfcc>
|
|
800010cc: fd442703 lw a4,-44(s0)
|
|
800010d0: 00e7a423 sw a4,8(a5) # block+8 = a2
|
|
800010d4: 810037b7 lui a5,0x81003
|
|
800010d8: 98878793 addi a5,a5,-1656 # 81002988 <main_sp+0xffffcfcc>
|
|
800010dc: fcc42703 lw a4,-52(s0)
|
|
800010e0: 00e7a623 sw a4,12(a5) # block+12 = a4
|
|
800010e4: 810037b7 lui a5,0x81003
|
|
800010e8: 98878793 addi a5,a5,-1656 # 81002988 <main_sp+0xffffcfcc>
|
|
800010ec: fd042703 lw a4,-48(s0)
|
|
800010f0: 00e7a823 sw a4,16(a5) # block+16 = a3
|
|
800010f4: 8d0ff0ef jal ra,800001c4 <vx_available_threads>
|
|
800010f8: fea42423 sw a0,-24(s0) # -24(s0) = available threads
|
|
800010fc: fcc42703 lw a4,-52(s0)
|
|
80001100: fe842783 lw a5,-24(s0)
|
|
80001104: 02f757b3 divu a5,a4,a5 # a4 / threads (unsigned); no zero check on the divisor is visible here
|
|
80001108: fef42623 sw a5,-20(s0) # -20(s0) = quotient
|
|
8000110c: fcc42703 lw a4,-52(s0)
|
|
80001110: fe842783 lw a5,-24(s0)
|
|
80001114: 02f777b3 remu a5,a4,a5
|
|
80001118: 00078863 beqz a5,80001128 <vx_e_mat_add+0xa4> # exact division: keep the quotient
|
|
8000111c: fec42783 lw a5,-20(s0)
|
|
80001120: 00178793 addi a5,a5,1 # non-zero remainder: round the quotient up
|
|
80001124: fef42623 sw a5,-20(s0)
|
|
80001128: 810037b7 lui a5,0x81003
|
|
8000112c: 98878793 addi a5,a5,-1656 # 81002988 <main_sp+0xffffcfcc>
|
|
80001130: fec42703 lw a4,-20(s0)
|
|
80001134: 00e7aa23 sw a4,20(a5) # block+20 = iterations per thread
|
|
80001138: fcc42703 lw a4,-52(s0)
|
|
8000113c: fe842783 lw a5,-24(s0)
|
|
80001140: 02f76263 bltu a4,a5,80001164 <vx_e_mat_add+0xe0> # a4 < threads: spawn with a1 = a4 instead
|
|
80001144: 810037b7 lui a5,0x81003
|
|
80001148: 98878693 addi a3,a5,-1656 # 81002988 <main_sp+0xffffcfcc> -- a3 = &block
|
|
8000114c: 800017b7 lui a5,0x80001
|
|
80001150: 1bc78613 addi a2,a5,444 # 800011bc <main_sp+0xfeffb800> -- a2 = 0x800011bc, the address labelled _vx_e_mat_add
|
|
80001154: fe842583 lw a1,-24(s0) # a1 = available threads
|
|
80001158: fd042503 lw a0,-48(s0) # a0 = original a3
|
|
8000115c: ac8ff0ef jal ra,80000424 <vx_spawnWarps>
|
|
80001160: 0200006f j 80001180 <vx_e_mat_add+0xfc>
|
|
80001164: 810037b7 lui a5,0x81003
|
|
80001168: 98878693 addi a3,a5,-1656 # 81002988 <main_sp+0xffffcfcc> -- a3 = &block
|
|
8000116c: 800017b7 lui a5,0x80001
|
|
80001170: 1bc78613 addi a2,a5,444 # 800011bc <main_sp+0xfeffb800> -- a2 = 0x800011bc, the address labelled _vx_e_mat_add
|
|
80001174: fcc42583 lw a1,-52(s0) # a1 = original a4
|
|
80001178: fd042503 lw a0,-48(s0) # a0 = original a3
|
|
8000117c: aa8ff0ef jal ra,80000424 <vx_spawnWarps>
|
|
80001180: 83cff0ef jal ra,800001bc <vx_available_warps>
|
|
80001184: fea42223 sw a0,-28(s0) # -28(s0) = available warps
|
|
80001188: fd042703 lw a4,-48(s0)
|
|
8000118c: fe442783 lw a5,-28(s0)
|
|
80001190: 00e7f863 bgeu a5,a4,800011a0 <vx_e_mat_add+0x11c> # warps >= a3: wait on a3
|
|
80001194: fe442503 lw a0,-28(s0) # otherwise wait on the available-warp count
|
|
80001198: b78ff0ef jal ra,80000510 <vx_wait_for_warps>
|
|
8000119c: 00c0006f j 800011a8 <vx_e_mat_add+0x124>
|
|
800011a0: fd042503 lw a0,-48(s0)
|
|
800011a4: b6cff0ef jal ra,80000510 <vx_wait_for_warps>
|
|
800011a8: 00000013 nop
|
|
800011ac: 03c12083 lw ra,60(sp) # restore ra/s0 and release the frame
|
|
800011b0: 03812403 lw s0,56(sp)
|
|
800011b4: 04010113 addi sp,sp,64
|
|
800011b8: 00008067 ret
|
|
|
|
# _vx_e_mat_add: worker whose address vx_e_mat_add passes to vx_spawnWarps.
# Fetches the argument block via vx_get_arg_struct, loads one scalar word through
# the pointer at block+4, and for each iteration stores src[idx] + scalar into
# dst[idx] (32-bit words), where
#   idx = a1 * (block+12) + pos, and pos starts at a0 * (block+20).
#   a0 -> -68(s0), a1 -> -72(s0)
#   NOTE(review): a0/a1 are presumably thread id and warp id -- confirm against vx_spawnWarps.
# Stack slots: -20 iteration count, -24 pos, -28 loop counter, -32 block pointer,
#              -36 src, -40 scalar, -44 dst, -48 block+12, -52 idx, -56/-57 bounds flags.
800011bc <_vx_e_mat_add>:
|
|
800011bc: fb010113 addi sp,sp,-80 # allocate an 80-byte frame
|
|
800011c0: 04112623 sw ra,76(sp)
|
|
800011c4: 04812423 sw s0,72(sp)
|
|
800011c8: 05010413 addi s0,sp,80
|
|
800011cc: faa42e23 sw a0,-68(s0)
|
|
800011d0: fab42c23 sw a1,-72(s0)
|
|
800011d4: c08ff0ef jal ra,800005dc <vx_get_arg_struct>
|
|
800011d8: fea42023 sw a0,-32(s0) # -32(s0) = argument block pointer
|
|
800011dc: fe042783 lw a5,-32(s0)
|
|
800011e0: 0007a783 lw a5,0(a5)
|
|
800011e4: fcf42e23 sw a5,-36(s0) # src = block+0
|
|
800011e8: fe042783 lw a5,-32(s0)
|
|
800011ec: 0047a783 lw a5,4(a5) # a5 = pointer stored at block+4
|
|
800011f0: 0007a783 lw a5,0(a5) # dereference it once
|
|
800011f4: fcf42c23 sw a5,-40(s0) # scalar = *(block+4)
|
|
800011f8: fe042783 lw a5,-32(s0)
|
|
800011fc: 0087a783 lw a5,8(a5)
|
|
80001200: fcf42a23 sw a5,-44(s0) # dst = block+8
|
|
80001204: fe042783 lw a5,-32(s0)
|
|
80001208: 0147a783 lw a5,20(a5)
|
|
8000120c: fef42623 sw a5,-20(s0) # iteration count = block+20
|
|
80001210: fec42703 lw a4,-20(s0)
|
|
80001214: fbc42783 lw a5,-68(s0)
|
|
80001218: 02f707b3 mul a5,a4,a5
|
|
8000121c: fef42423 sw a5,-24(s0) # pos = count * a0
|
|
80001220: fec42783 lw a5,-20(s0)
|
|
80001224: 00079a63 bnez a5,80001238 <_vx_e_mat_add+0x7c>
|
|
80001228: 00100793 li a5,1 # count == 0: run one iteration
|
|
8000122c: fef42623 sw a5,-20(s0)
|
|
80001230: fbc42783 lw a5,-68(s0)
|
|
80001234: fef42423 sw a5,-24(s0) # ... starting at pos = a0
|
|
80001238: fe042783 lw a5,-32(s0)
|
|
8000123c: 00c7a783 lw a5,12(a5)
|
|
80001240: fcf42823 sw a5,-48(s0) # -48(s0) = block+12
|
|
80001244: fe042223 sw zero,-28(s0) # loop counter = 0
|
|
80001248: 0b00006f j 800012f8 <_vx_e_mat_add+0x13c> # enter at the loop condition
|
|
8000124c: fb842703 lw a4,-72(s0) # --- loop body ---
|
|
80001250: fd042783 lw a5,-48(s0)
|
|
80001254: 02f70733 mul a4,a4,a5
|
|
80001258: fe842783 lw a5,-24(s0)
|
|
8000125c: 00f707b3 add a5,a4,a5
|
|
80001260: fcf42623 sw a5,-52(s0) # idx = a1 * (block+12) + pos
|
|
80001264: fe842703 lw a4,-24(s0)
|
|
80001268: fd042783 lw a5,-48(s0)
|
|
8000126c: 00f737b3 sltu a5,a4,a5 # 1 when pos < block+12 (unsigned)
|
|
80001270: 0ff7f793 andi a5,a5,255
|
|
80001274: fcf42423 sw a5,-56(s0)
|
|
80001278: fc842783 lw a5,-56(s0)
|
|
8000127c: 0017b793 seqz a5,a5 # invert: 1 when pos >= block+12
|
|
80001280: fcf403a3 sb a5,-57(s0)
|
|
80001284: fc744783 lbu a5,-57(s0)
|
|
80001288: 00078f13 mv t5,a5 # t5 = out-of-range flag
|
|
8000128c: 800017b7 lui a5,0x80001
|
|
80001290: 2e478f93 addi t6,a5,740 # 800012e4 <main_sp+0xfeffb928> -- t6 = 0x800012e4, the nop below
|
|
80001294: 000f206b 0xf206b # word not decoded by objdump; NOTE(review): presumably a Vortex split on t5 -- confirm against the Vortex ISA
|
|
80001298: 01ff707b 0x1ff707b # word not decoded by objdump; NOTE(review): presumably a predicated jump using t5/t6 -- confirm
|
|
8000129c: fcc42783 lw a5,-52(s0)
|
|
800012a0: 00279793 slli a5,a5,0x2 # idx * 4: word offset
|
|
800012a4: fdc42703 lw a4,-36(s0)
|
|
800012a8: 00f707b3 add a5,a4,a5
|
|
800012ac: 0007a683 lw a3,0(a5) # a3 = src[idx]
|
|
800012b0: fcc42783 lw a5,-52(s0)
|
|
800012b4: 00279793 slli a5,a5,0x2
|
|
800012b8: fd442703 lw a4,-44(s0)
|
|
800012bc: 00f707b3 add a5,a4,a5 # a5 = &dst[idx]
|
|
800012c0: fd842703 lw a4,-40(s0) # a4 = scalar
|
|
800012c4: 00e68733 add a4,a3,a4
|
|
800012c8: 00e7a023 sw a4,0(a5) # dst[idx] = src[idx] + scalar
|
|
800012cc: fe842783 lw a5,-24(s0)
|
|
800012d0: 00178793 addi a5,a5,1
|
|
800012d4: fef42423 sw a5,-24(s0) # pos++
|
|
800012d8: 800017b7 lui a5,0x80001
|
|
800012dc: 2e878e13 addi t3,a5,744 # 800012e8 <main_sp+0xfeffb92c> -- t3 = 0x800012e8
|
|
800012e0: 000e0067 jr t3 # jump past the nop at 0x800012e4
|
|
800012e4: 00000013 nop # address that was loaded into t6 above
|
|
800012e8: 0000306b 0x306b # word not decoded by objdump; NOTE(review): presumably the Vortex join matching the split -- confirm
|
|
800012ec: fe442783 lw a5,-28(s0)
|
|
800012f0: 00178793 addi a5,a5,1
|
|
800012f4: fef42223 sw a5,-28(s0) # loop counter++
|
|
800012f8: fe442783 lw a5,-28(s0) # --- loop condition ---
|
|
800012fc: fec42703 lw a4,-20(s0)
|
|
80001300: f4e7e6e3 bltu a5,a4,8000124c <_vx_e_mat_add+0x90> # repeat while counter < count (unsigned)
|
|
80001304: 00000013 nop
|
|
80001308: 04c12083 lw ra,76(sp) # restore ra/s0 and release the frame
|
|
8000130c: 04812403 lw s0,72(sp)
|
|
80001310: 05010113 addi sp,sp,80
|
|
80001314: 00008067 ret
|
|
|
|
# vx_e_mat_mult: launcher for the _vx_e_mat_mult worker (0x80001450).
# Same shape as vx_e_mat_add and uses the same argument block at 0x81002988.
#   a0 -> block+0   (read as a word array by _vx_e_mat_mult)
#   a1 -> block+4   (dereferenced once by _vx_e_mat_mult, i.e. a pointer to one word)
#   a2 -> block+8   (written as a word array by _vx_e_mat_mult)
#   a3 -> block+16, also the first argument of vx_spawnWarps
#   a4 -> block+12, divided by the vx_available_threads result below
# Stack slots: -20(s0) iterations per thread, -24(s0) available threads,
#              -28(s0) available warps, -36..-52(s0) spilled a0..a4.
80001318 <vx_e_mat_mult>:
|
|
80001318: fc010113 addi sp,sp,-64 # allocate a 64-byte frame
|
|
8000131c: 02112e23 sw ra,60(sp)
|
|
80001320: 02812c23 sw s0,56(sp)
|
|
80001324: 04010413 addi s0,sp,64 # s0 = frame pointer (sp on entry)
|
|
80001328: fca42e23 sw a0,-36(s0) # spill a0..a4 to the frame
|
|
8000132c: fcb42c23 sw a1,-40(s0)
|
|
80001330: fcc42a23 sw a2,-44(s0)
|
|
80001334: fcd42823 sw a3,-48(s0)
|
|
80001338: fce42623 sw a4,-52(s0)
|
|
8000133c: 810037b7 lui a5,0x81003
|
|
80001340: fdc42703 lw a4,-36(s0)
|
|
80001344: 98e7a423 sw a4,-1656(a5) # 81002988 <main_sp+0xffffcfcc> -- block+0 = a0
|
|
80001348: 810037b7 lui a5,0x81003
|
|
8000134c: 98878793 addi a5,a5,-1656 # 81002988 <main_sp+0xffffcfcc>
|
|
80001350: fd842703 lw a4,-40(s0)
|
|
80001354: 00e7a223 sw a4,4(a5) # block+4 = a1
|
|
80001358: 810037b7 lui a5,0x81003
|
|
8000135c: 98878793 addi a5,a5,-1656 # 81002988 <main_sp+0xffffcfcc>
|
|
80001360: fd442703 lw a4,-44(s0)
|
|
80001364: 00e7a423 sw a4,8(a5) # block+8 = a2
|
|
80001368: 810037b7 lui a5,0x81003
|
|
8000136c: 98878793 addi a5,a5,-1656 # 81002988 <main_sp+0xffffcfcc>
|
|
80001370: fcc42703 lw a4,-52(s0)
|
|
80001374: 00e7a623 sw a4,12(a5) # block+12 = a4
|
|
80001378: 810037b7 lui a5,0x81003
|
|
8000137c: 98878793 addi a5,a5,-1656 # 81002988 <main_sp+0xffffcfcc>
|
|
80001380: fd042703 lw a4,-48(s0)
|
|
80001384: 00e7a823 sw a4,16(a5) # block+16 = a3
|
|
80001388: e3dfe0ef jal ra,800001c4 <vx_available_threads>
|
|
8000138c: fea42423 sw a0,-24(s0) # -24(s0) = available threads
|
|
80001390: fcc42703 lw a4,-52(s0)
|
|
80001394: fe842783 lw a5,-24(s0)
|
|
80001398: 02f757b3 divu a5,a4,a5 # a4 / threads (unsigned); no zero check on the divisor is visible here
|
|
8000139c: fef42623 sw a5,-20(s0) # -20(s0) = quotient
|
|
800013a0: fcc42703 lw a4,-52(s0)
|
|
800013a4: fe842783 lw a5,-24(s0)
|
|
800013a8: 02f777b3 remu a5,a4,a5
|
|
800013ac: 00078863 beqz a5,800013bc <vx_e_mat_mult+0xa4> # exact division: keep the quotient
|
|
800013b0: fec42783 lw a5,-20(s0)
|
|
800013b4: 00178793 addi a5,a5,1 # non-zero remainder: round the quotient up
|
|
800013b8: fef42623 sw a5,-20(s0)
|
|
800013bc: 810037b7 lui a5,0x81003
|
|
800013c0: 98878793 addi a5,a5,-1656 # 81002988 <main_sp+0xffffcfcc>
|
|
800013c4: fec42703 lw a4,-20(s0)
|
|
800013c8: 00e7aa23 sw a4,20(a5) # block+20 = iterations per thread
|
|
800013cc: fcc42703 lw a4,-52(s0)
|
|
800013d0: fe842783 lw a5,-24(s0)
|
|
800013d4: 02f76263 bltu a4,a5,800013f8 <vx_e_mat_mult+0xe0> # a4 < threads: spawn with a1 = a4 instead
|
|
800013d8: 810037b7 lui a5,0x81003
|
|
800013dc: 98878693 addi a3,a5,-1656 # 81002988 <main_sp+0xffffcfcc> -- a3 = &block
|
|
800013e0: 800017b7 lui a5,0x80001
|
|
800013e4: 45078613 addi a2,a5,1104 # 80001450 <main_sp+0xfeffba94> -- a2 = 0x80001450, the address labelled _vx_e_mat_mult
|
|
800013e8: fe842583 lw a1,-24(s0) # a1 = available threads
|
|
800013ec: fd042503 lw a0,-48(s0) # a0 = original a3
|
|
800013f0: 834ff0ef jal ra,80000424 <vx_spawnWarps>
|
|
800013f4: 0200006f j 80001414 <vx_e_mat_mult+0xfc>
|
|
800013f8: 810037b7 lui a5,0x81003
|
|
800013fc: 98878693 addi a3,a5,-1656 # 81002988 <main_sp+0xffffcfcc> -- a3 = &block
|
|
80001400: 800017b7 lui a5,0x80001
|
|
80001404: 45078613 addi a2,a5,1104 # 80001450 <main_sp+0xfeffba94> -- a2 = 0x80001450, the address labelled _vx_e_mat_mult
|
|
80001408: fcc42583 lw a1,-52(s0) # a1 = original a4
|
|
8000140c: fd042503 lw a0,-48(s0) # a0 = original a3
|
|
80001410: 814ff0ef jal ra,80000424 <vx_spawnWarps>
|
|
80001414: da9fe0ef jal ra,800001bc <vx_available_warps>
|
|
80001418: fea42223 sw a0,-28(s0) # -28(s0) = available warps
|
|
8000141c: fd042703 lw a4,-48(s0)
|
|
80001420: fe442783 lw a5,-28(s0)
|
|
80001424: 00e7f863 bgeu a5,a4,80001434 <vx_e_mat_mult+0x11c> # warps >= a3: wait on a3
|
|
80001428: fe442503 lw a0,-28(s0) # otherwise wait on the available-warp count
|
|
8000142c: 8e4ff0ef jal ra,80000510 <vx_wait_for_warps>
|
|
80001430: 00c0006f j 8000143c <vx_e_mat_mult+0x124>
|
|
80001434: fd042503 lw a0,-48(s0)
|
|
80001438: 8d8ff0ef jal ra,80000510 <vx_wait_for_warps>
|
|
8000143c: 00000013 nop
|
|
80001440: 03c12083 lw ra,60(sp) # restore ra/s0 and release the frame
|
|
80001444: 03812403 lw s0,56(sp)
|
|
80001448: 04010113 addi sp,sp,64
|
|
8000144c: 00008067 ret
|
|
|
|
# _vx_e_mat_mult: worker whose address vx_e_mat_mult passes to vx_spawnWarps.
# Fetches the argument block via vx_get_arg_struct, loads one scalar word through
# the pointer at block+4, and for each iteration stores src[idx] * scalar into
# dst[idx] (32-bit words), where
#   idx = a1 * (block+12) + pos, and pos starts at a0 * (block+20).
#   a0 -> -68(s0), a1 -> -72(s0)
#   NOTE(review): a0/a1 are presumably thread id and warp id -- confirm against vx_spawnWarps.
# Stack slots: -20 iteration count, -24 pos, -28 loop counter, -32 block pointer,
#              -36 src, -40 scalar, -44 dst, -48 block+12, -52 idx, -56/-57 bounds flags.
80001450 <_vx_e_mat_mult>:
|
|
80001450: fb010113 addi sp,sp,-80 # allocate an 80-byte frame
|
|
80001454: 04112623 sw ra,76(sp)
|
|
80001458: 04812423 sw s0,72(sp)
|
|
8000145c: 05010413 addi s0,sp,80
|
|
80001460: faa42e23 sw a0,-68(s0)
|
|
80001464: fab42c23 sw a1,-72(s0)
|
|
80001468: 974ff0ef jal ra,800005dc <vx_get_arg_struct>
|
|
8000146c: fea42023 sw a0,-32(s0) # -32(s0) = argument block pointer
|
|
80001470: fe042783 lw a5,-32(s0)
|
|
80001474: 0007a783 lw a5,0(a5)
|
|
80001478: fcf42e23 sw a5,-36(s0) # src = block+0
|
|
8000147c: fe042783 lw a5,-32(s0)
|
|
80001480: 0047a783 lw a5,4(a5) # a5 = pointer stored at block+4
|
|
80001484: 0007a783 lw a5,0(a5) # dereference it once
|
|
80001488: fcf42c23 sw a5,-40(s0) # scalar = *(block+4)
|
|
8000148c: fe042783 lw a5,-32(s0)
|
|
80001490: 0087a783 lw a5,8(a5)
|
|
80001494: fcf42a23 sw a5,-44(s0) # dst = block+8
|
|
80001498: fe042783 lw a5,-32(s0)
|
|
8000149c: 0147a783 lw a5,20(a5)
|
|
800014a0: fef42623 sw a5,-20(s0) # iteration count = block+20
|
|
800014a4: fec42703 lw a4,-20(s0)
|
|
800014a8: fbc42783 lw a5,-68(s0)
|
|
800014ac: 02f707b3 mul a5,a4,a5
|
|
800014b0: fef42423 sw a5,-24(s0) # pos = count * a0
|
|
800014b4: fec42783 lw a5,-20(s0)
|
|
800014b8: 00079a63 bnez a5,800014cc <_vx_e_mat_mult+0x7c>
|
|
800014bc: 00100793 li a5,1 # count == 0: run one iteration
|
|
800014c0: fef42623 sw a5,-20(s0)
|
|
800014c4: fbc42783 lw a5,-68(s0)
|
|
800014c8: fef42423 sw a5,-24(s0) # ... starting at pos = a0
|
|
800014cc: fe042783 lw a5,-32(s0)
|
|
800014d0: 00c7a783 lw a5,12(a5)
|
|
800014d4: fcf42823 sw a5,-48(s0) # -48(s0) = block+12
|
|
800014d8: fe042223 sw zero,-28(s0) # loop counter = 0
|
|
800014dc: 0b00006f j 8000158c <_vx_e_mat_mult+0x13c> # enter at the loop condition
|
|
800014e0: fb842703 lw a4,-72(s0) # --- loop body ---
|
|
800014e4: fd042783 lw a5,-48(s0)
|
|
800014e8: 02f70733 mul a4,a4,a5
|
|
800014ec: fe842783 lw a5,-24(s0)
|
|
800014f0: 00f707b3 add a5,a4,a5
|
|
800014f4: fcf42623 sw a5,-52(s0) # idx = a1 * (block+12) + pos
|
|
800014f8: fe842703 lw a4,-24(s0)
|
|
800014fc: fd042783 lw a5,-48(s0)
|
|
80001500: 00f737b3 sltu a5,a4,a5 # 1 when pos < block+12 (unsigned)
|
|
80001504: 0ff7f793 andi a5,a5,255
|
|
80001508: fcf42423 sw a5,-56(s0)
|
|
8000150c: fc842783 lw a5,-56(s0)
|
|
80001510: 0017b793 seqz a5,a5 # invert: 1 when pos >= block+12
|
|
80001514: fcf403a3 sb a5,-57(s0)
|
|
80001518: fc744783 lbu a5,-57(s0)
|
|
8000151c: 00078f13 mv t5,a5 # t5 = out-of-range flag
|
|
80001520: 800017b7 lui a5,0x80001
|
|
80001524: 57878f93 addi t6,a5,1400 # 80001578 <main_sp+0xfeffbbbc> -- t6 = 0x80001578, the nop below
|
|
80001528: 000f206b 0xf206b # word not decoded by objdump; NOTE(review): presumably a Vortex split on t5 -- confirm against the Vortex ISA
|
|
8000152c: 01ff707b 0x1ff707b # word not decoded by objdump; NOTE(review): presumably a predicated jump using t5/t6 -- confirm
|
|
80001530: fcc42783 lw a5,-52(s0)
|
|
80001534: 00279793 slli a5,a5,0x2 # idx * 4: word offset
|
|
80001538: fdc42703 lw a4,-36(s0)
|
|
8000153c: 00f707b3 add a5,a4,a5
|
|
80001540: 0007a683 lw a3,0(a5) # a3 = src[idx]
|
|
80001544: fcc42783 lw a5,-52(s0)
|
|
80001548: 00279793 slli a5,a5,0x2
|
|
8000154c: fd442703 lw a4,-44(s0)
|
|
80001550: 00f707b3 add a5,a4,a5 # a5 = &dst[idx]
|
|
80001554: fd842703 lw a4,-40(s0) # a4 = scalar
|
|
80001558: 02e68733 mul a4,a3,a4
|
|
8000155c: 00e7a023 sw a4,0(a5) # dst[idx] = src[idx] * scalar
|
|
80001560: fe842783 lw a5,-24(s0)
|
|
80001564: 00178793 addi a5,a5,1
|
|
80001568: fef42423 sw a5,-24(s0) # pos++
|
|
8000156c: 800017b7 lui a5,0x80001
|
|
80001570: 57c78e13 addi t3,a5,1404 # 8000157c <main_sp+0xfeffbbc0> -- t3 = 0x8000157c
|
|
80001574: 000e0067 jr t3 # jump past the nop at 0x80001578
|
|
80001578: 00000013 nop # address that was loaded into t6 above
|
|
8000157c: 0000306b 0x306b # word not decoded by objdump; NOTE(review): presumably the Vortex join matching the split -- confirm
|
|
80001580: fe442783 lw a5,-28(s0)
|
|
80001584: 00178793 addi a5,a5,1
|
|
80001588: fef42223 sw a5,-28(s0) # loop counter++
|
|
8000158c: fe442783 lw a5,-28(s0) # --- loop condition ---
|
|
80001590: fec42703 lw a4,-20(s0)
|
|
80001594: f4e7e6e3 bltu a5,a4,800014e0 <_vx_e_mat_mult+0x90> # repeat while counter < count (unsigned)
|
|
80001598: 00000013 nop
|
|
8000159c: 04c12083 lw ra,76(sp) # restore ra/s0 and release the frame
|
|
800015a0: 04812403 lw s0,72(sp)
|
|
800015a4: 05010113 addi sp,sp,80
|
|
800015a8: 00008067 ret
|
|
|
|
# initialize_mats: fills two 256-word arrays with constants.
#   word i of the array at 0x810029a0 = 3
#   word i of the array at 0x810039a0 = 2      for i = 0..255
# Takes no arguments, makes no calls (ra is not saved) and returns nothing.
# Stack slot: -20(s0) holds the loop index i.
800015ac <initialize_mats>:
|
|
800015ac: fe010113 addi sp,sp,-32 # allocate a 32-byte frame
|
|
800015b0: 00812e23 sw s0,28(sp)
|
|
800015b4: 02010413 addi s0,sp,32
|
|
800015b8: fe042623 sw zero,-20(s0) # i = 0
|
|
800015bc: 0480006f j 80001604 <initialize_mats+0x58> # enter at the loop condition
|
|
800015c0: 810037b7 lui a5,0x81003 # --- loop body ---
|
|
800015c4: fec42703 lw a4,-20(s0)
|
|
800015c8: 00271713 slli a4,a4,0x2 # i * 4: word offset
|
|
800015cc: 9a078793 addi a5,a5,-1632 # 810029a0 <main_sp+0xffffcfe4> -- base of the first array
|
|
800015d0: 00f707b3 add a5,a4,a5
|
|
800015d4: 00300713 li a4,3
|
|
800015d8: 00e7a023 sw a4,0(a5) # first array, word i = 3
|
|
800015dc: 810047b7 lui a5,0x81004
|
|
800015e0: fec42703 lw a4,-20(s0)
|
|
800015e4: 00271713 slli a4,a4,0x2
|
|
800015e8: 9a078793 addi a5,a5,-1632 # 810039a0 <main_sp+0xffffdfe4> -- base of the second array
|
|
800015ec: 00f707b3 add a5,a4,a5
|
|
800015f0: 00200713 li a4,2
|
|
800015f4: 00e7a023 sw a4,0(a5) # second array, word i = 2
|
|
800015f8: fec42783 lw a5,-20(s0)
|
|
800015fc: 00178793 addi a5,a5,1
|
|
80001600: fef42623 sw a5,-20(s0) # i++
|
|
80001604: fec42703 lw a4,-20(s0) # --- loop condition ---
|
|
80001608: 0ff00793 li a5,255
|
|
8000160c: fae7dae3 bge a5,a4,800015c0 <initialize_mats+0x14> # repeat while i <= 255 (signed compare)
|
|
80001610: 00000013 nop
|
|
80001614: 01c12403 lw s0,28(sp) # restore s0 and release the frame
|
|
80001618: 02010113 addi sp,sp,32
|
|
8000161c: 00008067 ret
|
|
|
|
# print_matrix: prints 256 consecutive 32-bit words starting at a0.
#   a0 = base address of the words (spilled to -36(s0))
# Calls vx_print_str(0x81000110) first, then for i = 0..255 calls vx_print_hex
# on word i followed by vx_print_str(0x81000138); before every word whose index
# is a non-zero multiple of 16 it also calls vx_print_str(0x81000134). It ends
# with vx_print_str(0x8100013c).
# NOTE(review): the string contents are not visible in this listing; the three
# short strings are presumably a row break, an element separator and a trailer -- confirm.
# Stack slot: -20(s0) holds the loop index i.
80001620 <print_matrix>:
|
|
80001620: fd010113 addi sp,sp,-48 # allocate a 48-byte frame
|
|
80001624: 02112623 sw ra,44(sp)
|
|
80001628: 02812423 sw s0,40(sp)
|
|
8000162c: 03010413 addi s0,sp,48
|
|
80001630: fca42e23 sw a0,-36(s0) # keep the base address
|
|
80001634: 810007b7 lui a5,0x81000
|
|
80001638: 11078513 addi a0,a5,272 # 81000110 <main_sp+0xffffa754> -- a0 = string at 0x81000110
|
|
8000163c: 90cff0ef jal ra,80000748 <vx_print_str>
|
|
80001640: fe042623 sw zero,-20(s0) # i = 0
|
|
80001644: 0580006f j 8000169c <print_matrix+0x7c> # enter at the loop condition
|
|
80001648: fec42783 lw a5,-20(s0) # --- loop body ---
|
|
8000164c: 00078e63 beqz a5,80001668 <print_matrix+0x48> # i == 0: skip the extra string
|
|
80001650: fec42783 lw a5,-20(s0)
|
|
80001654: 00f7f793 andi a5,a5,15
|
|
80001658: 00079863 bnez a5,80001668 <print_matrix+0x48> # i not a multiple of 16: skip it too
|
|
8000165c: 810007b7 lui a5,0x81000
|
|
80001660: 13478513 addi a0,a5,308 # 81000134 <main_sp+0xffffa778> -- a0 = string at 0x81000134
|
|
80001664: 8e4ff0ef jal ra,80000748 <vx_print_str>
|
|
80001668: fec42783 lw a5,-20(s0)
|
|
8000166c: 00279793 slli a5,a5,0x2 # i * 4: word offset
|
|
80001670: fdc42703 lw a4,-36(s0)
|
|
80001674: 00f707b3 add a5,a4,a5
|
|
80001678: 0007a783 lw a5,0(a5) # load word i
|
|
8000167c: 00078513 mv a0,a5
|
|
80001680: 904ff0ef jal ra,80000784 <vx_print_hex>
|
|
80001684: 810007b7 lui a5,0x81000
|
|
80001688: 13878513 addi a0,a5,312 # 81000138 <main_sp+0xffffa77c> -- a0 = string at 0x81000138
|
|
8000168c: 8bcff0ef jal ra,80000748 <vx_print_str>
|
|
80001690: fec42783 lw a5,-20(s0)
|
|
80001694: 00178793 addi a5,a5,1
|
|
80001698: fef42623 sw a5,-20(s0) # i++
|
|
8000169c: fec42703 lw a4,-20(s0) # --- loop condition ---
|
|
800016a0: 0ff00793 li a5,255
|
|
800016a4: fae7d2e3 bge a5,a4,80001648 <print_matrix+0x28> # repeat while i <= 255 (signed compare)
|
|
800016a8: 810007b7 lui a5,0x81000
|
|
800016ac: 13c78513 addi a0,a5,316 # 8100013c <main_sp+0xffffa780> -- a0 = string at 0x8100013c
|
|
800016b0: 898ff0ef jal ra,80000748 <vx_print_str>
|
|
800016b4: 00000013 nop
|
|
800016b8: 02c12083 lw ra,44(sp) # restore ra/s0 and release the frame
|
|
800016bc: 02812403 lw s0,40(sp)
|
|
800016c0: 03010113 addi sp,sp,48
|
|
800016c4: 00008067 ret
|
|
|
|
# main: program entry called from _start.
# Calls initialize_mats, then vx_sq_mat_mult(0x810029a0, 0x810039a0, 0x810049a0, 16),
# prints the string at 0x81000160, prints the 256 words at 0x810049a0 with
# print_matrix, and returns 0 in a0.
# The first two addresses are the arrays initialize_mats fills with 3 and 2.
# NOTE(review): 0x810049a0 is presumably the product matrix and 16 the matrix
# dimension (16 * 16 = 256 words) -- confirm against vx_sq_mat_mult.
800016c8 <main>:
|
|
800016c8: ff010113 addi sp,sp,-16 # allocate a 16-byte frame
|
|
800016cc: 00112623 sw ra,12(sp)
|
|
800016d0: 00812423 sw s0,8(sp)
|
|
800016d4: 01010413 addi s0,sp,16
|
|
800016d8: ed5ff0ef jal ra,800015ac <initialize_mats>
|
|
800016dc: 01000693 li a3,16 # a3 = 16
|
|
800016e0: 810057b7 lui a5,0x81005
|
|
800016e4: 9a078613 addi a2,a5,-1632 # 810049a0 <main_sp+0xffffefe4> -- a2 = third array
|
|
800016e8: 810047b7 lui a5,0x81004
|
|
800016ec: 9a078593 addi a1,a5,-1632 # 810039a0 <main_sp+0xffffdfe4> -- a1 = array filled with 2
|
|
800016f0: 810037b7 lui a5,0x81003
|
|
800016f4: 9a078513 addi a0,a5,-1632 # 810029a0 <main_sp+0xffffcfe4> -- a0 = array filled with 3
|
|
800016f8: 998ff0ef jal ra,80000890 <vx_sq_mat_mult>
|
|
800016fc: 810007b7 lui a5,0x81000
|
|
80001700: 16078513 addi a0,a5,352 # 81000160 <main_sp+0xffffa7a4> -- a0 = string at 0x81000160
|
|
80001704: 844ff0ef jal ra,80000748 <vx_print_str>
|
|
80001708: 810057b7 lui a5,0x81005
|
|
8000170c: 9a078513 addi a0,a5,-1632 # 810049a0 <main_sp+0xffffefe4> -- a0 = third array
|
|
80001710: f11ff0ef jal ra,80001620 <print_matrix>
|
|
80001714: 00000793 li a5,0
|
|
80001718: 00078513 mv a0,a5 # return value 0
|
|
8000171c: 00c12083 lw ra,12(sp) # restore ra/s0 and release the frame
|
|
80001720: 00812403 lw s0,8(sp)
|
|
80001724: 01010113 addi sp,sp,16
|
|
80001728: 00008067 ret
|
|
|
|
Disassembly of section .rodata:
|
|
|
|
81000000 <.rodata>:
|
|
81000000: 0030 addi a2,sp,8
|
|
81000002: 0000 unimp
|
|
81000004: 0031 c.nop 12
|
|
81000006: 0000 unimp
|
|
81000008: 0032 c.slli zero,0xc
|
|
8100000a: 0000 unimp
|
|
8100000c: 00000033 add zero,zero,zero
|
|
81000010: 0034 addi a3,sp,8
|
|
81000012: 0000 unimp
|
|
81000014: 0035 c.nop 13
|
|
81000016: 0000 unimp
|
|
81000018: 0036 c.slli zero,0xd
|
|
8100001a: 0000 unimp
|
|
8100001c: 00000037 lui zero,0x0
|
|
81000020: 0038 addi a4,sp,8
|
|
81000022: 0000 unimp
|
|
81000024: 0039 c.nop 14
|
|
81000026: 0000 unimp
|
|
81000028: 0061 c.nop 24
|
|
8100002a: 0000 unimp
|
|
8100002c: 0062 c.slli zero,0x18
|
|
8100002e: 0000 unimp
|
|
81000030: 00000063 beqz zero,81000030 <main+0xffe968>
|
|
81000034: 0064 addi s1,sp,12
|
|
81000036: 0000 unimp
|
|
81000038: 0065 c.nop 25
|
|
8100003a: 0000 unimp
|
|
8100003c: 0066 c.slli zero,0x19
|
|
8100003e: 0000 unimp
|
|
81000040: 0030 addi a2,sp,8
|
|
81000042: 0000 unimp
|
|
81000044: 0031 c.nop 12
|
|
81000046: 0000 unimp
|
|
81000048: 0032 c.slli zero,0xc
|
|
8100004a: 0000 unimp
|
|
8100004c: 00000033 add zero,zero,zero
|
|
81000050: 0034 addi a3,sp,8
|
|
81000052: 0000 unimp
|
|
81000054: 0035 c.nop 13
|
|
81000056: 0000 unimp
|
|
81000058: 0036 c.slli zero,0xd
|
|
8100005a: 0000 unimp
|
|
8100005c: 00000037 lui zero,0x0
|
|
81000060: 0038 addi a4,sp,8
|
|
81000062: 0000 unimp
|
|
81000064: 0039 c.nop 14
|
|
81000066: 0000 unimp
|
|
81000068: 0061 c.nop 24
|
|
8100006a: 0000 unimp
|
|
8100006c: 0062 c.slli zero,0x18
|
|
8100006e: 0000 unimp
|
|
81000070: 00000063 beqz zero,81000070 <main+0xffe9a8>
|
|
81000074: 0064 addi s1,sp,12
|
|
81000076: 0000 unimp
|
|
81000078: 0065 c.nop 25
|
|
8100007a: 0000 unimp
|
|
8100007c: 0066 c.slli zero,0x19
|
|
8100007e: 0000 unimp
|
|
81000080: 000a c.slli zero,0x2
|
|
81000082: 0000 unimp
|
|
81000084: 0030 addi a2,sp,8
|
|
81000086: 0000 unimp
|
|
81000088: 0031 c.nop 12
|
|
8100008a: 0000 unimp
|
|
8100008c: 0032 c.slli zero,0xc
|
|
8100008e: 0000 unimp
|
|
81000090: 00000033 add zero,zero,zero
|
|
81000094: 0034 addi a3,sp,8
|
|
81000096: 0000 unimp
|
|
81000098: 0035 c.nop 13
|
|
8100009a: 0000 unimp
|
|
8100009c: 0036 c.slli zero,0xd
|
|
8100009e: 0000 unimp
|
|
810000a0: 00000037 lui zero,0x0
|
|
810000a4: 0038 addi a4,sp,8
|
|
810000a6: 0000 unimp
|
|
810000a8: 0039 c.nop 14
|
|
810000aa: 0000 unimp
|
|
810000ac: 0061 c.nop 24
|
|
810000ae: 0000 unimp
|
|
810000b0: 0062 c.slli zero,0x18
|
|
810000b2: 0000 unimp
|
|
810000b4: 00000063 beqz zero,810000b4 <main+0xffe9ec>
|
|
810000b8: 0064 addi s1,sp,12
|
|
810000ba: 0000 unimp
|
|
810000bc: 0065 c.nop 25
|
|
810000be: 0000 unimp
|
|
810000c0: 0066 c.slli zero,0x19
|
|
810000c2: 0000 unimp
|
|
810000c4: 7366664f fnmadd.d fa2,fa2,fs6,fa4,unknown
|
|
810000c8: 7465 lui s0,0xffff9
|
|
810000ca: 203a fld ft0,392(sp)
|
|
810000cc: 0000 unimp
|
|
810000ce: 0000 unimp
|
|
810000d0: 0030 addi a2,sp,8
|
|
810000d2: 0000 unimp
|
|
810000d4: 0031 c.nop 12
|
|
810000d6: 0000 unimp
|
|
810000d8: 0032 c.slli zero,0xc
|
|
810000da: 0000 unimp
|
|
810000dc: 00000033 add zero,zero,zero
|
|
810000e0: 0034 addi a3,sp,8
|
|
810000e2: 0000 unimp
|
|
810000e4: 0035 c.nop 13
|
|
810000e6: 0000 unimp
|
|
810000e8: 0036 c.slli zero,0xd
|
|
810000ea: 0000 unimp
|
|
810000ec: 00000037 lui zero,0x0
|
|
810000f0: 0038 addi a4,sp,8
|
|
810000f2: 0000 unimp
|
|
810000f4: 0039 c.nop 14
|
|
810000f6: 0000 unimp
|
|
810000f8: 0061 c.nop 24
|
|
810000fa: 0000 unimp
|
|
810000fc: 0062 c.slli zero,0x18
|
|
810000fe: 0000 unimp
|
|
81000100: 00000063 beqz zero,81000100 <main+0xffea38>
|
|
81000104: 0064 addi s1,sp,12
|
|
81000106: 0000 unimp
|
|
81000108: 0065 c.nop 25
|
|
8100010a: 0000 unimp
|
|
8100010c: 0066 c.slli zero,0x19
|
|
8100010e: 0000 unimp
|
|
81000110: 2d2d jal 8100074a <q+0x42e>
|
|
81000112: 2d2d jal 8100074c <q+0x430>
|
|
81000114: 2d2d jal 8100074e <q+0x432>
|
|
81000116: 2d2d jal 81000750 <q+0x434>
|
|
81000118: 2d2d jal 81000752 <q+0x436>
|
|
8100011a: 2d2d jal 81000754 <q+0x438>
|
|
8100011c: 2d2d jal 81000756 <q+0x43a>
|
|
8100011e: 2d2d jal 81000758 <q+0x43c>
|
|
81000120: 2d2d jal 8100075a <q+0x43e>
|
|
81000122: 2d2d jal 8100075c <q+0x440>
|
|
81000124: 2d2d jal 8100075e <q+0x442>
|
|
81000126: 2d2d jal 81000760 <q+0x444>
|
|
81000128: 2d2d jal 81000762 <q+0x446>
|
|
8100012a: 2d2d jal 81000764 <q+0x448>
|
|
8100012c: 2d2d jal 81000766 <q+0x44a>
|
|
8100012e: 0a2d addi s4,s4,11
|
|
81000130: 0000 unimp
|
|
81000132: 0000 unimp
|
|
81000134: 000a c.slli zero,0x2
|
|
81000136: 0000 unimp
|
|
81000138: 0020 addi s0,sp,8
|
|
8100013a: 0000 unimp
|
|
8100013c: 2d0a fld fs10,128(sp)
|
|
8100013e: 2d2d jal 81000778 <q+0x45c>
|
|
81000140: 2d2d jal 8100077a <q+0x45e>
|
|
81000142: 2d2d jal 8100077c <q+0x460>
|
|
81000144: 2d2d jal 8100077e <q+0x462>
|
|
81000146: 2d2d jal 81000780 <q+0x464>
|
|
81000148: 2d2d jal 81000782 <q+0x466>
|
|
8100014a: 2d2d jal 81000784 <q+0x468>
|
|
8100014c: 2d2d jal 81000786 <q+0x46a>
|
|
8100014e: 2d2d jal 81000788 <q+0x46c>
|
|
81000150: 2d2d jal 8100078a <q+0x46e>
|
|
81000152: 2d2d jal 8100078c <q+0x470>
|
|
81000154: 2d2d jal 8100078e <q+0x472>
|
|
81000156: 2d2d jal 81000790 <q+0x474>
|
|
81000158: 2d2d jal 81000792 <q+0x476>
|
|
8100015a: 2d2d jal 81000794 <q+0x478>
|
|
8100015c: 000a c.slli zero,0x2
|
|
8100015e: 0000 unimp
|
|
81000160: 0a0a slli s4,s4,0x2
|
|
81000162: 614d addi sp,sp,176
|
|
81000164: 7274 flw fa3,100(a2)
|
|
81000166: 7869 lui a6,0xffffa
|
|
81000168: 6d20 flw fs0,88(a0)
|
|
8100016a: 6c75 lui s8,0x1d
|
|
8100016c: 6974 flw fa3,84(a0)
|
|
8100016e: 6c70 flw fa2,92(s0)
|
|
81000170: 6369 lui t1,0x1a
|
|
81000172: 7461 lui s0,0xffff8
|
|
81000174: 6f69 lui t5,0x1a
|
|
81000176: 0a6e slli s4,s4,0x1b
|
|
...
|
|
|
|
Disassembly of section .data:
|
|
|
|
8100017c <hextoa>:
|
|
8100017c: 0000 unimp
|
|
8100017e: 8100 0x8100
|
|
81000180: 0004 0x4
|
|
81000182: 8100 0x8100
|
|
81000184: 0008 0x8
|
|
81000186: 8100 0x8100
|
|
81000188: 000c 0xc
|
|
8100018a: 8100 0x8100
|
|
8100018c: 0010 0x10
|
|
8100018e: 8100 0x8100
|
|
81000190: 0014 0x14
|
|
81000192: 8100 0x8100
|
|
81000194: 0018 0x18
|
|
81000196: 8100 0x8100
|
|
81000198: 001c 0x1c
|
|
8100019a: 8100 0x8100
|
|
8100019c: 0020 addi s0,sp,8
|
|
8100019e: 8100 0x8100
|
|
810001a0: 0024 addi s1,sp,8
|
|
810001a2: 8100 0x8100
|
|
810001a4: 0028 addi a0,sp,8
|
|
810001a6: 8100 0x8100
|
|
810001a8: 002c addi a1,sp,8
|
|
810001aa: 8100 0x8100
|
|
810001ac: 0030 addi a2,sp,8
|
|
810001ae: 8100 0x8100
|
|
810001b0: 0034 addi a3,sp,8
|
|
810001b2: 8100 0x8100
|
|
810001b4: 0038 addi a4,sp,8
|
|
810001b6: 8100 0x8100
|
|
810001b8: 003c addi a5,sp,8
|
|
810001ba: 8100 0x8100
|
|
|
|
810001bc <hextoa>:
|
|
810001bc: 0040 addi s0,sp,4
|
|
810001be: 8100 0x8100
|
|
810001c0: 0044 addi s1,sp,4
|
|
810001c2: 8100 0x8100
|
|
810001c4: 0048 addi a0,sp,4
|
|
810001c6: 8100 0x8100
|
|
810001c8: 004c addi a1,sp,4
|
|
810001ca: 8100 0x8100
|
|
810001cc: 0050 addi a2,sp,4
|
|
810001ce: 8100 0x8100
|
|
810001d0: 0054 addi a3,sp,4
|
|
810001d2: 8100 0x8100
|
|
810001d4: 0058 addi a4,sp,4
|
|
810001d6: 8100 0x8100
|
|
810001d8: 005c addi a5,sp,4
|
|
810001da: 8100 0x8100
|
|
810001dc: 0060 addi s0,sp,12
|
|
810001de: 8100 0x8100
|
|
810001e0: 0064 addi s1,sp,12
|
|
810001e2: 8100 0x8100
|
|
810001e4: 0068 addi a0,sp,12
|
|
810001e6: 8100 0x8100
|
|
810001e8: 006c addi a1,sp,12
|
|
810001ea: 8100 0x8100
|
|
810001ec: 0070 addi a2,sp,12
|
|
810001ee: 8100 0x8100
|
|
810001f0: 0074 addi a3,sp,12
|
|
810001f2: 8100 0x8100
|
|
810001f4: 0078 addi a4,sp,12
|
|
810001f6: 8100 0x8100
|
|
810001f8: 007c addi a5,sp,12
|
|
810001fa: 8100 0x8100
|
|
|
|
810001fc <hextoa>:
|
|
810001fc: 0084 addi s1,sp,64
|
|
810001fe: 8100 0x8100
|
|
81000200: 0088 addi a0,sp,64
|
|
81000202: 8100 0x8100
|
|
81000204: 008c addi a1,sp,64
|
|
81000206: 8100 0x8100
|
|
81000208: 0090 addi a2,sp,64
|
|
8100020a: 8100 0x8100
|
|
8100020c: 0094 addi a3,sp,64
|
|
8100020e: 8100 0x8100
|
|
81000210: 0098 addi a4,sp,64
|
|
81000212: 8100 0x8100
|
|
81000214: 009c addi a5,sp,64
|
|
81000216: 8100 0x8100
|
|
81000218: 00a0 addi s0,sp,72
|
|
8100021a: 8100 0x8100
|
|
8100021c: 00a4 addi s1,sp,72
|
|
8100021e: 8100 0x8100
|
|
81000220: 00a8 addi a0,sp,72
|
|
81000222: 8100 0x8100
|
|
81000224: 00ac addi a1,sp,72
|
|
81000226: 8100 0x8100
|
|
81000228: 00b0 addi a2,sp,72
|
|
8100022a: 8100 0x8100
|
|
8100022c: 00b4 addi a3,sp,72
|
|
8100022e: 8100 0x8100
|
|
81000230: 00b8 addi a4,sp,72
|
|
81000232: 8100 0x8100
|
|
81000234: 00bc addi a5,sp,72
|
|
81000236: 8100 0x8100
|
|
81000238: 00c0 addi s0,sp,68
|
|
8100023a: 8100 0x8100
|
|
|
|
8100023c <hextoa>:
|
|
8100023c: 00d0 addi a2,sp,68
|
|
8100023e: 8100 0x8100
|
|
81000240: 00d4 addi a3,sp,68
|
|
81000242: 8100 0x8100
|
|
81000244: 00d8 addi a4,sp,68
|
|
81000246: 8100 0x8100
|
|
81000248: 00dc addi a5,sp,68
|
|
8100024a: 8100 0x8100
|
|
8100024c: 00e0 addi s0,sp,76
|
|
8100024e: 8100 0x8100
|
|
81000250: 00e4 addi s1,sp,76
|
|
81000252: 8100 0x8100
|
|
81000254: 00e8 addi a0,sp,76
|
|
81000256: 8100 0x8100
|
|
81000258: 00ec addi a1,sp,76
|
|
8100025a: 8100 0x8100
|
|
8100025c: 00f0 addi a2,sp,76
|
|
8100025e: 8100 0x8100
|
|
81000260: 00f4 addi a3,sp,76
|
|
81000262: 8100 0x8100
|
|
81000264: 00f8 addi a4,sp,76
|
|
81000266: 8100 0x8100
|
|
81000268: 00fc addi a5,sp,76
|
|
8100026a: 8100 0x8100
|
|
8100026c: 0100 addi s0,sp,128
|
|
8100026e: 8100 0x8100
|
|
81000270: 0104 addi s1,sp,128
|
|
81000272: 8100 0x8100
|
|
81000274: 0108 addi a0,sp,128
|
|
81000276: 8100 0x8100
|
|
81000278: 010c addi a1,sp,128
|
|
8100027a: 8100 0x8100
|
|
|
|
Disassembly of section .bss:
|
|
|
|
8100027c <done>:
|
|
...
|
|
|
|
81000298 <main_sp>:
|
|
81000298: 0000 unimp
|
|
...
|
|
|
|
8100029c <context>:
|
|
...
|
|
|
|
8100031c <q>:
|
|
...
|
|
|
|
8100293c <done>:
|
|
...
|
|
|
|
81002958 <main_sp>:
|
|
81002958: 0000 unimp
|
|
...
|
|
|
|
8100295c <mat_mult_args>:
|
|
...
|
|
|
|
81002970 <mat_r_args>:
|
|
...
|
|
|
|
81002988 <mat_e_args>:
|
|
...
|
|
|
|
810029a0 <x>:
|
|
...
|
|
|
|
810039a0 <y>:
|
|
...
|
|
|
|
810049a0 <z>:
|
|
...
|
|
|
|
810059a0 <done>:
|
|
...
|
|
|
|
810059bc <main_sp>:
|
|
810059bc: 0000 unimp
|
|
...
|
|
|
|
Disassembly of section .comment:
|
|
|
|
82000000 <.comment>:
|
|
82000000: 3a434347 fmsub.d ft6,ft6,ft4,ft7,rmm
|
|
82000004: 2820 fld fs0,80(s0)
|
|
82000006: 29554e47 fmsub.s ft8,fa0,fs5,ft5,rmm
|
|
8200000a: 3820 fld fs0,112(s0)
|
|
8200000c: 322e fld ft4,232(sp)
|
|
8200000e: 302e fld ft0,232(sp)
|
|
...
|