# Test for mul

.org 0
# Provide program starting address to linker
.global _start

.extern mul
.extern tohex

/* newlib system calls */
.set SYSEXIT,  93
.set SYSWRITE, 64

.section .rodata

inputs:
    .word 3
    .word 5

    .word 21
    .word 3

    .word 0xFFFF
    .word 100

    .word -7
    .word 3
inputs_end:
  # llvm doesn't like this: error: expected relocatable expression
  #.set inputs_end, .-inputs
  # turns out it was right. That was calculating a length, which was
  # incorrect for how it was used for looping.

.section .bss

buf: .skip 9

.text

_start:
    li a0, '\n'
    la a1, buf
    sb a0, 8(a1)        # append newline to buf

    la s0, inputs       # init loop variables
    la s1, inputs_end
loop:
    lw a0, 0(s0)        # multiplicand
    lw a1, 4(s0)        # multiplier
    jal mul
    # TODO: Format as an actual decimal
    la a1, buf
    jal tohex

    li t0, SYSWRITE     # "write" syscall
    li a0, 1            # 1 = standard output (stdout)
    la a1, buf          # load address of output string
    li a2, 9            # length of output string
    ecall               # invoke syscall to print the string

    addi s0, s0, 8      # increment input pointer to next pair of 64-bit inputs
    bltu s0, s1, loop   # if the input address is less than inputs_end, loop

    li t0, SYSEXIT      # "exit" syscall
    la a0, 0            # Use 0 return code
    ecall               # invoke syscall to terminate the program