The TONS implementation

;; matrixperf -- small performance test on parallel operations.
;;
;; Builds three matrices, repeatedly multiplies two of them by the
;; third inside a counted loop, then adds the two results together
;; and returns the sum.
;;
;; Registers used:
;;   r0  matrix dimension (integer)
;;   r1  number of iterations / loop counter (integer)
;;   r2  matrix used as the right-hand operand of every multiply
;;   r3  matrix, first accumulated product
;;   r4  matrix, second accumulated product; also the return value
;;
;; Operands are written destination first (see "move r0, 100").
entry "matrixperf"
        ; Declare the types of the five registers used below.
        ; NOTE(review): presumably the types map to r0..r4 in order
        ; (two integers, then three matrices) -- this matches how the
        ; registers are used, but confirm against the language spec.
        decl  integer, integer, matrix,
              matrix, matrix
        ; Set matrix dimension
        move r0, 100
        ; Set number of iterations
        move r1, 100
        ; Initialize matrices: each one is zeroed using the dimension
        ; in r0 and then has a scalar constant added to it.
        ; NOTE(review): presumably "zero" creates an r0 x r0 matrix of
        ; zeros and "add" with a scalar applies to every element, so
        ; r2 = all 0.01, r3 = all 1, r4 = all 10 -- TODO confirm.
        ; NOTE(review): 0.01 equals 1/r0; if "mult" is a true matrix
        ; product this would keep the magnitudes of r3 and r4 constant
        ; across iterations. If so, the constant has to be changed
        ; together with the dimension -- TODO confirm.
        zero r2, r0
        add  r2, 0.01
        zero r3, r0
        add r3, 1
        zero r4, r0
        add r4, 10
        ; Run the loop, controlled by the counter in r1.
        ; NOTE(review): presumably the body repeats until r1 reaches
        ; zero and the body extends over the more deeply indented
        ; lines -- verify the exact "loop" semantics.
        loop r1
                ; The two multiplies write different registers (r3
                ; and r4) and both only read r2, so neither depends
                ; on the other's result. Presumably this is the pair
                ; of operations the test expects to run in parallel.
                mult r3, r2
                mult r4, r2
                ; Count down the remaining iterations.
                decr r1
        ; Add return values: fold r3 into r4 so that both products
        ; contribute to the single value returned.
        add r4, r3
        ; And exit, returning the combined matrix.
        return r4