  1. # r0=temp (word assembled by the lwr/lwl pair, then stored) -- NOTE(review): on real MIPS, register 0 is hardwired to zero, so r0 is presumably a placeholder name for a writable temp; confirm
  2. # r1=source ptr (unaligned)
  3. # r2=dest ptr (aligned)
  4. # r3=number of words to copy (tested only at the bottom of the loop, so a count of 0 on entry still copies one word; assumes r3 >= 1 -- TODO confirm with caller)
  5. lp:   lwr   r0, 3(r1)     # <-- this ends up having a false dependency on r0 from the previous iter
  6.       lwl   r0, 0(r1)     # second partial load into the same r0; lwr/lwl each merge into the existing register value, which is why the lwr above must wait on the old r0. NOTE(review): lwr at +3 / lwl at +0 looks like the big-endian pairing -- confirm target endianness
  7.       sw    r0, 0(r2)     # store the assembled word to the aligned destination
  8.       addiu r1, r1, 4     # advance source pointer by one word
  9.       addiu r2, r2, 4     # advance destination pointer by one word
  10.       addiu r3, r3, -1   # one fewer word remaining
  11.       bgtz  r3, lp       # loop while words remain (r3 > 0). NOTE(review): nothing is shown after the branch; if the target has branch delay slots, confirm the slot is filled (assembler reorder mode or a following instruction)
