|
@@ -402,3 +402,64 @@ xor_alpha_prefetch_2: \n\
|
|
|
.align 4 \n\
|
|
|
2: \n\
|
|
|
ldq $0,0($17) \n\
|
|
|
+ ldq $1,0($18) \n\
|
|
|
+ ldq $2,8($17) \n\
|
|
|
+ ldq $3,8($18) \n\
|
|
|
+ \n\
|
|
|
+ ldq $4,16($17) \n\
|
|
|
+ ldq $5,16($18) \n\
|
|
|
+ ldq $6,24($17) \n\
|
|
|
+ ldq $7,24($18) \n\
|
|
|
+ \n\
|
|
|
+ ldq $19,32($17) \n\
|
|
|
+ ldq $20,32($18) \n\
|
|
|
+ ldq $21,40($17) \n\
|
|
|
+ ldq $22,40($18) \n\
|
|
|
+ \n\
|
|
|
+ ldq $23,48($17) \n\
|
|
|
+ ldq $24,48($18) \n\
|
|
|
+ ldq $25,56($17) \n\
|
|
|
+ ldq $27,56($18) \n\
|
|
|
+ \n\
|
|
|
+ ldq $31,256($17) \n\
|
|
|
+ xor $0,$1,$0 # 8 cycles from $1 load \n\
|
|
|
+ ldq $31,256($18) \n\
|
|
|
+ xor $2,$3,$2 \n\
|
|
|
+ \n\
|
|
|
+ stq $0,0($17) \n\
|
|
|
+ xor $4,$5,$4 \n\
|
|
|
+ stq $2,8($17) \n\
|
|
|
+ xor $6,$7,$6 \n\
|
|
|
+ \n\
|
|
|
+ stq $4,16($17) \n\
|
|
|
+ xor $19,$20,$19 \n\
|
|
|
+ stq $6,24($17) \n\
|
|
|
+ xor $21,$22,$21 \n\
|
|
|
+ \n\
|
|
|
+ stq $19,32($17) \n\
|
|
|
+ xor $23,$24,$23 \n\
|
|
|
+ stq $21,40($17) \n\
|
|
|
+ xor $25,$27,$25 \n\
|
|
|
+ \n\
|
|
|
+ stq $23,48($17) \n\
|
|
|
+ subq $16,1,$16 \n\
|
|
|
+ stq $25,56($17) \n\
|
|
|
+ addq $17,64,$17 \n\
|
|
|
+ \n\
|
|
|
+ addq $18,64,$18 \n\
|
|
|
+ bgt $16,2b \n\
|
|
|
+ ret \n\
|
|
|
+ .end xor_alpha_prefetch_2 \n\
|
|
|
+ \n\
|
|
|
+ .align 3 \n\
|
|
|
+ .ent xor_alpha_prefetch_3 \n\
|
|
|
+xor_alpha_prefetch_3: \n\
|
|
|
+ .prologue 0 \n\
|
|
|
+ srl $16, 6, $16 \n\
|
|
|
+ \n\
|
|
|
+ ldq $31, 0($17) \n\
|
|
|
+ ldq $31, 0($18) \n\
|
|
|
+ ldq $31, 0($19) \n\
|
|
|
+ \n\
|
|
|
+ ldq $31, 64($17) \n\
|
|
|
+ ldq $31, 64($18) \n\
|