|
|
|
@@ -452,11 +452,6 @@ |
|
|
|
|
|
|
|
MOVDDUP(4 * SIZE, A1, a1) |
|
|
|
|
|
|
|
movsd 0 * SIZE(YY), yy1 |
|
|
|
movhpd 1 * SIZE(YY), yy1 |
|
|
|
movsd 2 * SIZE(YY), yy2 |
|
|
|
movhpd 3 * SIZE(YY), yy2 |
|
|
|
|
|
|
|
movapd 8 * SIZE(XX), xtemp1 |
|
|
|
movapd 10 * SIZE(XX), xtemp2 |
|
|
|
movapd 12 * SIZE(XX), xtemp3 |
|
|
|
@@ -475,6 +470,12 @@ |
|
|
|
MOVDDUP(6 * SIZE - (4 * SIZE), A2, a2) |
|
|
|
ALIGN_3 |
|
|
|
|
|
|
|
.L12_prep: |
|
|
|
movsd 0 * SIZE(YY), yy1 |
|
|
|
movhpd 1 * SIZE(YY), yy1 |
|
|
|
movsd 2 * SIZE(YY), yy2 |
|
|
|
movhpd 3 * SIZE(YY), yy2 |
|
|
|
|
|
|
|
.L12: |
|
|
|
movapd xtemp1, xt1 |
|
|
|
mulpd a1, xt1 |
|
|
|
@@ -608,8 +609,6 @@ |
|
|
|
|
|
|
|
movlpd yy2, 6 * SIZE(YY) |
|
|
|
movhpd yy2, 7 * SIZE(YY) |
|
|
|
movsd 10 * SIZE(YY), yy2 |
|
|
|
movhpd 11 * SIZE(YY), yy2 |
|
|
|
|
|
|
|
movapd xtemp2, xt1 |
|
|
|
movapd 18 * SIZE(XX), xtemp2 |
|
|
|
@@ -621,8 +620,6 @@ |
|
|
|
|
|
|
|
movlpd yy1, 4 * SIZE(YY) |
|
|
|
movhpd yy1, 5 * SIZE(YY) |
|
|
|
movsd 8 * SIZE(YY), yy1 |
|
|
|
movhpd 9 * SIZE(YY), yy1 |
|
|
|
|
|
|
|
subq $-16 * SIZE, XX |
|
|
|
addq $ 8 * SIZE, YY |
|
|
|
@@ -630,7 +627,8 @@ |
|
|
|
addq $ 8 * SIZE, A2 |
|
|
|
|
|
|
|
decq I |
|
|
|
jg .L12 |
|
|
|
jg .L12_prep |
|
|
|
jmp .L15 |
|
|
|
ALIGN_3 |
|
|
|
|
|
|
|
.L14: |
|
|
|
@@ -641,7 +639,6 @@ |
|
|
|
jle .L16 |
|
|
|
|
|
|
|
MOVDDUP(6 * SIZE - (4 * SIZE), A2, a2) |
|
|
|
jmp .L15_pastcheck |
|
|
|
|
|
|
|
.L15: |
|
|
|
movq M, I |
|
|
|
@@ -650,6 +647,11 @@ |
|
|
|
testq $2, I |
|
|
|
jle .L16 |
|
|
|
|
|
|
|
movsd 0 * SIZE(YY), yy1 |
|
|
|
movhpd 1 * SIZE(YY), yy1 |
|
|
|
movsd 2 * SIZE(YY), yy2 |
|
|
|
movhpd 3 * SIZE(YY), yy2 |
|
|
|
|
|
|
|
.L15_pastcheck: |
|
|
|
movapd xtemp1, xt1 |
|
|
|
mulpd a1, xt1 |
|
|
|
@@ -705,8 +707,6 @@ |
|
|
|
|
|
|
|
movlpd yy2, 2 * SIZE(YY) |
|
|
|
movhpd yy2, 3 * SIZE(YY) |
|
|
|
movsd 6 * SIZE(YY), yy2 |
|
|
|
movhpd 7 * SIZE(YY), yy2 |
|
|
|
|
|
|
|
movapd xtemp2, xt1 |
|
|
|
movapd 10 * SIZE(XX), xtemp2 |
|
|
|
@@ -717,8 +717,6 @@ |
|
|
|
|
|
|
|
movlpd yy1, 0 * SIZE(YY) |
|
|
|
movhpd yy1, 1 * SIZE(YY) |
|
|
|
movsd 4 * SIZE(YY), yy1 |
|
|
|
movhpd 5 * SIZE(YY), yy1 |
|
|
|
|
|
|
|
addq $4 * SIZE, YY |
|
|
|
addq $4 * SIZE, A1 |
|
|
|
@@ -731,6 +729,9 @@ |
|
|
|
|
|
|
|
MOVDDUP(1 * SIZE, A1, a2) |
|
|
|
|
|
|
|
movsd 0 * SIZE(YY), yy1 |
|
|
|
movhpd 1 * SIZE(YY), yy1 |
|
|
|
|
|
|
|
movapd xtemp1, xt1 |
|
|
|
mulpd a1, xt1 |
|
|
|
mulpd atemp1, a1 |
|
|
|
|