summary | refs | log | tree | commit | diff
path: root/mpn
diff options
context:
space:
mode:
author: tege <tege@gmplib.org> 2001-12-20 09:27:34 +0100
committer: tege <tege@gmplib.org> 2001-12-20 09:27:34 +0100
commit: eddfc9bc19779094ac2d73aa2fe99c13c9241347 (patch)
tree: 9130d48572e68984af466ea742fdb9ac9aa644c2 /mpn
parent: 662808c53b441dc7f2ad72106866a052c102bf8d (diff)
download: gmp-eddfc9bc19779094ac2d73aa2fe99c13c9241347.tar.gz
Make the new code actually work...
Diffstat (limited to 'mpn')
-rw-r--r-- mpn/ia64/addmul_1.asm 12
-rw-r--r-- mpn/ia64/mul_1.asm 12
2 files changed, 20 insertions, 4 deletions
diff --git a/mpn/ia64/addmul_1.asm b/mpn/ia64/addmul_1.asm
index a0b7b2479..1807b6f3a 100644
--- a/mpn/ia64/addmul_1.asm
+++ b/mpn/ia64/addmul_1.asm
@@ -54,8 +54,14 @@ PROLOGUE(mpn_addmul_1)
mov ar.ec = 7
} { .mii cmp.ne p6, p7 = r0, r0
mov pr.rot = 1<<16
- add r32 = 0, r0 C clear "carry in"
-} ;;
+ mov r32 = 0 C clear "carry in"
+} { .mib mov r33 = 0 C clear for cmp
+ mov r34 = 0 C clear for cmp
+ nop.b 0
+} { .mib mov r35 = 0 C clear for cmp
+ mov r36 = 0 C clear for cmp
+ nop.b 0 ;;
+}
.align 32
.Loop:
{ .mfi (p16) ldf8 f32 = [r17], 8 C *0,3,6,9,12,15,18
@@ -71,6 +77,8 @@ PROLOGUE(mpn_addmul_1)
(p22) st8 [r18] = r14, 8 C 2,5,8,11,14,17,*20
br.ctop.sptk .Loop ;;
}
+ (p6) add r8 = 1, r38
+ (p7) mov r8 = r38
mov pr = r22,0xfffffffffffffffe
mov ar.lc = r2
mov ar.ec = r20
diff --git a/mpn/ia64/mul_1.asm b/mpn/ia64/mul_1.asm
index 116ec30f8..dfb980485 100644
--- a/mpn/ia64/mul_1.asm
+++ b/mpn/ia64/mul_1.asm
@@ -54,8 +54,14 @@ PROLOGUE(mpn_mul_1)
mov ar.ec = 7
} { .mii cmp.ne p6, p7 = r0, r0
mov pr.rot = 1<<16
- add r32 = 0, r0 C clear "carry in"
-} ;;
+ mov r32 = 0 C clear "carry in"
+} { .mib mov r33 = 0 C clear for cmp
+ mov r34 = 0 C clear for cmp
+ nop.b 0
+} { .mib mov r35 = 0 C clear for cmp
+ mov r36 = 0 C clear for cmp
+ nop.b 0 ;;
+}
.align 32
.Loop:
{ .mfi (p16) ldf8 f32 = [r17], 8 C *0,3,6,9,12,15,18
@@ -71,6 +77,8 @@ PROLOGUE(mpn_mul_1)
(p22) st8 [r18] = r14, 8 C 2,5,8,11,14,17,*20
br.ctop.sptk .Loop ;;
}
+ (p6) add r8 = 1, r38
+ (p7) mov r8 = r38
mov pr = r22,0xfffffffffffffffe
mov ar.lc = r2
mov ar.ec = r20