From 877ec63b6988c3685ffbe7edd66c0d46862f5a2b Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Albin=20Ahlb=C3=A4ck?= Date: Mon, 2 Dec 2024 19:25:26 +0000 Subject: [PATCH] Fix subrsh: use sbb instead of sub for the last limb --- dev/gen_x86_aorsrsh.jl | 2 +- src/mpn_extras/test/t-aorsrsh_n.c | 2 +- .../x86_64/broadwell/aorsrsh_hard.asm | 30 +++++++++---------- 3 files changed, 17 insertions(+), 17 deletions(-) diff --git a/dev/gen_x86_aorsrsh.jl b/dev/gen_x86_aorsrsh.jl index c11655d8fc..8881a996e5 100644 --- a/dev/gen_x86_aorsrsh.jl +++ b/dev/gen_x86_aorsrsh.jl @@ -119,7 +119,7 @@ function aorsrsh(n::Int; is_add::Bool = true) mov( s3, rp(ix)) elseif ix == n - 1 mov( ap(ix), s0) - sub( s1, s0) + sbb( s1, s0) mov( s0, rp(ix)) else mov( ap(ix), s3) diff --git a/src/mpn_extras/test/t-aorsrsh_n.c b/src/mpn_extras/test/t-aorsrsh_n.c index 25d9075af9..24709f0e49 100644 --- a/src/mpn_extras/test/t-aorsrsh_n.c +++ b/src/mpn_extras/test/t-aorsrsh_n.c @@ -102,7 +102,7 @@ TEST_FUNCTION_START(flint_mpn_aorsrsh_n, state) result = (cf == cg && mpn_cmp(fp, gp, n) == 0); if (!result) TEST_FUNCTION_FAIL( - "%s:\n" + "function: %s\n" "aliasing: %s\n" "ix = %wd\n" "n = %wd\n" diff --git a/src/mpn_extras/x86_64/broadwell/aorsrsh_hard.asm b/src/mpn_extras/x86_64/broadwell/aorsrsh_hard.asm index ec24c45e30..ed6d264c06 100644 --- a/src/mpn_extras/x86_64/broadwell/aorsrsh_hard.asm +++ b/src/mpn_extras/x86_64/broadwell/aorsrsh_hard.asm @@ -1066,7 +1066,7 @@ PROLOGUE(flint_mpn_subrsh_2) sub s2, tnc mov tnc, 0*8(rp) mov 1*8(ap), s0 - sub s1, s0 + sbb s1, s0 mov s0, 1*8(rp) setc R8(sx) ret @@ -1094,7 +1094,7 @@ PROLOGUE(flint_mpn_subrsh_3) sbb s2, s3 mov s3, 1*8(rp) mov 2*8(ap), s0 - sub s1, s0 + sbb s1, s0 mov s0, 2*8(rp) pop s3 setc R8(sx) @@ -1130,7 +1130,7 @@ PROLOGUE(flint_mpn_subrsh_4) sbb s2, s3 mov s3, 2*8(rp) mov 3*8(ap), s0 - sub s1, s0 + sbb s1, s0 mov s0, 3*8(rp) pop s3 setc R8(sx) @@ -1173,7 +1173,7 @@ PROLOGUE(flint_mpn_subrsh_5) sbb s2, s3 mov s3, 3*8(rp) mov 4*8(ap), s0 - sub s1, s0 + sbb s1, s0 mov s0, 4*8(rp) pop s3 setc R8(sx) @@ 
-1223,7 +1223,7 @@ PROLOGUE(flint_mpn_subrsh_6) sbb s2, s3 mov s3, 4*8(rp) mov 5*8(ap), s0 - sub s1, s0 + sbb s1, s0 mov s0, 5*8(rp) pop s3 setc R8(sx) @@ -1280,7 +1280,7 @@ PROLOGUE(flint_mpn_subrsh_7) sbb s2, s3 mov s3, 5*8(rp) mov 6*8(ap), s0 - sub s1, s0 + sbb s1, s0 mov s0, 6*8(rp) pop s3 setc R8(sx) @@ -1344,7 +1344,7 @@ PROLOGUE(flint_mpn_subrsh_8) sbb s2, s3 mov s3, 6*8(rp) mov 7*8(ap), s0 - sub s1, s0 + sbb s1, s0 mov s0, 7*8(rp) pop s3 setc R8(sx) @@ -1415,7 +1415,7 @@ PROLOGUE(flint_mpn_subrsh_9) sbb s2, s3 mov s3, 7*8(rp) mov 8*8(ap), s0 - sub s1, s0 + sbb s1, s0 mov s0, 8*8(rp) pop s3 setc R8(sx) @@ -1493,7 +1493,7 @@ PROLOGUE(flint_mpn_subrsh_10) sbb s2, s3 mov s3, 8*8(rp) mov 9*8(ap), s0 - sub s1, s0 + sbb s1, s0 mov s0, 9*8(rp) pop s3 setc R8(sx) @@ -1578,7 +1578,7 @@ PROLOGUE(flint_mpn_subrsh_11) sbb s2, s3 mov s3, 9*8(rp) mov 10*8(ap), s0 - sub s1, s0 + sbb s1, s0 mov s0, 10*8(rp) pop s3 setc R8(sx) @@ -1670,7 +1670,7 @@ PROLOGUE(flint_mpn_subrsh_12) sbb s2, s3 mov s3, 10*8(rp) mov 11*8(ap), s0 - sub s1, s0 + sbb s1, s0 mov s0, 11*8(rp) pop s3 setc R8(sx) @@ -1769,7 +1769,7 @@ PROLOGUE(flint_mpn_subrsh_13) sbb s2, s3 mov s3, 11*8(rp) mov 12*8(ap), s0 - sub s1, s0 + sbb s1, s0 mov s0, 12*8(rp) pop s3 setc R8(sx) @@ -1875,7 +1875,7 @@ PROLOGUE(flint_mpn_subrsh_14) sbb s2, s3 mov s3, 12*8(rp) mov 13*8(ap), s0 - sub s1, s0 + sbb s1, s0 mov s0, 13*8(rp) pop s3 setc R8(sx) @@ -1988,7 +1988,7 @@ PROLOGUE(flint_mpn_subrsh_15) sbb s2, s3 mov s3, 13*8(rp) mov 14*8(ap), s0 - sub s1, s0 + sbb s1, s0 mov s0, 14*8(rp) pop s3 setc R8(sx) @@ -2108,7 +2108,7 @@ PROLOGUE(flint_mpn_subrsh_16) sbb s2, s3 mov s3, 14*8(rp) mov 15*8(ap), s0 - sub s1, s0 + sbb s1, s0 mov s0, 15*8(rp) pop s3 setc R8(sx)