From 35db3f90b3be29edbc0e3b4abc0d683be062c558 Mon Sep 17 00:00:00 2001 From: MITSUNARI Shigeo Date: Thu, 25 Feb 2021 14:15:52 +0900 Subject: [PATCH] use fqrPre + mod for N = 4 --- src/fp_generator.hpp | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/src/fp_generator.hpp b/src/fp_generator.hpp index c839873..6a59244 100644 --- a/src/fp_generator.hpp +++ b/src/fp_generator.hpp @@ -1267,7 +1267,7 @@ private: return func; } if (pn_ == 4 && useMulx_) { -#if 1 +#if 0 // sqr(y, x) = mul(y, x, x) #ifdef XBYAK64_WIN mov(r8, rdx); @@ -1275,7 +1275,7 @@ private: mov(rdx, rsi); #endif jmp((const void*)op_->fp_mulA_); -#else // (sqrPre + mod) is slower than mul +#else // (sqrPre + mod) is faster than mul StackFrame sf(this, 3, 10 | UseRDX, 8 * 8); Pack t = sf.t; t.append(sf.p[2]);