aboutsummaryrefslogtreecommitdiffstats
path: root/include
diff options
context:
space:
mode:
authorMITSUNARI Shigeo <herumi@nifty.com>2017-01-11 11:16:31 +0800
committerMITSUNARI Shigeo <herumi@nifty.com>2017-01-11 11:16:36 +0800
commitbf035e3692e283b687d6ae2bb8e111b5c088b612 (patch)
treef10201f34fe46c61920bfc7643bd5144d7330668 /include
parent7b99668980fd9346e319d828f95b64758b64cfd0 (diff)
downloadtangerine-mcl-bf035e3692e283b687d6ae2bb8e111b5c088b612.tar.gz
tangerine-mcl-bf035e3692e283b687d6ae2bb8e111b5c088b612.tar.zst
tangerine-mcl-bf035e3692e283b687d6ae2bb8e111b5c088b612.zip
a little faster fp2_mul for llvm
Diffstat (limited to 'include')
-rw-r--r--include/mcl/fp_tower.hpp11
-rw-r--r--include/mcl/op.hpp2
2 files changed, 12 insertions, 1 deletions
diff --git a/include/mcl/fp_tower.hpp b/include/mcl/fp_tower.hpp
index a0edde5..28f1772 100644
--- a/include/mcl/fp_tower.hpp
+++ b/include/mcl/fp_tower.hpp
@@ -214,7 +214,11 @@ public:
if (op.isFastMod) {
op.fp2_mul = fp2_mulW;
} else if (!op.isFullBit) {
- op.fp2_mul = fp2_mulUseDblUseNCW;
+ if (sizeof(Fp) * 8 == op.N * fp::UnitBitSize && op.fp2_mulNF) {
+ op.fp2_mul = fp2_mulNFW;
+ } else {
+ op.fp2_mul = fp2_mulUseDblUseNCW;
+ }
} else {
op.fp2_mul = fp2_mulUseDblW;
}
@@ -306,6 +310,11 @@ private:
FpDbl::sub(d1, d1, d2); // ac - bd
FpDbl::mod(pz[0], d1); // set z0
}
+ static void fp2_mulNFW(Unit *z, const Unit *x, const Unit *y)
+ {
+ const fp::Op& op = Fp::op_;
+ op.fp2_mulNF(z, x, y, op.p);
+ }
static void fp2_mulUseDblUseNCW(Unit *z, const Unit *x, const Unit *y)
{
const Fp *px = reinterpret_cast<const Fp*>(x);
diff --git a/include/mcl/op.hpp b/include/mcl/op.hpp
index 0e5cba9..159047a 100644
--- a/include/mcl/op.hpp
+++ b/include/mcl/op.hpp
@@ -123,6 +123,7 @@ struct Op {
void3u fp2_add;
void3u fp2_sub;
void3u fp2_mul;
+ void4u fp2_mulNF;
void2u fp2_neg;
void2u fp2_inv;
void2u fp2_sqr;
@@ -188,6 +189,7 @@ struct Op {
fp2_add = 0;
fp2_sub = 0;
fp2_mul = 0;
+ fp2_mulNF = 0;
fp2_neg = 0;
fp2_inv = 0;
fp2_sqr = 0;