78 lines
3.7 KiB
C
78 lines
3.7 KiB
C
/*
|
|
* Copyright 2005-2021 The OpenSSL Project Authors. All Rights Reserved.
|
|
*
|
|
* Licensed under the Apache License 2.0 (the "License"). You may not use
|
|
* this file except in compliance with the License. You can obtain a copy
|
|
* in the file LICENSE in the source distribution or at
|
|
* https://www.openssl.org/source/license.html
|
|
*/
|
|
|
|
#include <stdlib.h>
|
|
#include <openssl/bn.h>
|
|
#include "internal/cryptlib.h"
|
|
#include "crypto/sparc_arch.h"
|
|
#include "bn_local.h" /* for definition of bn_mul_mont */
|
|
|
|
int bn_mul_mont(BN_ULONG *rp, const BN_ULONG *ap, const BN_ULONG *bp,
|
|
const BN_ULONG *np, const BN_ULONG *n0, int num)
|
|
{
|
|
int bn_mul_mont_vis3(BN_ULONG *rp, const BN_ULONG *ap, const BN_ULONG *bp,
|
|
const BN_ULONG *np, const BN_ULONG *n0, int num);
|
|
int bn_mul_mont_fpu(BN_ULONG *rp, const BN_ULONG *ap, const BN_ULONG *bp,
|
|
const BN_ULONG *np, const BN_ULONG *n0, int num);
|
|
int bn_mul_mont_int(BN_ULONG *rp, const BN_ULONG *ap, const BN_ULONG *bp,
|
|
const BN_ULONG *np, const BN_ULONG *n0, int num);
|
|
|
|
if (!(num & 1) && num >= 6) {
|
|
if ((num & 15) == 0 && num <= 64 &&
|
|
(OPENSSL_sparcv9cap_P[1] & (CFR_MONTMUL | CFR_MONTSQR)) ==
|
|
(CFR_MONTMUL | CFR_MONTSQR)) {
|
|
typedef int (*bn_mul_mont_f) (BN_ULONG *rp, const BN_ULONG *ap,
|
|
const BN_ULONG *bp,
|
|
const BN_ULONG *np,
|
|
const BN_ULONG *n0);
|
|
int bn_mul_mont_t4_8(BN_ULONG *rp, const BN_ULONG *ap,
|
|
const BN_ULONG *bp, const BN_ULONG *np,
|
|
const BN_ULONG *n0);
|
|
int bn_mul_mont_t4_16(BN_ULONG *rp, const BN_ULONG *ap,
|
|
const BN_ULONG *bp, const BN_ULONG *np,
|
|
const BN_ULONG *n0);
|
|
int bn_mul_mont_t4_24(BN_ULONG *rp, const BN_ULONG *ap,
|
|
const BN_ULONG *bp, const BN_ULONG *np,
|
|
const BN_ULONG *n0);
|
|
int bn_mul_mont_t4_32(BN_ULONG *rp, const BN_ULONG *ap,
|
|
const BN_ULONG *bp, const BN_ULONG *np,
|
|
const BN_ULONG *n0);
|
|
static const bn_mul_mont_f funcs[4] = {
|
|
bn_mul_mont_t4_8, bn_mul_mont_t4_16,
|
|
bn_mul_mont_t4_24, bn_mul_mont_t4_32
|
|
};
|
|
bn_mul_mont_f worker = funcs[num / 16 - 1];
|
|
|
|
if ((*worker) (rp, ap, bp, np, n0))
|
|
return 1;
|
|
/* retry once and fall back */
|
|
if ((*worker) (rp, ap, bp, np, n0))
|
|
return 1;
|
|
return bn_mul_mont_vis3(rp, ap, bp, np, n0, num);
|
|
}
|
|
if ((OPENSSL_sparcv9cap_P[0] & SPARCV9_VIS3))
|
|
return bn_mul_mont_vis3(rp, ap, bp, np, n0, num);
|
|
else if (num >= 8 &&
|
|
/*
|
|
* bn_mul_mont_fpu doesn't use FMADD, we just use the
|
|
* flag to detect when FPU path is preferable in cases
|
|
* when current heuristics is unreliable. [it works
|
|
* out because FMADD-capable processors where FPU
|
|
* code path is undesirable are also VIS3-capable and
|
|
* VIS3 code path takes precedence.]
|
|
*/
|
|
( (OPENSSL_sparcv9cap_P[0] & SPARCV9_FMADD) ||
|
|
(OPENSSL_sparcv9cap_P[0] &
|
|
(SPARCV9_PREFER_FPU | SPARCV9_VIS1)) ==
|
|
(SPARCV9_PREFER_FPU | SPARCV9_VIS1) ))
|
|
return bn_mul_mont_fpu(rp, ap, bp, np, n0, num);
|
|
}
|
|
return bn_mul_mont_int(rp, ap, bp, np, n0, num);
|
|
}
|