crypto/elliptic: use a 4-bit sliding window for P-521 ScalarMult

name                    old time/op    new time/op    delta
pkg:crypto/elliptic goos:darwin goarch:amd64
ScalarBaseMult/P521-16    1.63ms ± 4%    1.00ms ± 1%  -38.69%  (p=0.000 n=10+8)
ScalarMult/P521-16        1.65ms ± 4%    0.99ms ± 2%  -40.15%  (p=0.000 n=10+10)
pkg:crypto/ecdsa goos:darwin goarch:amd64
Sign/P521-16              1.67ms ± 1%    1.12ms ± 2%  -32.82%  (p=0.000 n=8+10)
Verify/P521-16            3.10ms ± 2%    2.00ms ± 2%  -35.54%  (p=0.000 n=9+10)
GenerateKey/P521-16       1.53ms ± 1%    0.98ms ± 2%  -35.81%  (p=0.000 n=9+10)

Change-Id: I109e821399d71330a77d105496e227746cc3ea0d
Reviewed-on: https://go-review.googlesource.com/c/go/+/320072
Trust: Filippo Valsorda <filippo@golang.org>
Run-TryBot: Filippo Valsorda <filippo@golang.org>
TryBot-Result: Go Bot <gobot@golang.org>
Reviewed-by: Julie Qiu <julie@golang.org>
This commit is contained in:
Filippo Valsorda 2021-05-14 13:03:45 -04:00
parent e39b854a67
commit d1dceafc29

View file

@ -6,6 +6,7 @@ package elliptic
import (
"crypto/elliptic/internal/fiat"
"crypto/subtle"
"math/big"
)
@ -243,13 +244,42 @@ func (curve p521Curve) ScalarMult(Bx, By *big.Int, scalar []byte) (*big.Int, *bi
B := newP521PointFromAffine(Bx, By)
p, t := newP521Point(), newP521Point()
// table holds the first 16 multiples of q. The explicit newP521Point calls
// get inlined, letting the allocations live on the stack.
var table = [16]*p521Point{
newP521Point(), newP521Point(), newP521Point(), newP521Point(),
newP521Point(), newP521Point(), newP521Point(), newP521Point(),
newP521Point(), newP521Point(), newP521Point(), newP521Point(),
newP521Point(), newP521Point(), newP521Point(), newP521Point(),
}
for i := 1; i < 16; i++ {
table[i].Add(table[i-1], B)
}
// Instead of doing the classic double-and-add chain, we do it with a
// four-bit window: we double four times, and then add [0-15]P.
for _, byte := range scalar {
for bitNum := 0; bitNum < 8; bitNum++ {
p.Double(p)
t.Add(p, B)
bit := (byte >> (7 - bitNum)) & 1
p.Select(t, p, int(bit))
p.Double(p)
p.Double(p)
p.Double(p)
p.Double(p)
for i := uint8(0); i < 16; i++ {
cond := subtle.ConstantTimeByteEq(byte>>4, i)
t.Select(table[i], t, cond)
}
p.Add(p, t)
p.Double(p)
p.Double(p)
p.Double(p)
p.Double(p)
for i := uint8(0); i < 16; i++ {
cond := subtle.ConstantTimeByteEq(byte&0b1111, i)
t.Select(table[i], t, cond)
}
p.Add(p, t)
}
return p.Affine()