2022-11-22 11:02:37 +08:00
|
|
|
//go:build (amd64 && !purego) || (arm64 && !purego)
|
2022-01-21 11:24:10 +08:00
|
|
|
|
|
|
|
package sm4
|
|
|
|
|
|
|
|
import (
|
|
|
|
"crypto/cipher"
|
2023-03-08 15:39:48 +08:00
|
|
|
"os"
|
2022-01-21 11:24:10 +08:00
|
|
|
|
2022-08-18 14:49:35 +08:00
|
|
|
"github.com/emmansun/gmsm/internal/alias"
|
2024-01-24 13:11:09 +08:00
|
|
|
"github.com/emmansun/gmsm/internal/cpuid"
|
2022-01-21 11:24:10 +08:00
|
|
|
"golang.org/x/sys/cpu"
|
|
|
|
)
|
|
|
|
|
2023-03-08 15:39:48 +08:00
|
|
|
var supportSM4 = cpu.ARM64.HasSM4 && os.Getenv("DISABLE_SM4NI") != "1"
|
2024-01-24 13:11:09 +08:00
|
|
|
var supportsAES = cpuid.HasAES
|
|
|
|
var supportsGFMUL = cpuid.HasGFMUL
|
2023-07-04 10:04:15 +08:00
|
|
|
var useAVX2 = cpu.X86.HasAVX2
|
2023-07-03 12:00:27 +08:00
|
|
|
var useAVX = cpu.X86.HasAVX
|
2024-01-25 17:46:09 +08:00
|
|
|
var useAESNI4SingleBlock = os.Getenv("FORCE_SM4BLOCK_AESNI") == "1"
|
2022-01-21 11:24:10 +08:00
|
|
|
|
2022-04-29 12:09:04 +08:00
|
|
|
// Selector values passed as the inst argument of the assembly routines.
const (
	// INST_AES (0) is passed when the AES-instruction based code path is wanted.
	INST_AES int = iota
	// INST_SM4 (1) is passed when the SM4-instruction based code path is wanted.
	INST_SM4
)
|
|
|
|
|
2022-01-21 11:24:10 +08:00
|
|
|
// encryptBlocksAsm is declared without a Go body; its implementation lives
// outside this file (presumably in the package's assembly sources).
//
// xk points at the first round key, dst and src are the output and input
// buffers, and inst is one of INST_AES or INST_SM4.
//
//go:noescape
func encryptBlocksAsm(xk *uint32, dst []byte, src []byte, inst int)
|
2022-01-21 11:24:10 +08:00
|
|
|
|
|
|
|
// encryptBlockAsm is declared without a Go body; its implementation lives
// outside this file (presumably in the package's assembly sources).
//
// xk points at the first round key, dst and src point at the first byte of
// the output and input block, and inst is one of INST_AES or INST_SM4.
//
//go:noescape
func encryptBlockAsm(xk *uint32, dst *byte, src *byte, inst int)
|
2022-01-21 11:24:10 +08:00
|
|
|
|
|
|
|
// expandKeyAsm is declared without a Go body; its implementation lives
// outside this file (presumably in the package's assembly sources).
//
// key points at the first key byte, ck at the first entry of the package's ck
// table, enc and dec at the first entry of the encryption and decryption
// round-key slices, and inst is one of INST_AES or INST_SM4.
//
//go:noescape
func expandKeyAsm(key *byte, ck *uint32, enc *uint32, dec *uint32, inst int)
|
2022-01-21 11:24:10 +08:00
|
|
|
|
|
|
|
type sm4CipherAsm struct {
|
|
|
|
sm4Cipher
|
|
|
|
batchBlocks int
|
|
|
|
blocksSize int
|
|
|
|
}
|
|
|
|
|
2022-04-29 12:09:04 +08:00
|
|
|
func newCipher(key []byte) (cipher.Block, error) {
|
2022-04-28 13:46:50 +08:00
|
|
|
if supportSM4 {
|
2022-04-29 12:09:04 +08:00
|
|
|
return newCipherNI(key)
|
2022-04-28 13:46:50 +08:00
|
|
|
}
|
2022-04-29 12:09:04 +08:00
|
|
|
|
|
|
|
if !supportsAES {
|
|
|
|
return newCipherGeneric(key)
|
|
|
|
}
|
|
|
|
|
|
|
|
blocks := 4
|
|
|
|
if useAVX2 {
|
|
|
|
blocks = 8
|
|
|
|
}
|
|
|
|
c := &sm4CipherAsm{sm4Cipher{make([]uint32, rounds), make([]uint32, rounds)}, blocks, blocks * BlockSize}
|
|
|
|
expandKeyAsm(&key[0], &ck[0], &c.enc[0], &c.dec[0], INST_AES)
|
|
|
|
if supportsGFMUL {
|
|
|
|
return &sm4CipherGCM{c}, nil
|
|
|
|
}
|
|
|
|
return c, nil
|
2022-04-28 13:46:50 +08:00
|
|
|
}
|
|
|
|
|
2022-04-29 12:09:04 +08:00
|
|
|
// Concurrency reports the number of blocks handled per batch call, as fixed
// when the cipher was constructed.
func (c *sm4CipherAsm) Concurrency() int {
	return c.batchBlocks
}
|
|
|
|
|
2022-01-21 11:24:10 +08:00
|
|
|
func (c *sm4CipherAsm) Encrypt(dst, src []byte) {
|
|
|
|
if len(src) < BlockSize {
|
|
|
|
panic("sm4: input not full block")
|
|
|
|
}
|
|
|
|
if len(dst) < BlockSize {
|
|
|
|
panic("sm4: output not full block")
|
|
|
|
}
|
2022-08-18 14:49:35 +08:00
|
|
|
if alias.InexactOverlap(dst[:BlockSize], src[:BlockSize]) {
|
2022-01-21 11:24:10 +08:00
|
|
|
panic("sm4: invalid buffer overlap")
|
|
|
|
}
|
2024-01-25 17:46:09 +08:00
|
|
|
if useAESNI4SingleBlock {
|
|
|
|
encryptBlockAsm(&c.enc[0], &dst[0], &src[0], INST_AES)
|
|
|
|
} else {
|
|
|
|
encryptBlockGo(c.enc, dst, src)
|
2022-01-21 11:24:10 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
func (c *sm4CipherAsm) Decrypt(dst, src []byte) {
|
|
|
|
if len(src) < BlockSize {
|
|
|
|
panic("sm4: input not full block")
|
|
|
|
}
|
|
|
|
if len(dst) < BlockSize {
|
|
|
|
panic("sm4: output not full block")
|
|
|
|
}
|
2022-08-18 14:49:35 +08:00
|
|
|
if alias.InexactOverlap(dst[:BlockSize], src[:BlockSize]) {
|
2022-01-21 11:24:10 +08:00
|
|
|
panic("sm4: invalid buffer overlap")
|
|
|
|
}
|
2024-01-25 17:46:09 +08:00
|
|
|
if useAESNI4SingleBlock {
|
|
|
|
encryptBlockAsm(&c.dec[0], &dst[0], &src[0], INST_AES)
|
|
|
|
} else {
|
2024-01-31 13:08:51 +08:00
|
|
|
encryptBlockGo(c.dec, dst, src)
|
2024-01-25 17:46:09 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
func (c *sm4CipherAsm) EncryptBlocks(dst, src []byte) {
|
|
|
|
if len(src) < c.blocksSize {
|
|
|
|
panic("sm4: input not full blocks")
|
|
|
|
}
|
|
|
|
if len(dst) < c.blocksSize {
|
|
|
|
panic("sm4: output not full blocks")
|
|
|
|
}
|
|
|
|
if alias.InexactOverlap(dst[:c.blocksSize], src[:c.blocksSize]) {
|
|
|
|
panic("sm4: invalid buffer overlap")
|
|
|
|
}
|
|
|
|
encryptBlocksAsm(&c.enc[0], dst, src, INST_AES)
|
2022-01-21 11:24:10 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
func (c *sm4CipherAsm) DecryptBlocks(dst, src []byte) {
|
|
|
|
if len(src) < c.blocksSize {
|
|
|
|
panic("sm4: input not full blocks")
|
|
|
|
}
|
|
|
|
if len(dst) < c.blocksSize {
|
|
|
|
panic("sm4: output not full blocks")
|
|
|
|
}
|
2022-08-18 14:49:35 +08:00
|
|
|
if alias.InexactOverlap(dst[:c.blocksSize], src[:c.blocksSize]) {
|
2022-01-21 11:24:10 +08:00
|
|
|
panic("sm4: invalid buffer overlap")
|
|
|
|
}
|
2022-04-29 12:09:04 +08:00
|
|
|
encryptBlocksAsm(&c.dec[0], dst, src, INST_AES)
|
2022-01-21 11:24:10 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
// expandKey is used by BenchmarkExpand to ensure that the asm implementation
|
|
|
|
// of key expansion is used for the benchmark when it is available.
|
|
|
|
func expandKey(key []byte, enc, dec []uint32) {
|
2022-04-28 13:46:50 +08:00
|
|
|
if supportSM4 {
|
2022-04-29 12:09:04 +08:00
|
|
|
expandKeyAsm(&key[0], &ck[0], &enc[0], &dec[0], INST_SM4)
|
2022-04-28 13:46:50 +08:00
|
|
|
} else if supportsAES {
|
2022-04-29 12:09:04 +08:00
|
|
|
expandKeyAsm(&key[0], &ck[0], &enc[0], &dec[0], INST_AES)
|
2022-01-21 11:24:10 +08:00
|
|
|
} else {
|
|
|
|
expandKeyGo(key, enc, dec)
|
|
|
|
}
|
|
|
|
}
|