mirror of
https://github.com/raspberrypi/linux.git
synced 2025-12-19 00:04:18 +00:00
Instantiate crc-pclmul-template.S for crc_t10dif and delete the original
PCLMULQDQ optimized implementation. This has the following advantages:
- Less CRC-variant-specific code.
- VPCLMULQDQ support, greatly improving performance on sufficiently long
messages on newer CPUs.
- A faster reduction from 128 bits to the final CRC.
- Support for i386.
Benchmark results on AMD Ryzen 9 9950X (Zen 5) using crc_kunit:
Length Before After
------ ------ -----
1 440 MB/s 386 MB/s
16 1865 MB/s 2008 MB/s
64 4343 MB/s 6917 MB/s
127 5440 MB/s 8909 MB/s
128 5533 MB/s 12150 MB/s
200 5908 MB/s 14423 MB/s
256 15870 MB/s 21288 MB/s
511 14219 MB/s 25840 MB/s
512 18361 MB/s 37797 MB/s
1024 19941 MB/s 61374 MB/s
3173 20461 MB/s 74909 MB/s
4096 21310 MB/s 78919 MB/s
16384 21663 MB/s 85012 MB/s
Acked-by: Ard Biesheuvel <ardb@kernel.org>
Acked-by: Keith Busch <kbusch@kernel.org>
Reviewed-by: "Martin K. Petersen" <martin.petersen@oracle.com>
Link: https://lore.kernel.org/r/20250210174540.161705-6-ebiggers@kernel.org
Signed-off-by: Eric Biggers <ebiggers@google.com>
41 lines
915 B
C
41 lines
915 B
C
// SPDX-License-Identifier: GPL-2.0-or-later
|
|
/*
|
|
* CRC-T10DIF using [V]PCLMULQDQ instructions
|
|
*
|
|
* Copyright 2024 Google LLC
|
|
*/
|
|
|
|
#include <linux/crc-t10dif.h>
|
|
#include <linux/module.h>
|
|
#include "crc-pclmul-template.h"
|
|
|
|
static DEFINE_STATIC_KEY_FALSE(have_pclmulqdq);
|
|
|
|
DECLARE_CRC_PCLMUL_FUNCS(crc16_msb, u16);
|
|
|
|
u16 crc_t10dif_arch(u16 crc, const u8 *p, size_t len)
|
|
{
|
|
CRC_PCLMUL(crc, p, len, crc16_msb, crc16_msb_0x8bb7_consts,
|
|
have_pclmulqdq);
|
|
return crc_t10dif_generic(crc, p, len);
|
|
}
|
|
EXPORT_SYMBOL(crc_t10dif_arch);
|
|
|
|
static int __init crc_t10dif_x86_init(void)
|
|
{
|
|
if (boot_cpu_has(X86_FEATURE_PCLMULQDQ)) {
|
|
static_branch_enable(&have_pclmulqdq);
|
|
INIT_CRC_PCLMUL(crc16_msb);
|
|
}
|
|
return 0;
|
|
}
|
|
arch_initcall(crc_t10dif_x86_init);
|
|
|
|
static void __exit crc_t10dif_x86_exit(void)
|
|
{
|
|
}
|
|
module_exit(crc_t10dif_x86_exit);
|
|
|
|
MODULE_DESCRIPTION("CRC-T10DIF using [V]PCLMULQDQ instructions");
|
|
MODULE_LICENSE("GPL");
|