[dpdk-dev] [PATCH v5 1/2] librte_net: add crc compute APIs
De Lara Guarch, Pablo
pablo.de.lara.guarch at intel.com
Tue Mar 28 20:04:16 CEST 2017
Hi Jasvinder,
> -----Original Message-----
> From: Singh, Jasvinder
> Sent: Tuesday, March 21, 2017 2:46 PM
> To: dev at dpdk.org
> Cc: olivier.matz at 6wind.com; Doherty, Declan; De Lara Guarch, Pablo
> Subject: [PATCH v5 1/2] librte_net: add crc compute APIs
>
> APIs for selecting the architecure specific implementation and computing
> the crc (16-bit and 32-bit CRCs) are added. For CRCs calculation, scalar
> as well as x86 intrinsic(sse4.2) versions are implemented.
>
> The scalar version is based on generic Look-Up Table(LUT) algorithm,
> while x86 intrinsic version uses carry-less multiplication for
> fast CRC computation.
>
> Signed-off-by: Jasvinder Singh <jasvinder.singh at intel.com>
> ---
> diff --git a/lib/librte_net/rte_net_crc.c b/lib/librte_net/rte_net_crc.c
> new file mode 100644
> index 0000000..89edd80
> --- /dev/null
> +++ b/lib/librte_net/rte_net_crc.c
...
> +
> +#include <rte_net_crc.h>
> +#include <stddef.h>
> +
> +/** crc tables */
> +static uint32_t crc32_eth_lut[256];
> +static uint32_t crc16_ccitt_lut[256];
Use a macro for 256, which you can also use in crc32_eth_init_lut.
> +
> +static uint32_t rte_crc16_ccitt_handler(const uint8_t *data,
> + uint32_t data_len);
Put "static uint32_t" on a separate line.
> +/**
> + * Reflect the bits about the middle
> + *
> + * @param x value to be reflected
Should be "val".
> + *
> + * @return reflected value
> + */
> +static uint32_t
> +reflect_32bits(const uint32_t val)
No need for "const" here, as it is not a pointer.
> +{
> + uint32_t i, res = 0;
> +
> + for (i = 0; i < 32; i++)
> + if ((val & (1 << i)) != 0)
> + res |= (uint32_t)(1 << (31 - i));
> +
> + return res;
> +}
> +
> +static void
> +crc32_eth_init_lut(const uint32_t poly,
No need for "const" here.
> + uint32_t *lut)
> +{
> + uint_fast32_t i, j;
> +
> + for (i = 0; i < 256; i++) {
> + uint_fast32_t crc = reflect_32bits(i);
> +
> + for (j = 0; j < 8; j++) {
> + if (crc & 0x80000000L)
> + crc = (crc << 1) ^ poly;
> + else
> + crc <<= 1;
> + }
> + lut[i] = reflect_32bits(crc);
Wrong indentation.
> + }
> +}
> +
> +static inline __attribute__((always_inline)) uint32_t
> +crc32_eth_calc_lut(const uint8_t *data,
> + uint32_t data_len,
> + uint32_t crc,
> + const uint32_t *lut)
> +{
> + while (data_len--)
> + crc = lut[(crc ^ *data++) & 0xffL] ^ (crc >> 8);
> +
> + return crc;
> +}
> +
> +static void
> +rte_net_crc_scalar_init(void)
> +{
> + /** 32-bit crc init */
> + crc32_eth_init_lut(CRC32_ETH_POLYNOMIAL, crc32_eth_lut);
> +
> + /** 16-bit CRC init */
> + crc32_eth_init_lut(CRC16_CCITT_POLYNOMIAL << 16,
> crc16_ccitt_lut);
> +
Remove this blank line.
> +}
> +
> +static inline uint32_t
> +rte_crc16_ccitt_handler(const uint8_t *data, uint32_t data_len)
> +{
> + return (uint16_t)~crc32_eth_calc_lut(data,
> + data_len,
> + 0xffff,
> + crc16_ccitt_lut);
Since you are casting to uint16_t while the function's return type is
uint32_t, I would add a comment explaining why.
> +}
> +
> diff --git a/lib/librte_net/rte_net_crc.h b/lib/librte_net/rte_net_crc.h
> new file mode 100644
> index 0000000..f8c9075
> --- /dev/null
> +++ b/lib/librte_net/rte_net_crc.h
> @@ -0,0 +1,101 @@
...
> +
> +/**
> + * This API set the crc computation algorithm (i.e. scalar version,
> + * x86 64-bit sse4.2 intrinsic version, etc.) and internal data
> + * structure.
> + *
> + * @param alg
Add extra information (CRC algorithm?).
> + * - RTE_NET_CRC_SCALAR
> + * - RTE_NET_CRC_SSE42 (Use 64-bit SSE4.2 intrinsic)
> + */
> +void
> +rte_net_crc_set_alg(enum rte_net_crc_alg alg);
> +
> +/**
> + * CRC compute API
> + *
> + * @param data
> + * Pointer to the packet data for crc computation
> + * @param data_len
> + * Data length for crc computation
> + * @param type
> + * Crc type (enum rte_net_crc_type)
CRC
> + *
> + * @return
> + * crc value
Add two spaces after "@param" and "@return".
> + */
> +uint32_t
> +rte_net_crc_calc(const void *data,
> + uint32_t data_len,
> + enum rte_net_crc_type type);
> +
> +#if defined(RTE_ARCH_X86_64) || defined(RTE_CPU_FALGS_SSE_4_2)
Typo in RTE_CPU_FALGS_SSE_4_2 (I missed the same one in rte_net_crc.c).
Also, should it be "&&"?
> +#include <rte_net_crc_sse.h>
> +#endif
> +
> +#ifdef __cplusplus
> +}
> +#endif
> +
> +
> +#endif /* _RTE_NET_CRC_H_ */
> diff --git a/lib/librte_net/rte_net_crc_sse.h
> b/lib/librte_net/rte_net_crc_sse.h
> new file mode 100644
> index 0000000..e9af22d
> --- /dev/null
> +++ b/lib/librte_net/rte_net_crc_sse.h
> @@ -0,0 +1,345 @@
...
> + * @brief Performs one folding round
> + *
> + * Logically function operates as follows:
> + * DATA = READ_NEXT_16BYTES();
> + * F1 = LSB8(FOLD)
> + * F2 = MSB8(FOLD)
> + * T1 = CLMUL(F1, RK1)
> + * T2 = CLMUL(F2, RK2)
> + * FOLD = XOR(T1, T2, DATA)
> + *
> + * @param data_block 16 byte data block
> + * @param precomp precomputed rk1 constanst
> + * @param fold running 16 byte folded data
> + *
> + * @return New 16 byte folded data
Move the parameter/return descriptions to a separate line (same for other functions).
> + */
> +static inline __attribute__((always_inline)) __m128i
> +crcr32_folding_round(const __m128i data_block,
> + const __m128i precomp,
> + const __m128i fold)
No need to use "const" here.
> +{
> + __m128i tmp0 = _mm_clmulepi64_si128(fold, precomp, 0x01);
> + __m128i tmp1 = _mm_clmulepi64_si128(fold, precomp, 0x10);
> +
> + return _mm_xor_si128(tmp1, _mm_xor_si128(data_block, tmp0));
> +}
> +
> +/**
> + * Performs reduction from 128 bits to 64 bits
> + *
> + * @param data128 128 bits data to be reduced
> + * @param precomp rk5 and rk6 precomputed constants
> + *
> + * @return data reduced to 64 bits
> + */
> +
> +static inline __attribute__((always_inline)) __m128i
> +crcr32_reduce_128_to_64(__m128i data128,
> + const __m128i precomp)
No need to use "const" here.
...
> +
> +
> +static inline void
> +rte_net_crc_sse42_init(void)
> +{
> + uint64_t k1, k2, k5, k6;
> + uint64_t p = 0, q = 0;
> +
> + /** Initialize CRC16 data */
> + k1 = 0x189aeLLU;
> + k2 = 0x8e10LLU;
> + k5 = 0x189aeLLU;
> + k6 = 0x114aaLLU;
> + q = 0x11c581910LLU;
> + p = 0x10811LLU;
> +
> + /** Save the params in context structure */
> + crc16_ccitt_pclmulqdq.rk1_rk2 =
> + _mm_setr_epi64(_mm_cvtsi64_m64(k1),
> _mm_cvtsi64_m64(k2));
> + crc16_ccitt_pclmulqdq.rk5_rk6 =
> + _mm_setr_epi64(_mm_cvtsi64_m64(k5),
> _mm_cvtsi64_m64(k6));
> + crc16_ccitt_pclmulqdq.rk7_rk8 =
> + _mm_setr_epi64(_mm_cvtsi64_m64(q),
> _mm_cvtsi64_m64(p));
> +
> + /** Initialize CRC32 data */
> + k1 = 0xccaa009eLLU;
> + k2 = 0x1751997d0LLU;
> + k5 = 0xccaa009eLLU;
> + k6 = 0x163cd6124LLU;
> + q = 0x1f7011640LLU;
> + p = 0x1db710641LLU;
> +
> + /** Save the params in context structure */
> + crc32_eth_pclmulqdq.rk1_rk2 =
> + _mm_setr_epi64(_mm_cvtsi64_m64(k1),
> _mm_cvtsi64_m64(k2));
Add extra tab for better readability.
> + crc32_eth_pclmulqdq.rk5_rk6 =
> + _mm_setr_epi64(_mm_cvtsi64_m64(k5),
> _mm_cvtsi64_m64(k6));
> + crc32_eth_pclmulqdq.rk7_rk8 =
> + _mm_setr_epi64(_mm_cvtsi64_m64(q),
> _mm_cvtsi64_m64(p));
> +
> + _mm_empty();
Maybe we need a comment here.
> +
> +}
> +
> +static inline uint32_t
> +rte_crc16_ccitt_sse42_handler(const uint8_t *data,
> + uint32_t data_len)
> +{
> + return (uint16_t)~crc32_eth_calc_pclmulqdq(data,
> + data_len,
> + 0xffff,
> + &crc16_ccitt_pclmulqdq);
Same comment about the casting here.
> +}
> +
> +static inline uint32_t
> +rte_crc32_eth_sse42_handler(const uint8_t *data,
> + uint32_t data_len)
> +{
> + return ~crc32_eth_calc_pclmulqdq(data,
> + data_len,
> + 0xffffffffUL,
> + &crc32_eth_pclmulqdq);
> +}
> +
> +#ifdef __cplusplus
> +}
> +#endif
> +
> +#endif /* _RTE_NET_CRC_SSE_H_ */
> diff --git a/lib/librte_net/rte_net_version.map
> b/lib/librte_net/rte_net_version.map
> index 3b15e65..c6716ec 100644
> --- a/lib/librte_net/rte_net_version.map
> +++ b/lib/librte_net/rte_net_version.map
> @@ -4,3 +4,11 @@ DPDK_16.11 {
>
> local: *;
> };
> +
> +DPDK_17.05 {
> + global:
> +
> + rte_net_crc_set_alg;
> + rte_net_crc_calc;
This has to be alphabetically sorted.
> +
> +} DPDK_16.11;
> --
> 2.5.5
More information about the dev
mailing list