-rw-r--r-- 1296 libntruprime-20240825/src/core/weightsntrupP/avx/weight.c raw
#include <immintrin.h>
#include "crypto_core.h"
#include "crypto_int8.h"
#include "crypto_int16.h"
#define int8 crypto_int8
#define int16 crypto_int16
#include "crypto_encode_int16.h"
#include "params.h"
/* out = little-endian weight of bottom bits of in */
void crypto_core(unsigned char *outbytes,const unsigned char *inbytes,const unsigned char *kbytes,const unsigned char *cbytes)
{
int8 *in = (void *) inbytes;
int i;
__m256i sum,sumhi;
int16 weight;
sum = _mm256_loadu_si256((__m256i *) (in+p-32));
sum &= endingmask;
for (i = p-32;i >= 0;i -= 32) {
__m256i bits = _mm256_loadu_si256((__m256i *) in);
bits &= _mm256_set1_epi8(1);
sum = _mm256_add_epi8(sum,bits);
in += 32;
}
/* sum is 32xint8; want to add these int8 */
sumhi = _mm256_srli_epi16(sum,8);
sum &= _mm256_set1_epi16(0xff);
sum = _mm256_add_epi16(sum,sumhi);
/* sum is 16xint16; want to add these int16 */
sum = _mm256_hadd_epi16(sum,sum);
/* want sum[0]+sum[1]+sum[2]+sum[3]+sum[8]+sum[9]+sum[10]+sum[11] */
sum = _mm256_hadd_epi16(sum,sum);
/* want sum[0]+sum[1]+sum[8]+sum[9] */
sum = _mm256_hadd_epi16(sum,sum);
/* want sum[0]+sum[8] */
weight = _mm256_extract_epi16(sum,0);
weight += _mm256_extract_epi16(sum,8);
crypto_encode_int16(outbytes,&weight);
}