Commit 5c7c5108, authored by Laurent THOMAS, committed by Robert Schmidt

Remove the useless AVOID_MM256_SIGN macro; the SIMD sign instruction (sign_epi8) is used in other places

parent cb562c27
...@@ -126,11 +126,7 @@ void nrLDPC_cnProc_BG1_generator_128(const char* dir, int R) ...@@ -126,11 +126,7 @@ void nrLDPC_cnProc_BG1_generator_128(const char* dir, int R)
// ymm0 = p_cnProcBuf[lut_idxCnProcG3[j][0] + i]; // ymm0 = p_cnProcBuf[lut_idxCnProcG3[j][0] + i];
fprintf(fd," ymm0 = ((simde__m128i*)cnProcBuf)[%d+i];\n",(lut_startAddrCnGroups[0]>>4)+lut_idxCnProcG3[j][0]*2); fprintf(fd," ymm0 = ((simde__m128i*)cnProcBuf)[%d+i];\n",(lut_startAddrCnGroups[0]>>4)+lut_idxCnProcG3[j][0]*2);
// sgn = simde_mm_sign_epi8(ones, ymm0); // sgn = simde_mm_sign_epi8(ones, ymm0);
#ifndef AVOID_MM256_SIGN
fprintf(fd," sgn = simde_mm_sign_epi8(ones, ymm0);\n"); fprintf(fd," sgn = simde_mm_sign_epi8(ones, ymm0);\n");
#else
fprintf(fd," sgn = simde_mm_xor_si128(ones, ymm0);\n");
#endif
// min = simde_mm_abs_epi8(ymm0); // min = simde_mm_abs_epi8(ymm0);
fprintf(fd," min = simde_mm_abs_epi8(ymm0);\n"); fprintf(fd," min = simde_mm_abs_epi8(ymm0);\n");
...@@ -142,11 +138,7 @@ void nrLDPC_cnProc_BG1_generator_128(const char* dir, int R) ...@@ -142,11 +138,7 @@ void nrLDPC_cnProc_BG1_generator_128(const char* dir, int R)
fprintf(fd," min = simde_mm_min_epu8(min, simde_mm_abs_epi8(ymm0));\n"); fprintf(fd," min = simde_mm_min_epu8(min, simde_mm_abs_epi8(ymm0));\n");
// sgn = simde_mm_sign_epi8(sgn, ymm0); // sgn = simde_mm_sign_epi8(sgn, ymm0);
#ifndef AVOID_MM256_SIGN
fprintf(fd," sgn = simde_mm_sign_epi8(sgn, ymm0);\n"); fprintf(fd," sgn = simde_mm_sign_epi8(sgn, ymm0);\n");
#else
fprintf(fd," sgn = simde_mm_xor_si128(sgn, ymm0);\n");
#endif
// Store result // Store result
// min = simde_mm_min_epu8(min, maxLLR); // 128 in epi8 is -127 // min = simde_mm_min_epu8(min, maxLLR); // 128 in epi8 is -127
#ifndef DROP_MAXLLR #ifndef DROP_MAXLLR
...@@ -193,11 +185,7 @@ void nrLDPC_cnProc_BG1_generator_128(const char* dir, int R) ...@@ -193,11 +185,7 @@ void nrLDPC_cnProc_BG1_generator_128(const char* dir, int R)
// ymm0 = p_cnProcBuf[lut_idxCnProcG3[j][0] + i]; // ymm0 = p_cnProcBuf[lut_idxCnProcG3[j][0] + i];
fprintf(fd," ymm0 = ((simde__m128i*)cnProcBuf)[%d+i];\n",(lut_startAddrCnGroups[1]>>4)+lut_idxCnProcG4[j][0]*2); fprintf(fd," ymm0 = ((simde__m128i*)cnProcBuf)[%d+i];\n",(lut_startAddrCnGroups[1]>>4)+lut_idxCnProcG4[j][0]*2);
// sgn = simde_mm_sign_epi8(ones, ymm0); // sgn = simde_mm_sign_epi8(ones, ymm0);
#ifndef AVOID_MM256_SIGN
fprintf(fd," sgn = simde_mm_sign_epi8(ones, ymm0);\n"); fprintf(fd," sgn = simde_mm_sign_epi8(ones, ymm0);\n");
#else
fprintf(fd," sgn = simde_mm_xor_si128(ones, ymm0);\n");
#endif
// min = simde_mm_abs_epi8(ymm0); // min = simde_mm_abs_epi8(ymm0);
fprintf(fd," min = simde_mm_abs_epi8(ymm0);\n"); fprintf(fd," min = simde_mm_abs_epi8(ymm0);\n");
...@@ -211,11 +199,7 @@ void nrLDPC_cnProc_BG1_generator_128(const char* dir, int R) ...@@ -211,11 +199,7 @@ void nrLDPC_cnProc_BG1_generator_128(const char* dir, int R)
fprintf(fd," min = simde_mm_min_epu8(min, simde_mm_abs_epi8(ymm0));\n"); fprintf(fd," min = simde_mm_min_epu8(min, simde_mm_abs_epi8(ymm0));\n");
// sgn = simde_mm_sign_epi8(sgn, ymm0); // sgn = simde_mm_sign_epi8(sgn, ymm0);
#ifndef AVOID_MM256_SIGN
fprintf(fd," sgn = simde_mm_sign_epi8(sgn, ymm0);\n"); fprintf(fd," sgn = simde_mm_sign_epi8(sgn, ymm0);\n");
#else
fprintf(fd," sgn = simde_mm_xor_si128(sgn, ymm0);\n");
#endif
} }
// Store result // Store result
...@@ -268,11 +252,7 @@ void nrLDPC_cnProc_BG1_generator_128(const char* dir, int R) ...@@ -268,11 +252,7 @@ void nrLDPC_cnProc_BG1_generator_128(const char* dir, int R)
// ymm0 = p_cnProcBuf[lut_idxCnProcG3[j][0] + i]; // ymm0 = p_cnProcBuf[lut_idxCnProcG3[j][0] + i];
fprintf(fd," ymm0 = ((simde__m128i*)cnProcBuf)[%d+i];\n",(lut_startAddrCnGroups[2]>>4)+lut_idxCnProcG5[j][0]*2); fprintf(fd," ymm0 = ((simde__m128i*)cnProcBuf)[%d+i];\n",(lut_startAddrCnGroups[2]>>4)+lut_idxCnProcG5[j][0]*2);
// sgn = simde_mm_sign_epi8(ones, ymm0); // sgn = simde_mm_sign_epi8(ones, ymm0);
#ifndef AVOID_MM256_SIGN
fprintf(fd," sgn = simde_mm_sign_epi8(ones, ymm0);\n"); fprintf(fd," sgn = simde_mm_sign_epi8(ones, ymm0);\n");
#else
fprintf(fd," sgn = simde_mm_xor_si128(ones, ymm0);\n");
#endif
// min = simde_mm_abs_epi8(ymm0); // min = simde_mm_abs_epi8(ymm0);
fprintf(fd," min = simde_mm_abs_epi8(ymm0);\n"); fprintf(fd," min = simde_mm_abs_epi8(ymm0);\n");
...@@ -286,11 +266,7 @@ void nrLDPC_cnProc_BG1_generator_128(const char* dir, int R) ...@@ -286,11 +266,7 @@ void nrLDPC_cnProc_BG1_generator_128(const char* dir, int R)
fprintf(fd," min = simde_mm_min_epu8(min, simde_mm_abs_epi8(ymm0));\n"); fprintf(fd," min = simde_mm_min_epu8(min, simde_mm_abs_epi8(ymm0));\n");
// sgn = simde_mm_sign_epi8(sgn, ymm0); // sgn = simde_mm_sign_epi8(sgn, ymm0);
#ifndef AVOID_MM256_SIGN
fprintf(fd," sgn = simde_mm_sign_epi8(sgn, ymm0);\n"); fprintf(fd," sgn = simde_mm_sign_epi8(sgn, ymm0);\n");
#else
fprintf(fd," sgn = simde_mm_xor_si128(sgn, ymm0);\n");
#endif
} }
// Store result // Store result
...@@ -343,11 +319,7 @@ void nrLDPC_cnProc_BG1_generator_128(const char* dir, int R) ...@@ -343,11 +319,7 @@ void nrLDPC_cnProc_BG1_generator_128(const char* dir, int R)
// ymm0 = p_cnProcBuf[lut_idxCnProcG3[j][0] + i]; // ymm0 = p_cnProcBuf[lut_idxCnProcG3[j][0] + i];
fprintf(fd," ymm0 = ((simde__m128i*)cnProcBuf)[%d+i];\n",(lut_startAddrCnGroups[3]>>4)+lut_idxCnProcG6[j][0]*2); fprintf(fd," ymm0 = ((simde__m128i*)cnProcBuf)[%d+i];\n",(lut_startAddrCnGroups[3]>>4)+lut_idxCnProcG6[j][0]*2);
// sgn = simde_mm_sign_epi8(ones, ymm0); // sgn = simde_mm_sign_epi8(ones, ymm0);
#ifndef AVOID_MM256_SIGN
fprintf(fd," sgn = simde_mm_sign_epi8(ones, ymm0);\n"); fprintf(fd," sgn = simde_mm_sign_epi8(ones, ymm0);\n");
#else
fprintf(fd," sgn = simde_mm_xor_si128(ones, ymm0);\n");
#endif
// min = simde_mm_abs_epi8(ymm0); // min = simde_mm_abs_epi8(ymm0);
fprintf(fd," min = simde_mm_abs_epi8(ymm0);\n"); fprintf(fd," min = simde_mm_abs_epi8(ymm0);\n");
...@@ -361,11 +333,7 @@ void nrLDPC_cnProc_BG1_generator_128(const char* dir, int R) ...@@ -361,11 +333,7 @@ void nrLDPC_cnProc_BG1_generator_128(const char* dir, int R)
fprintf(fd," min = simde_mm_min_epu8(min, simde_mm_abs_epi8(ymm0));\n"); fprintf(fd," min = simde_mm_min_epu8(min, simde_mm_abs_epi8(ymm0));\n");
// sgn = simde_mm_sign_epi8(sgn, ymm0); // sgn = simde_mm_sign_epi8(sgn, ymm0);
#ifndef AVOID_MM256_SIGN
fprintf(fd," sgn = simde_mm_sign_epi8(sgn, ymm0);\n"); fprintf(fd," sgn = simde_mm_sign_epi8(sgn, ymm0);\n");
#else
fprintf(fd," sgn = simde_mm_xor_si128(sgn, ymm0);\n");
#endif
} }
// Store result // Store result
...@@ -421,11 +389,7 @@ void nrLDPC_cnProc_BG1_generator_128(const char* dir, int R) ...@@ -421,11 +389,7 @@ void nrLDPC_cnProc_BG1_generator_128(const char* dir, int R)
// ymm0 = p_cnProcBuf[lut_idxCnProcG3[j][0] + i]; // ymm0 = p_cnProcBuf[lut_idxCnProcG3[j][0] + i];
fprintf(fd," ymm0 = ((simde__m128i*)cnProcBuf)[%d+i];\n",(lut_startAddrCnGroups[4]>>4)+lut_idxCnProcG7[j][0]*2); fprintf(fd," ymm0 = ((simde__m128i*)cnProcBuf)[%d+i];\n",(lut_startAddrCnGroups[4]>>4)+lut_idxCnProcG7[j][0]*2);
// sgn = simde_mm_sign_epi8(ones, ymm0); // sgn = simde_mm_sign_epi8(ones, ymm0);
#ifndef AVOID_MM256_SIGN
fprintf(fd," sgn = simde_mm_sign_epi8(ones, ymm0);\n"); fprintf(fd," sgn = simde_mm_sign_epi8(ones, ymm0);\n");
#else
fprintf(fd," sgn = simde_mm_xor_si128(ones, ymm0);\n");
#endif
// min = simde_mm_abs_epi8(ymm0); // min = simde_mm_abs_epi8(ymm0);
fprintf(fd," min = simde_mm_abs_epi8(ymm0);\n"); fprintf(fd," min = simde_mm_abs_epi8(ymm0);\n");
...@@ -439,11 +403,7 @@ void nrLDPC_cnProc_BG1_generator_128(const char* dir, int R) ...@@ -439,11 +403,7 @@ void nrLDPC_cnProc_BG1_generator_128(const char* dir, int R)
fprintf(fd," min = simde_mm_min_epu8(min, simde_mm_abs_epi8(ymm0));\n"); fprintf(fd," min = simde_mm_min_epu8(min, simde_mm_abs_epi8(ymm0));\n");
// sgn = simde_mm_sign_epi8(sgn, ymm0); // sgn = simde_mm_sign_epi8(sgn, ymm0);
#ifndef AVOID_MM256_SIGN
fprintf(fd," sgn = simde_mm_sign_epi8(sgn, ymm0);\n"); fprintf(fd," sgn = simde_mm_sign_epi8(sgn, ymm0);\n");
#else
fprintf(fd," sgn = simde_mm_xor_si128(sgn, ymm0);\n");
#endif
} }
// Store result // Store result
...@@ -500,11 +460,7 @@ void nrLDPC_cnProc_BG1_generator_128(const char* dir, int R) ...@@ -500,11 +460,7 @@ void nrLDPC_cnProc_BG1_generator_128(const char* dir, int R)
// ymm0 = p_cnProcBuf[lut_idxCnProcG3[j][0] + i]; // ymm0 = p_cnProcBuf[lut_idxCnProcG3[j][0] + i];
fprintf(fd," ymm0 = ((simde__m128i*)cnProcBuf)[%d+i];\n",(lut_startAddrCnGroups[5]>>4)+lut_idxCnProcG8[j][0]*2); fprintf(fd," ymm0 = ((simde__m128i*)cnProcBuf)[%d+i];\n",(lut_startAddrCnGroups[5]>>4)+lut_idxCnProcG8[j][0]*2);
// sgn = simde_mm_sign_epi8(ones, ymm0); // sgn = simde_mm_sign_epi8(ones, ymm0);
#ifndef AVOID_MM256_SIGN
fprintf(fd," sgn = simde_mm_sign_epi8(ones, ymm0);\n"); fprintf(fd," sgn = simde_mm_sign_epi8(ones, ymm0);\n");
#else
fprintf(fd," sgn = simde_mm_xor_si128(ones, ymm0);\n");
#endif
// min = simde_mm_abs_epi8(ymm0); // min = simde_mm_abs_epi8(ymm0);
fprintf(fd," min = simde_mm_abs_epi8(ymm0);\n"); fprintf(fd," min = simde_mm_abs_epi8(ymm0);\n");
...@@ -518,11 +474,7 @@ void nrLDPC_cnProc_BG1_generator_128(const char* dir, int R) ...@@ -518,11 +474,7 @@ void nrLDPC_cnProc_BG1_generator_128(const char* dir, int R)
fprintf(fd," min = simde_mm_min_epu8(min, simde_mm_abs_epi8(ymm0));\n"); fprintf(fd," min = simde_mm_min_epu8(min, simde_mm_abs_epi8(ymm0));\n");
// sgn = simde_mm_sign_epi8(sgn, ymm0); // sgn = simde_mm_sign_epi8(sgn, ymm0);
#ifndef AVOID_MM256_SIGN
fprintf(fd," sgn = simde_mm_sign_epi8(sgn, ymm0);\n"); fprintf(fd," sgn = simde_mm_sign_epi8(sgn, ymm0);\n");
#else
fprintf(fd," sgn = simde_mm_xor_si128(sgn, ymm0);\n");
#endif
} }
// Store result // Store result
...@@ -579,11 +531,7 @@ void nrLDPC_cnProc_BG1_generator_128(const char* dir, int R) ...@@ -579,11 +531,7 @@ void nrLDPC_cnProc_BG1_generator_128(const char* dir, int R)
// ymm0 = p_cnProcBuf[lut_idxCnProcG3[j][0] + i]; // ymm0 = p_cnProcBuf[lut_idxCnProcG3[j][0] + i];
fprintf(fd," ymm0 = ((simde__m128i*)cnProcBuf)[%d+i];\n",(lut_startAddrCnGroups[6]>>4)+lut_idxCnProcG9[j][0]*2); fprintf(fd," ymm0 = ((simde__m128i*)cnProcBuf)[%d+i];\n",(lut_startAddrCnGroups[6]>>4)+lut_idxCnProcG9[j][0]*2);
// sgn = simde_mm_sign_epi8(ones, ymm0); // sgn = simde_mm_sign_epi8(ones, ymm0);
#ifndef AVOID_MM256_SIGN
fprintf(fd," sgn = simde_mm_sign_epi8(ones, ymm0);\n"); fprintf(fd," sgn = simde_mm_sign_epi8(ones, ymm0);\n");
#else
fprintf(fd," sgn = simde_mm_xor_si128(ones, ymm0);\n");
#endif
// min = simde_mm_abs_epi8(ymm0); // min = simde_mm_abs_epi8(ymm0);
fprintf(fd," min = simde_mm_abs_epi8(ymm0);\n"); fprintf(fd," min = simde_mm_abs_epi8(ymm0);\n");
...@@ -597,11 +545,7 @@ void nrLDPC_cnProc_BG1_generator_128(const char* dir, int R) ...@@ -597,11 +545,7 @@ void nrLDPC_cnProc_BG1_generator_128(const char* dir, int R)
fprintf(fd," min = simde_mm_min_epu8(min, simde_mm_abs_epi8(ymm0));\n"); fprintf(fd," min = simde_mm_min_epu8(min, simde_mm_abs_epi8(ymm0));\n");
// sgn = simde_mm_sign_epi8(sgn, ymm0); // sgn = simde_mm_sign_epi8(sgn, ymm0);
#ifndef AVOID_MM256_SIGN
fprintf(fd," sgn = simde_mm_sign_epi8(sgn, ymm0);\n"); fprintf(fd," sgn = simde_mm_sign_epi8(sgn, ymm0);\n");
#else
fprintf(fd," sgn = simde_mm_xor_si128(sgn, ymm0);\n");
#endif
} }
// Store result // Store result
...@@ -659,11 +603,7 @@ void nrLDPC_cnProc_BG1_generator_128(const char* dir, int R) ...@@ -659,11 +603,7 @@ void nrLDPC_cnProc_BG1_generator_128(const char* dir, int R)
// ymm0 = p_cnProcBuf[lut_idxCnProcG3[j][0] + i]; // ymm0 = p_cnProcBuf[lut_idxCnProcG3[j][0] + i];
fprintf(fd," ymm0 = ((simde__m128i*)cnProcBuf)[%d+i];\n",(lut_startAddrCnGroups[7]>>4)+lut_idxCnProcG10[j][0]*2); fprintf(fd," ymm0 = ((simde__m128i*)cnProcBuf)[%d+i];\n",(lut_startAddrCnGroups[7]>>4)+lut_idxCnProcG10[j][0]*2);
// sgn = simde_mm_sign_epi8(ones, ymm0); // sgn = simde_mm_sign_epi8(ones, ymm0);
#ifndef AVOID_MM256_SIGN
fprintf(fd," sgn = simde_mm_sign_epi8(ones, ymm0);\n"); fprintf(fd," sgn = simde_mm_sign_epi8(ones, ymm0);\n");
#else
fprintf(fd," sgn = simde_mm_xor_si128(ones, ymm0);\n");
#endif
// min = simde_mm_abs_epi8(ymm0); // min = simde_mm_abs_epi8(ymm0);
fprintf(fd," min = simde_mm_abs_epi8(ymm0);\n"); fprintf(fd," min = simde_mm_abs_epi8(ymm0);\n");
...@@ -677,11 +617,7 @@ void nrLDPC_cnProc_BG1_generator_128(const char* dir, int R) ...@@ -677,11 +617,7 @@ void nrLDPC_cnProc_BG1_generator_128(const char* dir, int R)
fprintf(fd," min = simde_mm_min_epu8(min, simde_mm_abs_epi8(ymm0));\n"); fprintf(fd," min = simde_mm_min_epu8(min, simde_mm_abs_epi8(ymm0));\n");
// sgn = simde_mm_sign_epi8(sgn, ymm0); // sgn = simde_mm_sign_epi8(sgn, ymm0);
#ifndef AVOID_MM256_SIGN
fprintf(fd," sgn = simde_mm_sign_epi8(sgn, ymm0);\n"); fprintf(fd," sgn = simde_mm_sign_epi8(sgn, ymm0);\n");
#else
fprintf(fd," sgn = simde_mm_xor_si128(sgn, ymm0);\n");
#endif
} }
// Store result // Store result
...@@ -742,11 +678,7 @@ void nrLDPC_cnProc_BG1_generator_128(const char* dir, int R) ...@@ -742,11 +678,7 @@ void nrLDPC_cnProc_BG1_generator_128(const char* dir, int R)
// ymm0 = p_cnProcBuf[lut_idxCnProcG3[j][0] + i]; // ymm0 = p_cnProcBuf[lut_idxCnProcG3[j][0] + i];
fprintf(fd," ymm0 = ((simde__m128i*)cnProcBuf)[%d+i];\n",(lut_startAddrCnGroups[8]>>4)+lut_idxCnProcG19[j][0]*2); fprintf(fd," ymm0 = ((simde__m128i*)cnProcBuf)[%d+i];\n",(lut_startAddrCnGroups[8]>>4)+lut_idxCnProcG19[j][0]*2);
// sgn = simde_mm_sign_epi8(ones, ymm0); // sgn = simde_mm_sign_epi8(ones, ymm0);
#ifndef AVOID_MM256_SIGN
fprintf(fd," sgn = simde_mm_sign_epi8(ones, ymm0);\n"); fprintf(fd," sgn = simde_mm_sign_epi8(ones, ymm0);\n");
#else
fprintf(fd," sgn = simde_mm_xor_si128(ones, ymm0);\n");
#endif
// min = simde_mm_abs_epi8(ymm0); // min = simde_mm_abs_epi8(ymm0);
fprintf(fd," min = simde_mm_abs_epi8(ymm0);\n"); fprintf(fd," min = simde_mm_abs_epi8(ymm0);\n");
...@@ -760,11 +692,7 @@ void nrLDPC_cnProc_BG1_generator_128(const char* dir, int R) ...@@ -760,11 +692,7 @@ void nrLDPC_cnProc_BG1_generator_128(const char* dir, int R)
fprintf(fd," min = simde_mm_min_epu8(min, simde_mm_abs_epi8(ymm0));\n"); fprintf(fd," min = simde_mm_min_epu8(min, simde_mm_abs_epi8(ymm0));\n");
// sgn = simde_mm_sign_epi8(sgn, ymm0); // sgn = simde_mm_sign_epi8(sgn, ymm0);
#ifndef AVOID_MM256_SIGN
fprintf(fd," sgn = simde_mm_sign_epi8(sgn, ymm0);\n"); fprintf(fd," sgn = simde_mm_sign_epi8(sgn, ymm0);\n");
#else
fprintf(fd," sgn = simde_mm_xor_si128(sgn, ymm0);\n");
#endif
} }
// Store result // Store result
......
...@@ -128,11 +128,7 @@ void nrLDPC_cnProc_BG1_generator_AVX2(const char* dir, int R) ...@@ -128,11 +128,7 @@ void nrLDPC_cnProc_BG1_generator_AVX2(const char* dir, int R)
// ymm0 = p_cnProcBuf[lut_idxCnProcG3[j][0] + i]; // ymm0 = p_cnProcBuf[lut_idxCnProcG3[j][0] + i];
fprintf(fd," ymm0 = ((simde__m256i*)cnProcBuf)[%d+i];\n",(lut_startAddrCnGroups[0]>>5)+lut_idxCnProcG3[j][0]); fprintf(fd," ymm0 = ((simde__m256i*)cnProcBuf)[%d+i];\n",(lut_startAddrCnGroups[0]>>5)+lut_idxCnProcG3[j][0]);
// sgn = simde_mm256_sign_epi8(ones, ymm0); // sgn = simde_mm256_sign_epi8(ones, ymm0);
#ifndef AVOID_MM256_SIGN
fprintf(fd," sgn = simde_mm256_sign_epi8(ones, ymm0);\n"); fprintf(fd," sgn = simde_mm256_sign_epi8(ones, ymm0);\n");
#else
fprintf(fd," sgn = simde_mm256_xor_si256(ones, ymm0);\n");
#endif
// min = simde_mm256_abs_epi8(ymm0); // min = simde_mm256_abs_epi8(ymm0);
fprintf(fd," min = simde_mm256_abs_epi8(ymm0);\n"); fprintf(fd," min = simde_mm256_abs_epi8(ymm0);\n");
...@@ -144,11 +140,7 @@ void nrLDPC_cnProc_BG1_generator_AVX2(const char* dir, int R) ...@@ -144,11 +140,7 @@ void nrLDPC_cnProc_BG1_generator_AVX2(const char* dir, int R)
fprintf(fd," min = simde_mm256_min_epu8(min, simde_mm256_abs_epi8(ymm0));\n"); fprintf(fd," min = simde_mm256_min_epu8(min, simde_mm256_abs_epi8(ymm0));\n");
// sgn = simde_mm256_sign_epi8(sgn, ymm0); // sgn = simde_mm256_sign_epi8(sgn, ymm0);
#ifndef AVOID_MM256_SIGN
fprintf(fd," sgn = simde_mm256_sign_epi8(sgn, ymm0);\n"); fprintf(fd," sgn = simde_mm256_sign_epi8(sgn, ymm0);\n");
#else
fprintf(fd," sgn = simde_mm256_xor_si256(sgn, ymm0);\n");
#endif
// Store result // Store result
// min = simde_mm256_min_epu8(min, maxLLR); // 128 in epi8 is -127 // min = simde_mm256_min_epu8(min, maxLLR); // 128 in epi8 is -127
#ifndef DROP_MAXLLR #ifndef DROP_MAXLLR
...@@ -195,11 +187,7 @@ void nrLDPC_cnProc_BG1_generator_AVX2(const char* dir, int R) ...@@ -195,11 +187,7 @@ void nrLDPC_cnProc_BG1_generator_AVX2(const char* dir, int R)
// ymm0 = p_cnProcBuf[lut_idxCnProcG3[j][0] + i]; // ymm0 = p_cnProcBuf[lut_idxCnProcG3[j][0] + i];
fprintf(fd," ymm0 = ((simde__m256i*)cnProcBuf)[%d+i];\n",(lut_startAddrCnGroups[1]>>5)+lut_idxCnProcG4[j][0]); fprintf(fd," ymm0 = ((simde__m256i*)cnProcBuf)[%d+i];\n",(lut_startAddrCnGroups[1]>>5)+lut_idxCnProcG4[j][0]);
// sgn = simde_mm256_sign_epi8(ones, ymm0); // sgn = simde_mm256_sign_epi8(ones, ymm0);
#ifndef AVOID_MM256_SIGN
fprintf(fd," sgn = simde_mm256_sign_epi8(ones, ymm0);\n"); fprintf(fd," sgn = simde_mm256_sign_epi8(ones, ymm0);\n");
#else
fprintf(fd," sgn = simde_mm256_xor_si256(ones, ymm0);\n");
#endif
// min = simde_mm256_abs_epi8(ymm0); // min = simde_mm256_abs_epi8(ymm0);
fprintf(fd," min = simde_mm256_abs_epi8(ymm0);\n"); fprintf(fd," min = simde_mm256_abs_epi8(ymm0);\n");
...@@ -213,11 +201,7 @@ void nrLDPC_cnProc_BG1_generator_AVX2(const char* dir, int R) ...@@ -213,11 +201,7 @@ void nrLDPC_cnProc_BG1_generator_AVX2(const char* dir, int R)
fprintf(fd," min = simde_mm256_min_epu8(min, simde_mm256_abs_epi8(ymm0));\n"); fprintf(fd," min = simde_mm256_min_epu8(min, simde_mm256_abs_epi8(ymm0));\n");
// sgn = simde_mm256_sign_epi8(sgn, ymm0); // sgn = simde_mm256_sign_epi8(sgn, ymm0);
#ifndef AVOID_MM256_SIGN
fprintf(fd," sgn = simde_mm256_sign_epi8(sgn, ymm0);\n"); fprintf(fd," sgn = simde_mm256_sign_epi8(sgn, ymm0);\n");
#else
fprintf(fd," sgn = simde_mm256_xor_si256(sgn, ymm0);\n");
#endif
} }
// Store result // Store result
...@@ -270,11 +254,7 @@ void nrLDPC_cnProc_BG1_generator_AVX2(const char* dir, int R) ...@@ -270,11 +254,7 @@ void nrLDPC_cnProc_BG1_generator_AVX2(const char* dir, int R)
// ymm0 = p_cnProcBuf[lut_idxCnProcG3[j][0] + i]; // ymm0 = p_cnProcBuf[lut_idxCnProcG3[j][0] + i];
fprintf(fd," ymm0 = ((simde__m256i*)cnProcBuf)[%d+i];\n",(lut_startAddrCnGroups[2]>>5)+lut_idxCnProcG5[j][0]); fprintf(fd," ymm0 = ((simde__m256i*)cnProcBuf)[%d+i];\n",(lut_startAddrCnGroups[2]>>5)+lut_idxCnProcG5[j][0]);
// sgn = simde_mm256_sign_epi8(ones, ymm0); // sgn = simde_mm256_sign_epi8(ones, ymm0);
#ifndef AVOID_MM256_SIGN
fprintf(fd," sgn = simde_mm256_sign_epi8(ones, ymm0);\n"); fprintf(fd," sgn = simde_mm256_sign_epi8(ones, ymm0);\n");
#else
fprintf(fd," sgn = simde_mm256_xor_si256(ones, ymm0);\n");
#endif
// min = simde_mm256_abs_epi8(ymm0); // min = simde_mm256_abs_epi8(ymm0);
fprintf(fd," min = simde_mm256_abs_epi8(ymm0);\n"); fprintf(fd," min = simde_mm256_abs_epi8(ymm0);\n");
...@@ -288,11 +268,7 @@ void nrLDPC_cnProc_BG1_generator_AVX2(const char* dir, int R) ...@@ -288,11 +268,7 @@ void nrLDPC_cnProc_BG1_generator_AVX2(const char* dir, int R)
fprintf(fd," min = simde_mm256_min_epu8(min, simde_mm256_abs_epi8(ymm0));\n"); fprintf(fd," min = simde_mm256_min_epu8(min, simde_mm256_abs_epi8(ymm0));\n");
// sgn = simde_mm256_sign_epi8(sgn, ymm0); // sgn = simde_mm256_sign_epi8(sgn, ymm0);
#ifndef AVOID_MM256_SIGN
fprintf(fd," sgn = simde_mm256_sign_epi8(sgn, ymm0);\n"); fprintf(fd," sgn = simde_mm256_sign_epi8(sgn, ymm0);\n");
#else
fprintf(fd," sgn = simde_mm256_xor_si256(sgn, ymm0);\n");
#endif
} }
// Store result // Store result
...@@ -345,11 +321,7 @@ void nrLDPC_cnProc_BG1_generator_AVX2(const char* dir, int R) ...@@ -345,11 +321,7 @@ void nrLDPC_cnProc_BG1_generator_AVX2(const char* dir, int R)
// ymm0 = p_cnProcBuf[lut_idxCnProcG3[j][0] + i]; // ymm0 = p_cnProcBuf[lut_idxCnProcG3[j][0] + i];
fprintf(fd," ymm0 = ((simde__m256i*)cnProcBuf)[%d+i];\n",(lut_startAddrCnGroups[3]>>5)+lut_idxCnProcG6[j][0]); fprintf(fd," ymm0 = ((simde__m256i*)cnProcBuf)[%d+i];\n",(lut_startAddrCnGroups[3]>>5)+lut_idxCnProcG6[j][0]);
// sgn = simde_mm256_sign_epi8(ones, ymm0); // sgn = simde_mm256_sign_epi8(ones, ymm0);
#ifndef AVOID_MM256_SIGN
fprintf(fd," sgn = simde_mm256_sign_epi8(ones, ymm0);\n"); fprintf(fd," sgn = simde_mm256_sign_epi8(ones, ymm0);\n");
#else
fprintf(fd," sgn = simde_mm256_xor_si256(ones, ymm0);\n");
#endif
// min = simde_mm256_abs_epi8(ymm0); // min = simde_mm256_abs_epi8(ymm0);
fprintf(fd," min = simde_mm256_abs_epi8(ymm0);\n"); fprintf(fd," min = simde_mm256_abs_epi8(ymm0);\n");
...@@ -363,11 +335,7 @@ void nrLDPC_cnProc_BG1_generator_AVX2(const char* dir, int R) ...@@ -363,11 +335,7 @@ void nrLDPC_cnProc_BG1_generator_AVX2(const char* dir, int R)
fprintf(fd," min = simde_mm256_min_epu8(min, simde_mm256_abs_epi8(ymm0));\n"); fprintf(fd," min = simde_mm256_min_epu8(min, simde_mm256_abs_epi8(ymm0));\n");
// sgn = simde_mm256_sign_epi8(sgn, ymm0); // sgn = simde_mm256_sign_epi8(sgn, ymm0);
#ifndef AVOID_MM256_SIGN
fprintf(fd," sgn = simde_mm256_sign_epi8(sgn, ymm0);\n"); fprintf(fd," sgn = simde_mm256_sign_epi8(sgn, ymm0);\n");
#else
fprintf(fd," sgn = simde_mm256_xor_si256(sgn, ymm0);\n");
#endif
} }
// Store result // Store result
...@@ -423,11 +391,7 @@ void nrLDPC_cnProc_BG1_generator_AVX2(const char* dir, int R) ...@@ -423,11 +391,7 @@ void nrLDPC_cnProc_BG1_generator_AVX2(const char* dir, int R)
// ymm0 = p_cnProcBuf[lut_idxCnProcG3[j][0] + i]; // ymm0 = p_cnProcBuf[lut_idxCnProcG3[j][0] + i];
fprintf(fd," ymm0 = ((simde__m256i*)cnProcBuf)[%d+i];\n",(lut_startAddrCnGroups[4]>>5)+lut_idxCnProcG7[j][0]); fprintf(fd," ymm0 = ((simde__m256i*)cnProcBuf)[%d+i];\n",(lut_startAddrCnGroups[4]>>5)+lut_idxCnProcG7[j][0]);
// sgn = simde_mm256_sign_epi8(ones, ymm0); // sgn = simde_mm256_sign_epi8(ones, ymm0);
#ifndef AVOID_MM256_SIGN
fprintf(fd," sgn = simde_mm256_sign_epi8(ones, ymm0);\n"); fprintf(fd," sgn = simde_mm256_sign_epi8(ones, ymm0);\n");
#else
fprintf(fd," sgn = simde_mm256_xor_si256(ones, ymm0);\n");
#endif
// min = simde_mm256_abs_epi8(ymm0); // min = simde_mm256_abs_epi8(ymm0);
fprintf(fd," min = simde_mm256_abs_epi8(ymm0);\n"); fprintf(fd," min = simde_mm256_abs_epi8(ymm0);\n");
...@@ -441,11 +405,7 @@ void nrLDPC_cnProc_BG1_generator_AVX2(const char* dir, int R) ...@@ -441,11 +405,7 @@ void nrLDPC_cnProc_BG1_generator_AVX2(const char* dir, int R)
fprintf(fd," min = simde_mm256_min_epu8(min, simde_mm256_abs_epi8(ymm0));\n"); fprintf(fd," min = simde_mm256_min_epu8(min, simde_mm256_abs_epi8(ymm0));\n");
// sgn = simde_mm256_sign_epi8(sgn, ymm0); // sgn = simde_mm256_sign_epi8(sgn, ymm0);
#ifndef AVOID_MM256_SIGN
fprintf(fd," sgn = simde_mm256_sign_epi8(sgn, ymm0);\n"); fprintf(fd," sgn = simde_mm256_sign_epi8(sgn, ymm0);\n");
#else
fprintf(fd," sgn = simde_mm256_xor_si256(sgn, ymm0);\n");
#endif
} }
// Store result // Store result
...@@ -502,11 +462,7 @@ void nrLDPC_cnProc_BG1_generator_AVX2(const char* dir, int R) ...@@ -502,11 +462,7 @@ void nrLDPC_cnProc_BG1_generator_AVX2(const char* dir, int R)
// ymm0 = p_cnProcBuf[lut_idxCnProcG3[j][0] + i]; // ymm0 = p_cnProcBuf[lut_idxCnProcG3[j][0] + i];
fprintf(fd," ymm0 = ((simde__m256i*)cnProcBuf)[%d+i];\n",(lut_startAddrCnGroups[5]>>5)+lut_idxCnProcG8[j][0]); fprintf(fd," ymm0 = ((simde__m256i*)cnProcBuf)[%d+i];\n",(lut_startAddrCnGroups[5]>>5)+lut_idxCnProcG8[j][0]);
// sgn = simde_mm256_sign_epi8(ones, ymm0); // sgn = simde_mm256_sign_epi8(ones, ymm0);
#ifndef AVOID_MM256_SIGN
fprintf(fd," sgn = simde_mm256_sign_epi8(ones, ymm0);\n"); fprintf(fd," sgn = simde_mm256_sign_epi8(ones, ymm0);\n");
#else
fprintf(fd," sgn = simde_mm256_xor_si256(ones, ymm0);\n");
#endif
// min = simde_mm256_abs_epi8(ymm0); // min = simde_mm256_abs_epi8(ymm0);
fprintf(fd," min = simde_mm256_abs_epi8(ymm0);\n"); fprintf(fd," min = simde_mm256_abs_epi8(ymm0);\n");
...@@ -520,11 +476,7 @@ void nrLDPC_cnProc_BG1_generator_AVX2(const char* dir, int R) ...@@ -520,11 +476,7 @@ void nrLDPC_cnProc_BG1_generator_AVX2(const char* dir, int R)
fprintf(fd," min = simde_mm256_min_epu8(min, simde_mm256_abs_epi8(ymm0));\n"); fprintf(fd," min = simde_mm256_min_epu8(min, simde_mm256_abs_epi8(ymm0));\n");
// sgn = simde_mm256_sign_epi8(sgn, ymm0); // sgn = simde_mm256_sign_epi8(sgn, ymm0);
#ifndef AVOID_MM256_SIGN
fprintf(fd," sgn = simde_mm256_sign_epi8(sgn, ymm0);\n"); fprintf(fd," sgn = simde_mm256_sign_epi8(sgn, ymm0);\n");
#else
fprintf(fd," sgn = simde_mm256_xor_si256(sgn, ymm0);\n");
#endif
} }
// Store result // Store result
...@@ -581,11 +533,7 @@ void nrLDPC_cnProc_BG1_generator_AVX2(const char* dir, int R) ...@@ -581,11 +533,7 @@ void nrLDPC_cnProc_BG1_generator_AVX2(const char* dir, int R)
// ymm0 = p_cnProcBuf[lut_idxCnProcG3[j][0] + i]; // ymm0 = p_cnProcBuf[lut_idxCnProcG3[j][0] + i];
fprintf(fd," ymm0 = ((simde__m256i*)cnProcBuf)[%d+i];\n",(lut_startAddrCnGroups[6]>>5)+lut_idxCnProcG9[j][0]); fprintf(fd," ymm0 = ((simde__m256i*)cnProcBuf)[%d+i];\n",(lut_startAddrCnGroups[6]>>5)+lut_idxCnProcG9[j][0]);
// sgn = simde_mm256_sign_epi8(ones, ymm0); // sgn = simde_mm256_sign_epi8(ones, ymm0);
#ifndef AVOID_MM256_SIGN
fprintf(fd," sgn = simde_mm256_sign_epi8(ones, ymm0);\n"); fprintf(fd," sgn = simde_mm256_sign_epi8(ones, ymm0);\n");
#else
fprintf(fd," sgn = simde_mm256_xor_si256(ones, ymm0);\n");
#endif
// min = simde_mm256_abs_epi8(ymm0); // min = simde_mm256_abs_epi8(ymm0);
fprintf(fd," min = simde_mm256_abs_epi8(ymm0);\n"); fprintf(fd," min = simde_mm256_abs_epi8(ymm0);\n");
...@@ -599,11 +547,7 @@ void nrLDPC_cnProc_BG1_generator_AVX2(const char* dir, int R) ...@@ -599,11 +547,7 @@ void nrLDPC_cnProc_BG1_generator_AVX2(const char* dir, int R)
fprintf(fd," min = simde_mm256_min_epu8(min, simde_mm256_abs_epi8(ymm0));\n"); fprintf(fd," min = simde_mm256_min_epu8(min, simde_mm256_abs_epi8(ymm0));\n");
// sgn = simde_mm256_sign_epi8(sgn, ymm0); // sgn = simde_mm256_sign_epi8(sgn, ymm0);
#ifndef AVOID_MM256_SIGN
fprintf(fd," sgn = simde_mm256_sign_epi8(sgn, ymm0);\n"); fprintf(fd," sgn = simde_mm256_sign_epi8(sgn, ymm0);\n");
#else
fprintf(fd," sgn = simde_mm256_xor_si256(sgn, ymm0);\n");
#endif
} }
// Store result // Store result
...@@ -661,11 +605,7 @@ void nrLDPC_cnProc_BG1_generator_AVX2(const char* dir, int R) ...@@ -661,11 +605,7 @@ void nrLDPC_cnProc_BG1_generator_AVX2(const char* dir, int R)
// ymm0 = p_cnProcBuf[lut_idxCnProcG3[j][0] + i]; // ymm0 = p_cnProcBuf[lut_idxCnProcG3[j][0] + i];
fprintf(fd," ymm0 = ((simde__m256i*)cnProcBuf)[%d+i];\n",(lut_startAddrCnGroups[7]>>5)+lut_idxCnProcG10[j][0]); fprintf(fd," ymm0 = ((simde__m256i*)cnProcBuf)[%d+i];\n",(lut_startAddrCnGroups[7]>>5)+lut_idxCnProcG10[j][0]);
// sgn = simde_mm256_sign_epi8(ones, ymm0); // sgn = simde_mm256_sign_epi8(ones, ymm0);
#ifndef AVOID_MM256_SIGN
fprintf(fd," sgn = simde_mm256_sign_epi8(ones, ymm0);\n"); fprintf(fd," sgn = simde_mm256_sign_epi8(ones, ymm0);\n");
#else
fprintf(fd," sgn = simde_mm256_xor_si256(ones, ymm0);\n");
#endif
// min = simde_mm256_abs_epi8(ymm0); // min = simde_mm256_abs_epi8(ymm0);
fprintf(fd," min = simde_mm256_abs_epi8(ymm0);\n"); fprintf(fd," min = simde_mm256_abs_epi8(ymm0);\n");
...@@ -679,11 +619,7 @@ void nrLDPC_cnProc_BG1_generator_AVX2(const char* dir, int R) ...@@ -679,11 +619,7 @@ void nrLDPC_cnProc_BG1_generator_AVX2(const char* dir, int R)
fprintf(fd," min = simde_mm256_min_epu8(min, simde_mm256_abs_epi8(ymm0));\n"); fprintf(fd," min = simde_mm256_min_epu8(min, simde_mm256_abs_epi8(ymm0));\n");
// sgn = simde_mm256_sign_epi8(sgn, ymm0); // sgn = simde_mm256_sign_epi8(sgn, ymm0);
#ifndef AVOID_MM256_SIGN
fprintf(fd," sgn = simde_mm256_sign_epi8(sgn, ymm0);\n"); fprintf(fd," sgn = simde_mm256_sign_epi8(sgn, ymm0);\n");
#else
fprintf(fd," sgn = simde_mm256_xor_si256(sgn, ymm0);\n");
#endif
} }
// Store result // Store result
...@@ -744,11 +680,7 @@ void nrLDPC_cnProc_BG1_generator_AVX2(const char* dir, int R) ...@@ -744,11 +680,7 @@ void nrLDPC_cnProc_BG1_generator_AVX2(const char* dir, int R)
// ymm0 = p_cnProcBuf[lut_idxCnProcG3[j][0] + i]; // ymm0 = p_cnProcBuf[lut_idxCnProcG3[j][0] + i];
fprintf(fd," ymm0 = ((simde__m256i*)cnProcBuf)[%d+i];\n",(lut_startAddrCnGroups[8]>>5)+lut_idxCnProcG19[j][0]); fprintf(fd," ymm0 = ((simde__m256i*)cnProcBuf)[%d+i];\n",(lut_startAddrCnGroups[8]>>5)+lut_idxCnProcG19[j][0]);
// sgn = simde_mm256_sign_epi8(ones, ymm0); // sgn = simde_mm256_sign_epi8(ones, ymm0);
#ifndef AVOID_MM256_SIGN
fprintf(fd," sgn = simde_mm256_sign_epi8(ones, ymm0);\n"); fprintf(fd," sgn = simde_mm256_sign_epi8(ones, ymm0);\n");
#else
fprintf(fd," sgn = simde_mm256_xor_si256(ones, ymm0);\n");
#endif
// min = simde_mm256_abs_epi8(ymm0); // min = simde_mm256_abs_epi8(ymm0);
fprintf(fd," min = simde_mm256_abs_epi8(ymm0);\n"); fprintf(fd," min = simde_mm256_abs_epi8(ymm0);\n");
...@@ -762,11 +694,7 @@ void nrLDPC_cnProc_BG1_generator_AVX2(const char* dir, int R) ...@@ -762,11 +694,7 @@ void nrLDPC_cnProc_BG1_generator_AVX2(const char* dir, int R)
fprintf(fd," min = simde_mm256_min_epu8(min, simde_mm256_abs_epi8(ymm0));\n"); fprintf(fd," min = simde_mm256_min_epu8(min, simde_mm256_abs_epi8(ymm0));\n");
// sgn = simde_mm256_sign_epi8(sgn, ymm0); // sgn = simde_mm256_sign_epi8(sgn, ymm0);
#ifndef AVOID_MM256_SIGN
fprintf(fd," sgn = simde_mm256_sign_epi8(sgn, ymm0);\n"); fprintf(fd," sgn = simde_mm256_sign_epi8(sgn, ymm0);\n");
#else
fprintf(fd," sgn = simde_mm256_xor_si256(sgn, ymm0);\n");
#endif
} }
// Store result // Store result
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment