Skip to content
Projects
Groups
Snippets
Help
Loading...
Help
Support
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
O
OpenXG-RAN
Project overview
Project overview
Details
Activity
Releases
Repository
Repository
Files
Commits
Branches
Tags
Contributors
Graph
Compare
Issues
0
Issues
0
List
Boards
Labels
Milestones
Merge Requests
0
Merge Requests
0
CI / CD
CI / CD
Pipelines
Jobs
Schedules
Analytics
Analytics
CI / CD
Repository
Value Stream
Wiki
Wiki
Snippets
Snippets
Members
Members
Collapse sidebar
Close sidebar
Activity
Graph
Create a new issue
Jobs
Commits
Issue Boards
Open sidebar
promise
OpenXG-RAN
Commits
a7e61374
Commit
a7e61374
authored
May 09, 2020
by
Raymond Knopp
Browse files
Options
Browse Files
Download
Email Patches
Plain Diff
unrolled 2 BNs case in generator
parent
581a9731
Changes
4
Hide whitespace changes
Inline
Side-by-side
Showing
4 changed files
with
66 additions
and
9 deletions
+66
-9
openair1/PHY/CODING/nrLDPC_decoder/nrLDPC_tools/cnProc_gen.c
openair1/PHY/CODING/nrLDPC_decoder/nrLDPC_tools/cnProc_gen.c
+33
-6
openair1/PHY/CODING/nrLDPC_decoder/nrLDPC_tools/cnProc_gen.o
openair1/PHY/CODING/nrLDPC_decoder/nrLDPC_tools/cnProc_gen.o
+0
-0
openair1/PHY/CODING/nrLDPC_decoder/nrLDPC_tools/gmon.out
openair1/PHY/CODING/nrLDPC_decoder/nrLDPC_tools/gmon.out
+0
-0
openair1/PHY/CODING/nrLDPC_decoder/nrLDPC_tools/ldpc_gen_files/nrLDPC_cnProc_BG1_Z384_13.c
...r/nrLDPC_tools/ldpc_gen_files/nrLDPC_cnProc_BG1_Z384_13.c
+33
-3
No files found.
openair1/PHY/CODING/nrLDPC_decoder/nrLDPC_tools/cnProc_gen.c
View file @
a7e61374
...
@@ -92,7 +92,7 @@ void nrLDPC_cnProc_BG1_generator(uint16_t Z,int R)
...
@@ -92,7 +92,7 @@ void nrLDPC_cnProc_BG1_generator(uint16_t Z,int R)
// for (i=0; i<M; i++,iprime++)
// for (i=0; i<M; i++,iprime++)
// {
// {
fprintf
(
fd
,
" for (int i=0;i<%d;i+
+
) {
\n
"
,
M
);
fprintf
(
fd
,
" for (int i=0;i<%d;i+
=2
) {
\n
"
,
M
);
// Abs and sign of 32 CNs (first BN)
// Abs and sign of 32 CNs (first BN)
// ymm0 = p_cnProcBuf[lut_idxCnProcG3[j][0] + i];
// ymm0 = p_cnProcBuf[lut_idxCnProcG3[j][0] + i];
fprintf
(
fd
,
" ymm0 = ((__m256i*)cnProcBuf)[%d+i];
\n
"
,(
lut_startAddrCnGroups
[
0
]
>>
5
)
+
lut_idxCnProcG3
[
j
][
0
]);
fprintf
(
fd
,
" ymm0 = ((__m256i*)cnProcBuf)[%d+i];
\n
"
,(
lut_startAddrCnGroups
[
0
]
>>
5
)
+
lut_idxCnProcG3
[
j
][
0
]);
...
@@ -117,6 +117,32 @@ void nrLDPC_cnProc_BG1_generator(uint16_t Z,int R)
...
@@ -117,6 +117,32 @@ void nrLDPC_cnProc_BG1_generator(uint16_t Z,int R)
// *p_cnProcBufResBit = _mm256_sign_epi8(min, sgn);
// *p_cnProcBufResBit = _mm256_sign_epi8(min, sgn);
// p_cnProcBufResBit++;
// p_cnProcBufResBit++;
fprintf
(
fd
,
" ((__m256i*)cnProcBufRes)[%d+i] = _mm256_sign_epi8(min, sgn);
\n
"
,(
lut_startAddrCnGroups
[
0
]
>>
5
)
+
(
j
*
bitOffsetInGroup
));
fprintf
(
fd
,
" ((__m256i*)cnProcBufRes)[%d+i] = _mm256_sign_epi8(min, sgn);
\n
"
,(
lut_startAddrCnGroups
[
0
]
>>
5
)
+
(
j
*
bitOffsetInGroup
));
// Abs and sign of 32 CNs (first BN)
// ymm0 = p_cnProcBuf[lut_idxCnProcG3[j][0] + i];
fprintf
(
fd
,
" ymm0 = ((__m256i*)cnProcBuf)[%d+i];
\n
"
,(
lut_startAddrCnGroups
[
0
]
>>
5
)
+
lut_idxCnProcG3
[
j
][
0
]
+
1
);
// sgn = _mm256_sign_epi8(ones, ymm0);
fprintf
(
fd
,
" sgn = _mm256_sign_epi8(ones, ymm0);
\n
"
);
// min = _mm256_abs_epi8(ymm0);
fprintf
(
fd
,
" min = _mm256_abs_epi8(ymm0);
\n
"
);
// 32 CNs of second BN
// ymm0 = p_cnProcBuf[lut_idxCnProcG3[j][1] + i];
fprintf
(
fd
,
" ymm0 = ((__m256i*)cnProcBuf)[%d+i];
\n
"
,(
lut_startAddrCnGroups
[
0
]
>>
5
)
+
lut_idxCnProcG3
[
j
][
1
]
+
1
);
// min = _mm256_min_epu8(min, _mm256_abs_epi8(ymm0));
fprintf
(
fd
,
" min = _mm256_min_epu8(min, _mm256_abs_epi8(ymm0));
\n
"
);
// sgn = _mm256_sign_epi8(sgn, ymm0);
fprintf
(
fd
,
" sgn = _mm256_sign_epi8(sgn, ymm0);
\n
"
);
// Store result
// min = _mm256_min_epu8(min, maxLLR); // 128 in epi8 is -127
fprintf
(
fd
,
" min = _mm256_min_epu8(min, maxLLR);
\n
"
);
// *p_cnProcBufResBit = _mm256_sign_epi8(min, sgn);
// p_cnProcBufResBit++;
fprintf
(
fd
,
" ((__m256i*)cnProcBufRes)[%d+i] = _mm256_sign_epi8(min, sgn);
\n
"
,(
lut_startAddrCnGroups
[
0
]
>>
5
)
+
(
j
*
bitOffsetInGroup
)
+
1
);
fprintf
(
fd
,
" }
\n
"
);
fprintf
(
fd
,
" }
\n
"
);
}
}
}
}
...
@@ -250,7 +276,7 @@ void nrLDPC_cnProc_BG1_generator(uint16_t Z,int R)
...
@@ -250,7 +276,7 @@ void nrLDPC_cnProc_BG1_generator(uint16_t Z,int R)
// =====================================================================
// =====================================================================
// Process group with 6 BNs
// Process group with 6 BNs
fprintf
(
fd
,
"//Process group with 6 BNs
\n
"
);
// Offset is 8*384/32 = 96
// Offset is 8*384/32 = 96
const
uint16_t
lut_idxCnProcG6
[
6
][
5
]
=
{{
96
,
192
,
288
,
384
,
480
},
{
0
,
192
,
288
,
384
,
480
},
const
uint16_t
lut_idxCnProcG6
[
6
][
5
]
=
{{
96
,
192
,
288
,
384
,
480
},
{
0
,
192
,
288
,
384
,
480
},
{
0
,
96
,
288
,
384
,
480
},
{
0
,
96
,
192
,
384
,
480
},
{
0
,
96
,
288
,
384
,
480
},
{
0
,
96
,
192
,
384
,
480
},
...
@@ -316,7 +342,7 @@ void nrLDPC_cnProc_BG1_generator(uint16_t Z,int R)
...
@@ -316,7 +342,7 @@ void nrLDPC_cnProc_BG1_generator(uint16_t Z,int R)
// =====================================================================
// =====================================================================
// Process group with 7 BNs
// Process group with 7 BNs
fprintf
(
fd
,
"//Process group with 7 BNs
\n
"
);
// Offset is 5*384/32 = 60
// Offset is 5*384/32 = 60
const
uint16_t
lut_idxCnProcG7
[
7
][
6
]
=
{{
60
,
120
,
180
,
240
,
300
,
360
},
{
0
,
120
,
180
,
240
,
300
,
360
},
const
uint16_t
lut_idxCnProcG7
[
7
][
6
]
=
{{
60
,
120
,
180
,
240
,
300
,
360
},
{
0
,
120
,
180
,
240
,
300
,
360
},
{
0
,
60
,
180
,
240
,
300
,
360
},
{
0
,
60
,
120
,
240
,
300
,
360
},
{
0
,
60
,
180
,
240
,
300
,
360
},
{
0
,
60
,
120
,
240
,
300
,
360
},
...
@@ -384,7 +410,7 @@ void nrLDPC_cnProc_BG1_generator(uint16_t Z,int R)
...
@@ -384,7 +410,7 @@ void nrLDPC_cnProc_BG1_generator(uint16_t Z,int R)
// =====================================================================
// =====================================================================
// Process group with 8 BNs
// Process group with 8 BNs
fprintf
(
fd
,
"//Process group with 8 BNs
\n
"
);
// Offset is 2*384/32 = 24
// Offset is 2*384/32 = 24
const
uint8_t
lut_idxCnProcG8
[
8
][
7
]
=
{{
24
,
48
,
72
,
96
,
120
,
144
,
168
},
{
0
,
48
,
72
,
96
,
120
,
144
,
168
},
const
uint8_t
lut_idxCnProcG8
[
8
][
7
]
=
{{
24
,
48
,
72
,
96
,
120
,
144
,
168
},
{
0
,
48
,
72
,
96
,
120
,
144
,
168
},
{
0
,
24
,
72
,
96
,
120
,
144
,
168
},
{
0
,
24
,
48
,
96
,
120
,
144
,
168
},
{
0
,
24
,
72
,
96
,
120
,
144
,
168
},
{
0
,
24
,
48
,
96
,
120
,
144
,
168
},
...
@@ -452,7 +478,7 @@ void nrLDPC_cnProc_BG1_generator(uint16_t Z,int R)
...
@@ -452,7 +478,7 @@ void nrLDPC_cnProc_BG1_generator(uint16_t Z,int R)
// =====================================================================
// =====================================================================
// Process group with 9 BNs
// Process group with 9 BNs
fprintf
(
fd
,
"//Process group with 9 BNs
\n
"
);
// Offset is 2*384/32 = 24
// Offset is 2*384/32 = 24
const
uint8_t
lut_idxCnProcG9
[
9
][
8
]
=
{{
24
,
48
,
72
,
96
,
120
,
144
,
168
,
192
},
{
0
,
48
,
72
,
96
,
120
,
144
,
168
,
192
},
const
uint8_t
lut_idxCnProcG9
[
9
][
8
]
=
{{
24
,
48
,
72
,
96
,
120
,
144
,
168
,
192
},
{
0
,
48
,
72
,
96
,
120
,
144
,
168
,
192
},
{
0
,
24
,
72
,
96
,
120
,
144
,
168
,
192
},
{
0
,
24
,
48
,
96
,
120
,
144
,
168
,
192
},
{
0
,
24
,
72
,
96
,
120
,
144
,
168
,
192
},
{
0
,
24
,
48
,
96
,
120
,
144
,
168
,
192
},
...
@@ -522,7 +548,7 @@ void nrLDPC_cnProc_BG1_generator(uint16_t Z,int R)
...
@@ -522,7 +548,7 @@ void nrLDPC_cnProc_BG1_generator(uint16_t Z,int R)
// =====================================================================
// =====================================================================
// Process group with 10 BNs
// Process group with 10 BNs
fprintf
(
fd
,
"//Process group with 10 BNs
\n
"
);
// Offset is 1*384/32 = 12
// Offset is 1*384/32 = 12
const
uint8_t
lut_idxCnProcG10
[
10
][
9
]
=
{{
12
,
24
,
36
,
48
,
60
,
72
,
84
,
96
,
108
},
{
0
,
24
,
36
,
48
,
60
,
72
,
84
,
96
,
108
},
const
uint8_t
lut_idxCnProcG10
[
10
][
9
]
=
{{
12
,
24
,
36
,
48
,
60
,
72
,
84
,
96
,
108
},
{
0
,
24
,
36
,
48
,
60
,
72
,
84
,
96
,
108
},
{
0
,
12
,
36
,
48
,
60
,
72
,
84
,
96
,
108
},
{
0
,
12
,
24
,
48
,
60
,
72
,
84
,
96
,
108
},
{
0
,
12
,
36
,
48
,
60
,
72
,
84
,
96
,
108
},
{
0
,
12
,
24
,
48
,
60
,
72
,
84
,
96
,
108
},
...
@@ -593,6 +619,7 @@ void nrLDPC_cnProc_BG1_generator(uint16_t Z,int R)
...
@@ -593,6 +619,7 @@ void nrLDPC_cnProc_BG1_generator(uint16_t Z,int R)
// =====================================================================
// =====================================================================
// Process group with 19 BNs
// Process group with 19 BNs
fprintf
(
fd
,
"//Process group with 19 BNs
\n
"
);
// Offset is 4*384/32 = 12
// Offset is 4*384/32 = 12
const
uint16_t
lut_idxCnProcG19
[
19
][
18
]
=
{{
48
,
96
,
144
,
192
,
240
,
288
,
336
,
384
,
432
,
480
,
528
,
576
,
624
,
672
,
720
,
768
,
816
,
864
},
{
0
,
96
,
144
,
192
,
240
,
288
,
336
,
384
,
432
,
480
,
528
,
576
,
624
,
672
,
720
,
768
,
816
,
864
},
const
uint16_t
lut_idxCnProcG19
[
19
][
18
]
=
{{
48
,
96
,
144
,
192
,
240
,
288
,
336
,
384
,
432
,
480
,
528
,
576
,
624
,
672
,
720
,
768
,
816
,
864
},
{
0
,
96
,
144
,
192
,
240
,
288
,
336
,
384
,
432
,
480
,
528
,
576
,
624
,
672
,
720
,
768
,
816
,
864
},
{
0
,
48
,
144
,
192
,
240
,
288
,
336
,
384
,
432
,
480
,
528
,
576
,
624
,
672
,
720
,
768
,
816
,
864
},
{
0
,
48
,
96
,
192
,
240
,
288
,
336
,
384
,
432
,
480
,
528
,
576
,
624
,
672
,
720
,
768
,
816
,
864
},
{
0
,
48
,
144
,
192
,
240
,
288
,
336
,
384
,
432
,
480
,
528
,
576
,
624
,
672
,
720
,
768
,
816
,
864
},
{
0
,
48
,
96
,
192
,
240
,
288
,
336
,
384
,
432
,
480
,
528
,
576
,
624
,
672
,
720
,
768
,
816
,
864
},
...
...
openair1/PHY/CODING/nrLDPC_decoder/nrLDPC_tools/cnProc_gen.o
View file @
a7e61374
No preview for this file type
openair1/PHY/CODING/nrLDPC_decoder/nrLDPC_tools/gmon.out
View file @
a7e61374
No preview for this file type
openair1/PHY/CODING/nrLDPC_decoder/nrLDPC_tools/ldpc_gen_files/nrLDPC_cnProc_BG1_Z384_13.c
View file @
a7e61374
...
@@ -5,7 +5,7 @@ void nrLDPC_cnProc_BG1_Z384_13(int8_t* cnProcBuf,int8_t* cnProcBufRes) {
...
@@ -5,7 +5,7 @@ void nrLDPC_cnProc_BG1_Z384_13(int8_t* cnProcBuf,int8_t* cnProcBufRes) {
__m256i
ymm0
,
min
,
sgn
,
ones
,
maxLLR
;
__m256i
ymm0
,
min
,
sgn
,
ones
,
maxLLR
;
ones
=
_mm256_set1_epi8
((
char
)
1
);
ones
=
_mm256_set1_epi8
((
char
)
1
);
maxLLR
=
_mm256_set1_epi8
((
char
)
127
);
maxLLR
=
_mm256_set1_epi8
((
char
)
127
);
for
(
int
i
=
0
;
i
<
12
;
i
+
+
)
{
for
(
int
i
=
0
;
i
<
12
;
i
+
=
2
)
{
ymm0
=
((
__m256i
*
)
cnProcBuf
)[
12
+
i
];
ymm0
=
((
__m256i
*
)
cnProcBuf
)[
12
+
i
];
sgn
=
_mm256_sign_epi8
(
ones
,
ymm0
);
sgn
=
_mm256_sign_epi8
(
ones
,
ymm0
);
min
=
_mm256_abs_epi8
(
ymm0
);
min
=
_mm256_abs_epi8
(
ymm0
);
...
@@ -14,8 +14,16 @@ void nrLDPC_cnProc_BG1_Z384_13(int8_t* cnProcBuf,int8_t* cnProcBufRes) {
...
@@ -14,8 +14,16 @@ void nrLDPC_cnProc_BG1_Z384_13(int8_t* cnProcBuf,int8_t* cnProcBufRes) {
sgn
=
_mm256_sign_epi8
(
sgn
,
ymm0
);
sgn
=
_mm256_sign_epi8
(
sgn
,
ymm0
);
min
=
_mm256_min_epu8
(
min
,
maxLLR
);
min
=
_mm256_min_epu8
(
min
,
maxLLR
);
((
__m256i
*
)
cnProcBufRes
)[
0
+
i
]
=
_mm256_sign_epi8
(
min
,
sgn
);
((
__m256i
*
)
cnProcBufRes
)[
0
+
i
]
=
_mm256_sign_epi8
(
min
,
sgn
);
ymm0
=
((
__m256i
*
)
cnProcBuf
)[
13
+
i
];
sgn
=
_mm256_sign_epi8
(
ones
,
ymm0
);
min
=
_mm256_abs_epi8
(
ymm0
);
ymm0
=
((
__m256i
*
)
cnProcBuf
)[
25
+
i
];
min
=
_mm256_min_epu8
(
min
,
_mm256_abs_epi8
(
ymm0
));
sgn
=
_mm256_sign_epi8
(
sgn
,
ymm0
);
min
=
_mm256_min_epu8
(
min
,
maxLLR
);
((
__m256i
*
)
cnProcBufRes
)[
1
+
i
]
=
_mm256_sign_epi8
(
min
,
sgn
);
}
}
for
(
int
i
=
0
;
i
<
12
;
i
+
+
)
{
for
(
int
i
=
0
;
i
<
12
;
i
+
=
2
)
{
ymm0
=
((
__m256i
*
)
cnProcBuf
)[
0
+
i
];
ymm0
=
((
__m256i
*
)
cnProcBuf
)[
0
+
i
];
sgn
=
_mm256_sign_epi8
(
ones
,
ymm0
);
sgn
=
_mm256_sign_epi8
(
ones
,
ymm0
);
min
=
_mm256_abs_epi8
(
ymm0
);
min
=
_mm256_abs_epi8
(
ymm0
);
...
@@ -24,8 +32,16 @@ void nrLDPC_cnProc_BG1_Z384_13(int8_t* cnProcBuf,int8_t* cnProcBufRes) {
...
@@ -24,8 +32,16 @@ void nrLDPC_cnProc_BG1_Z384_13(int8_t* cnProcBuf,int8_t* cnProcBufRes) {
sgn
=
_mm256_sign_epi8
(
sgn
,
ymm0
);
sgn
=
_mm256_sign_epi8
(
sgn
,
ymm0
);
min
=
_mm256_min_epu8
(
min
,
maxLLR
);
min
=
_mm256_min_epu8
(
min
,
maxLLR
);
((
__m256i
*
)
cnProcBufRes
)[
12
+
i
]
=
_mm256_sign_epi8
(
min
,
sgn
);
((
__m256i
*
)
cnProcBufRes
)[
12
+
i
]
=
_mm256_sign_epi8
(
min
,
sgn
);
ymm0
=
((
__m256i
*
)
cnProcBuf
)[
1
+
i
];
sgn
=
_mm256_sign_epi8
(
ones
,
ymm0
);
min
=
_mm256_abs_epi8
(
ymm0
);
ymm0
=
((
__m256i
*
)
cnProcBuf
)[
25
+
i
];
min
=
_mm256_min_epu8
(
min
,
_mm256_abs_epi8
(
ymm0
));
sgn
=
_mm256_sign_epi8
(
sgn
,
ymm0
);
min
=
_mm256_min_epu8
(
min
,
maxLLR
);
((
__m256i
*
)
cnProcBufRes
)[
13
+
i
]
=
_mm256_sign_epi8
(
min
,
sgn
);
}
}
for
(
int
i
=
0
;
i
<
12
;
i
+
+
)
{
for
(
int
i
=
0
;
i
<
12
;
i
+
=
2
)
{
ymm0
=
((
__m256i
*
)
cnProcBuf
)[
0
+
i
];
ymm0
=
((
__m256i
*
)
cnProcBuf
)[
0
+
i
];
sgn
=
_mm256_sign_epi8
(
ones
,
ymm0
);
sgn
=
_mm256_sign_epi8
(
ones
,
ymm0
);
min
=
_mm256_abs_epi8
(
ymm0
);
min
=
_mm256_abs_epi8
(
ymm0
);
...
@@ -34,6 +50,14 @@ void nrLDPC_cnProc_BG1_Z384_13(int8_t* cnProcBuf,int8_t* cnProcBufRes) {
...
@@ -34,6 +50,14 @@ void nrLDPC_cnProc_BG1_Z384_13(int8_t* cnProcBuf,int8_t* cnProcBufRes) {
sgn
=
_mm256_sign_epi8
(
sgn
,
ymm0
);
sgn
=
_mm256_sign_epi8
(
sgn
,
ymm0
);
min
=
_mm256_min_epu8
(
min
,
maxLLR
);
min
=
_mm256_min_epu8
(
min
,
maxLLR
);
((
__m256i
*
)
cnProcBufRes
)[
24
+
i
]
=
_mm256_sign_epi8
(
min
,
sgn
);
((
__m256i
*
)
cnProcBufRes
)[
24
+
i
]
=
_mm256_sign_epi8
(
min
,
sgn
);
ymm0
=
((
__m256i
*
)
cnProcBuf
)[
1
+
i
];
sgn
=
_mm256_sign_epi8
(
ones
,
ymm0
);
min
=
_mm256_abs_epi8
(
ymm0
);
ymm0
=
((
__m256i
*
)
cnProcBuf
)[
13
+
i
];
min
=
_mm256_min_epu8
(
min
,
_mm256_abs_epi8
(
ymm0
));
sgn
=
_mm256_sign_epi8
(
sgn
,
ymm0
);
min
=
_mm256_min_epu8
(
min
,
maxLLR
);
((
__m256i
*
)
cnProcBufRes
)[
25
+
i
]
=
_mm256_sign_epi8
(
min
,
sgn
);
}
}
//Process group with 4 BNs
//Process group with 4 BNs
for
(
int
i
=
0
;
i
<
60
;
i
++
)
{
for
(
int
i
=
0
;
i
<
60
;
i
++
)
{
...
@@ -169,6 +193,7 @@ void nrLDPC_cnProc_BG1_Z384_13(int8_t* cnProcBuf,int8_t* cnProcBufRes) {
...
@@ -169,6 +193,7 @@ void nrLDPC_cnProc_BG1_Z384_13(int8_t* cnProcBuf,int8_t* cnProcBufRes) {
min
=
_mm256_min_epu8
(
min
,
maxLLR
);
min
=
_mm256_min_epu8
(
min
,
maxLLR
);
((
__m256i
*
)
cnProcBufRes
)[
1140
+
i
]
=
_mm256_sign_epi8
(
min
,
sgn
);
((
__m256i
*
)
cnProcBufRes
)[
1140
+
i
]
=
_mm256_sign_epi8
(
min
,
sgn
);
}
}
//Process group with 6 BNs
for
(
int
i
=
0
;
i
<
96
;
i
++
)
{
for
(
int
i
=
0
;
i
<
96
;
i
++
)
{
ymm0
=
((
__m256i
*
)
cnProcBuf
)[
1452
+
i
];
ymm0
=
((
__m256i
*
)
cnProcBuf
)[
1452
+
i
];
sgn
=
_mm256_sign_epi8
(
ones
,
ymm0
);
sgn
=
_mm256_sign_epi8
(
ones
,
ymm0
);
...
@@ -283,6 +308,7 @@ void nrLDPC_cnProc_BG1_Z384_13(int8_t* cnProcBuf,int8_t* cnProcBufRes) {
...
@@ -283,6 +308,7 @@ void nrLDPC_cnProc_BG1_Z384_13(int8_t* cnProcBuf,int8_t* cnProcBufRes) {
min
=
_mm256_min_epu8
(
min
,
maxLLR
);
min
=
_mm256_min_epu8
(
min
,
maxLLR
);
((
__m256i
*
)
cnProcBufRes
)[
1836
+
i
]
=
_mm256_sign_epi8
(
min
,
sgn
);
((
__m256i
*
)
cnProcBufRes
)[
1836
+
i
]
=
_mm256_sign_epi8
(
min
,
sgn
);
}
}
//Process group with 7 BNs
for
(
int
i
=
0
;
i
<
60
;
i
++
)
{
for
(
int
i
=
0
;
i
<
60
;
i
++
)
{
ymm0
=
((
__m256i
*
)
cnProcBuf
)[
1992
+
i
];
ymm0
=
((
__m256i
*
)
cnProcBuf
)[
1992
+
i
];
sgn
=
_mm256_sign_epi8
(
ones
,
ymm0
);
sgn
=
_mm256_sign_epi8
(
ones
,
ymm0
);
...
@@ -437,6 +463,7 @@ void nrLDPC_cnProc_BG1_Z384_13(int8_t* cnProcBuf,int8_t* cnProcBufRes) {
...
@@ -437,6 +463,7 @@ void nrLDPC_cnProc_BG1_Z384_13(int8_t* cnProcBuf,int8_t* cnProcBufRes) {
min
=
_mm256_min_epu8
(
min
,
maxLLR
);
min
=
_mm256_min_epu8
(
min
,
maxLLR
);
((
__m256i
*
)
cnProcBufRes
)[
2292
+
i
]
=
_mm256_sign_epi8
(
min
,
sgn
);
((
__m256i
*
)
cnProcBufRes
)[
2292
+
i
]
=
_mm256_sign_epi8
(
min
,
sgn
);
}
}
//Process group with 8 BNs
for
(
int
i
=
0
;
i
<
24
;
i
++
)
{
for
(
int
i
=
0
;
i
<
24
;
i
++
)
{
ymm0
=
((
__m256i
*
)
cnProcBuf
)[
2376
+
i
];
ymm0
=
((
__m256i
*
)
cnProcBuf
)[
2376
+
i
];
sgn
=
_mm256_sign_epi8
(
ones
,
ymm0
);
sgn
=
_mm256_sign_epi8
(
ones
,
ymm0
);
...
@@ -637,6 +664,7 @@ void nrLDPC_cnProc_BG1_Z384_13(int8_t* cnProcBuf,int8_t* cnProcBufRes) {
...
@@ -637,6 +664,7 @@ void nrLDPC_cnProc_BG1_Z384_13(int8_t* cnProcBuf,int8_t* cnProcBufRes) {
min
=
_mm256_min_epu8
(
min
,
maxLLR
);
min
=
_mm256_min_epu8
(
min
,
maxLLR
);
((
__m256i
*
)
cnProcBufRes
)[
2520
+
i
]
=
_mm256_sign_epi8
(
min
,
sgn
);
((
__m256i
*
)
cnProcBufRes
)[
2520
+
i
]
=
_mm256_sign_epi8
(
min
,
sgn
);
}
}
//Process group with 9 BNs
for
(
int
i
=
0
;
i
<
24
;
i
++
)
{
for
(
int
i
=
0
;
i
<
24
;
i
++
)
{
ymm0
=
((
__m256i
*
)
cnProcBuf
)[
2568
+
i
];
ymm0
=
((
__m256i
*
)
cnProcBuf
)[
2568
+
i
];
sgn
=
_mm256_sign_epi8
(
ones
,
ymm0
);
sgn
=
_mm256_sign_epi8
(
ones
,
ymm0
);
...
@@ -889,6 +917,7 @@ void nrLDPC_cnProc_BG1_Z384_13(int8_t* cnProcBuf,int8_t* cnProcBufRes) {
...
@@ -889,6 +917,7 @@ void nrLDPC_cnProc_BG1_Z384_13(int8_t* cnProcBuf,int8_t* cnProcBufRes) {
min
=
_mm256_min_epu8
(
min
,
maxLLR
);
min
=
_mm256_min_epu8
(
min
,
maxLLR
);
((
__m256i
*
)
cnProcBufRes
)[
2736
+
i
]
=
_mm256_sign_epi8
(
min
,
sgn
);
((
__m256i
*
)
cnProcBufRes
)[
2736
+
i
]
=
_mm256_sign_epi8
(
min
,
sgn
);
}
}
//Process group with 10 BNs
for
(
int
i
=
0
;
i
<
12
;
i
++
)
{
for
(
int
i
=
0
;
i
<
12
;
i
++
)
{
ymm0
=
((
__m256i
*
)
cnProcBuf
)[
2772
+
i
];
ymm0
=
((
__m256i
*
)
cnProcBuf
)[
2772
+
i
];
sgn
=
_mm256_sign_epi8
(
ones
,
ymm0
);
sgn
=
_mm256_sign_epi8
(
ones
,
ymm0
);
...
@@ -1199,6 +1228,7 @@ void nrLDPC_cnProc_BG1_Z384_13(int8_t* cnProcBuf,int8_t* cnProcBufRes) {
...
@@ -1199,6 +1228,7 @@ void nrLDPC_cnProc_BG1_Z384_13(int8_t* cnProcBuf,int8_t* cnProcBufRes) {
min
=
_mm256_min_epu8
(
min
,
maxLLR
);
min
=
_mm256_min_epu8
(
min
,
maxLLR
);
((
__m256i
*
)
cnProcBufRes
)[
2868
+
i
]
=
_mm256_sign_epi8
(
min
,
sgn
);
((
__m256i
*
)
cnProcBufRes
)[
2868
+
i
]
=
_mm256_sign_epi8
(
min
,
sgn
);
}
}
//Process group with 19 BNs
for
(
int
i
=
0
;
i
<
48
;
i
++
)
{
for
(
int
i
=
0
;
i
<
48
;
i
++
)
{
ymm0
=
((
__m256i
*
)
cnProcBuf
)[
2928
+
i
];
ymm0
=
((
__m256i
*
)
cnProcBuf
)[
2928
+
i
];
sgn
=
_mm256_sign_epi8
(
ones
,
ymm0
);
sgn
=
_mm256_sign_epi8
(
ones
,
ymm0
);
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment