Skip to content
Projects
Groups
Snippets
Help
Loading...
Help
Support
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
O
OpenXG-RAN
Project overview
Project overview
Details
Activity
Releases
Repository
Repository
Files
Commits
Branches
Tags
Contributors
Graph
Compare
Issues
0
Issues
0
List
Boards
Labels
Milestones
Merge Requests
0
Merge Requests
0
CI / CD
CI / CD
Pipelines
Jobs
Schedules
Analytics
Analytics
CI / CD
Repository
Value Stream
Wiki
Wiki
Snippets
Snippets
Members
Members
Collapse sidebar
Close sidebar
Activity
Graph
Create a new issue
Jobs
Commits
Issue Boards
Open sidebar
spbro
OpenXG-RAN
Commits
baf02b8d
Commit
baf02b8d
authored
Aug 27, 2024
by
Robert Schmidt
Browse files
Options
Browse Files
Download
Plain Diff
Merge remote-tracking branch 'origin/speedup_rotate_cpx_vector' into integration_2024_w34
parents
2ec8fefb
aa9183c2
Changes
1
Show whitespace changes
Inline
Side-by-side
Showing
1 changed file
with
16 additions
and
11 deletions
+16
-11
openair1/PHY/TOOLS/cmult_sv.c
openair1/PHY/TOOLS/cmult_sv.c
+16
-11
No files found.
openair1/PHY/TOOLS/cmult_sv.c
View file @
baf02b8d
...
...
@@ -160,7 +160,6 @@ void rotate_cpx_vector(const c16_t *const x, const c16_t *const alpha, c16_t *y,
int32_t
*
xd
=
(
int32_t
*
)
x
;
simde__m128i
shift
=
simde_mm_cvtsi32_si128
(
output_shift
);
register
simd_q15_t
m0
,
m1
,
m2
,
m3
;
((
int16_t
*
)
&
alpha_128
)[
0
]
=
alpha
->
r
;
((
int16_t
*
)
&
alpha_128
)[
1
]
=
-
alpha
->
i
;
...
...
@@ -174,17 +173,23 @@ void rotate_cpx_vector(const c16_t *const x, const c16_t *const alpha, c16_t *y,
for
(
i
=
0
;
i
<
N
>>
2
;
i
++
)
{
m0
=
simde_mm_setr_epi32
(
xd
[
0
],
xd
[
0
],
xd
[
1
],
xd
[
1
]);
m1
=
simde_mm_setr_epi32
(
xd
[
2
],
xd
[
2
],
xd
[
3
],
xd
[
3
]);
m2
=
simde_mm_madd_epi16
(
m0
,
alpha_128
);
//complex multiply. result is 32bit [Re Im Re Im]
m3
=
simde_mm_madd_epi16
(
m1
,
alpha_128
);
//complex multiply. result is 32bit [Re Im Re Im]
m2
=
simde_mm_sra_epi32
(
m2
,
shift
);
// shift right by shift in order to compensate for the input amplitude
m3
=
simde_mm_sra_epi32
(
m3
,
shift
);
// shift right by shift in order to compensate for the input amplitude
y_128
[
0
]
=
simde_mm_packs_epi32
(
m2
,
m3
);
// pack in 16bit integers with saturation [re im re im re im re im]
y_128
[
i
]
=
simde_mm_packs_epi32
(
// pack in 16bit integers with saturation [re im re im re im re im]
simde_mm_sra_epi32
(
// shift right by shift in order to compensate for the input amplitude
simde_mm_madd_epi16
(
// complex multiply. result is 32bit [Re Im Re Im]
simde_mm_setr_epi32
(
xd
[
0
+
i
*
4
],
xd
[
0
+
i
*
4
],
xd
[
1
+
i
*
4
],
xd
[
1
+
i
*
4
]),
alpha_128
),
shift
),
simde_mm_sra_epi32
(
// shift right by shift in order to compensate for the input amplitude
simde_mm_madd_epi16
(
// complex multiply. result is 32bit [Re Im Re Im]
simde_mm_setr_epi32
(
xd
[
2
+
i
*
4
],
xd
[
2
+
i
*
4
],
xd
[
3
+
i
*
4
],
xd
[
3
+
i
*
4
]),
alpha_128
),
shift
)
);
//print_ints("y_128[0]=", &y_128[0]);
xd
+=
4
;
y_128
+=
1
;
}
#if defined(__x86__) || defined(__x86_64__)
}
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment