Skip to content
Projects
Groups
Snippets
Help
Loading...
Help
Support
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
O
OpenXG-RAN
Project overview
Project overview
Details
Activity
Releases
Repository
Repository
Files
Commits
Branches
Tags
Contributors
Graph
Compare
Issues
0
Issues
0
List
Boards
Labels
Milestones
Merge Requests
0
Merge Requests
0
CI / CD
CI / CD
Pipelines
Jobs
Schedules
Analytics
Analytics
CI / CD
Repository
Value Stream
Wiki
Wiki
Snippets
Snippets
Members
Members
Collapse sidebar
Close sidebar
Activity
Graph
Create a new issue
Jobs
Commits
Issue Boards
Open sidebar
spbro
OpenXG-RAN
Commits
aa9183c2
Commit
aa9183c2
authored
Aug 13, 2024
by
Matthias Mehlhose
Browse files
Options
Browse Files
Download
Email Patches
Plain Diff
mod: Improve signal processing speed of rotate_cpx_vector function
parent
871078a6
Changes
1
Show whitespace changes
Inline
Side-by-side
Showing
1 changed file
with
16 additions
and
11 deletions
+16
-11
openair1/PHY/TOOLS/cmult_sv.c
openair1/PHY/TOOLS/cmult_sv.c
+16
-11
No files found.
openair1/PHY/TOOLS/cmult_sv.c
View file @
aa9183c2
...
@@ -160,7 +160,6 @@ void rotate_cpx_vector(const c16_t *const x, const c16_t *const alpha, c16_t *y,
...
@@ -160,7 +160,6 @@ void rotate_cpx_vector(const c16_t *const x, const c16_t *const alpha, c16_t *y,
int32_t
*
xd
=
(
int32_t
*
)
x
;
int32_t
*
xd
=
(
int32_t
*
)
x
;
simde__m128i
shift
=
simde_mm_cvtsi32_si128
(
output_shift
);
simde__m128i
shift
=
simde_mm_cvtsi32_si128
(
output_shift
);
register
simd_q15_t
m0
,
m1
,
m2
,
m3
;
((
int16_t
*
)
&
alpha_128
)[
0
]
=
alpha
->
r
;
((
int16_t
*
)
&
alpha_128
)[
0
]
=
alpha
->
r
;
((
int16_t
*
)
&
alpha_128
)[
1
]
=
-
alpha
->
i
;
((
int16_t
*
)
&
alpha_128
)[
1
]
=
-
alpha
->
i
;
...
@@ -174,17 +173,23 @@ void rotate_cpx_vector(const c16_t *const x, const c16_t *const alpha, c16_t *y,
...
@@ -174,17 +173,23 @@ void rotate_cpx_vector(const c16_t *const x, const c16_t *const alpha, c16_t *y,
for
(
i
=
0
;
i
<
N
>>
2
;
i
++
)
{
for
(
i
=
0
;
i
<
N
>>
2
;
i
++
)
{
m0
=
simde_mm_setr_epi32
(
xd
[
0
],
xd
[
0
],
xd
[
1
],
xd
[
1
]);
y_128
[
i
]
=
simde_mm_packs_epi32
(
// pack in 16bit integers with saturation [re im re im re im re im]
m1
=
simde_mm_setr_epi32
(
xd
[
2
],
xd
[
2
],
xd
[
3
],
xd
[
3
]);
simde_mm_sra_epi32
(
// shift right by shift in order to compensate for the input amplitude
m2
=
simde_mm_madd_epi16
(
m0
,
alpha_128
);
//complex multiply. result is 32bit [Re Im Re Im]
simde_mm_madd_epi16
(
// complex multiply. result is 32bit [Re Im Re Im]
m3
=
simde_mm_madd_epi16
(
m1
,
alpha_128
);
//complex multiply. result is 32bit [Re Im Re Im]
simde_mm_setr_epi32
(
xd
[
0
+
i
*
4
],
xd
[
0
+
i
*
4
],
xd
[
1
+
i
*
4
],
xd
[
1
+
i
*
4
]),
m2
=
simde_mm_sra_epi32
(
m2
,
shift
);
// shift right by shift in order to compensate for the input amplitude
alpha_128
m3
=
simde_mm_sra_epi32
(
m3
,
shift
);
// shift right by shift in order to compensate for the input amplitude
),
shift
y_128
[
0
]
=
simde_mm_packs_epi32
(
m2
,
m3
);
// pack in 16bit integers with saturation [re im re im re im re im]
),
simde_mm_sra_epi32
(
// shift right by shift in order to compensate for the input amplitude
simde_mm_madd_epi16
(
// complex multiply. result is 32bit [Re Im Re Im]
simde_mm_setr_epi32
(
xd
[
2
+
i
*
4
],
xd
[
2
+
i
*
4
],
xd
[
3
+
i
*
4
],
xd
[
3
+
i
*
4
]),
alpha_128
),
shift
)
);
//print_ints("y_128[0]=", &y_128[0]);
//print_ints("y_128[0]=", &y_128[0]);
xd
+=
4
;
y_128
+=
1
;
}
}
#if defined(__x86__) || defined(__x86_64__)
#if defined(__x86__) || defined(__x86_64__)
}
}
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment