Skip to content
GitLab
Explore
Sign in
Primary navigation
Search or go to…
Project
F
FFmpeg
Manage
Activity
Members
Labels
Plan
Issues
Issue boards
Milestones
Wiki
Code
Merge requests
Repository
Branches
Commits
Tags
Repository graph
Compare revisions
Snippets
Build
Pipelines
Jobs
Pipeline schedules
Artifacts
Deploy
Releases
Container Registry
Model registry
Operate
Environments
Monitor
Incidents
Service Desk
Analyze
Value stream analytics
Contributor analytics
CI/CD analytics
Repository analytics
Model experiments
Help
Help
Support
GitLab documentation
Compare GitLab plans
Community forum
Contribute to GitLab
Provide feedback
Keyboard shortcuts
?
Snippets
Groups
Projects
Show more breadcrumbs
libremedia
Tethys
FFmpeg
Commits
a58a0139
Commit
a58a0139
authored
12 years ago
by
Justin Ruggles
Browse files
Options
Downloads
Patches
Plain Diff
lavr: x86: optimized 2-channel fltp to s16 conversion
parent
90cc27f8
No related branches found
No related tags found
No related merge requests found
Changes
2
Hide whitespace changes
Inline
Side-by-side
Showing
2 changed files
libavresample/x86/audio_convert.asm
+43
-0
43 additions, 0 deletions
libavresample/x86/audio_convert.asm
libavresample/x86/audio_convert_init.c
+9
-0
9 additions, 0 deletions
libavresample/x86/audio_convert_init.c
with
52 additions
and
0 deletions
libavresample/x86/audio_convert.asm
+
43
−
0
View file @
a58a0139
...
...
@@ -32,6 +32,7 @@ pf_s16_inv_scale: times 4 dd 0x38000000
; Four packed single-precision lanes of 0x47000000 (32768.0f). Loaded into m2
; by CONV_FLTP_TO_S16_2CH as the multiplier applied before float->int conversion.
pf_s16_scale:        times 4 dd 0x47000000
; Byte-index tables; -1 entries have the high bit set.
; NOTE(review): presumably pshufb control masks (a set high bit zeroes the
; destination byte) - their users are outside this view, confirm there.
pb_shuf_unpack_even: db -1, -1,  0,  1, -1, -1,  2,  3, -1, -1,  8,  9, -1, -1, 10, 11
pb_shuf_unpack_odd:  db -1, -1,  4,  5, -1, -1,  6,  7, -1, -1, 12, 13, -1, -1, 14, 15
; pshufb control used by the SSSE3 path of CONV_FLTP_TO_S16_2CH to turn the
; packed word order 0,2,4,6,1,3,5,7 into 0,1,2,3,4,5,6,7 (source words
; 0,4,1,5,2,6,3,7 are selected in that order).
; NOTE(review): SHUFFLE_MASK_W is defined elsewhere; presumably it expands each
; word index into the matching pair of byte indices - confirm in the util header.
pb_interleave_words: SHUFFLE_MASK_W  0,  4,  1,  5,  2,  6,  3,  7
SECTION
_TEXT
...
...
@@ -538,6 +539,48 @@ INIT_XMM avx
CONV_S16P_TO_FLT_6CH
%endif
;------------------------------------------------------------------------------
; void ff_conv_fltp_to_s16_2ch(int16_t *dst, float *const *src, int len,
;                              int channels);
;
; Converts two planar float channels into interleaved signed 16-bit samples.
;
; Arguments (x86inc names):
;   dst   - interleaved int16 output
;   src0  - on entry the plane-pointer array `src`; replaced by src[0]
;   len   - samples per channel; turned into a negative byte offset below
;   src1  - scratch GPR, receives src[1]
;   The 4th C argument (channels) is never loaded: cglobal fetches 3 args.
;
; Registers: 4 GPRs; m0/m1 = working data, m2 = pf_s16_scale,
;            m3 = pb_interleave_words (SSSE3 build only).
;
; Each iteration consumes mmsize bytes from each plane and stores mmsize bytes.
; The loop is bottom-tested and has no tail handling, and all accesses use
; mova / memory-operand mulps.
; NOTE(review): callers presumably guarantee len is a positive multiple of
; mmsize/4 and that dst/src planes are mmsize-aligned - confirm against the
; alignment values passed to ff_audio_convert_set_func.
;------------------------------------------------------------------------------

%macro CONV_FLTP_TO_S16_2CH 0
; XMM count is 4 (was 3): the SSSE3 path uses m3 in addition to m0-m2.
cglobal conv_fltp_to_s16_2ch, 3,4,4, dst, src0, len, src1
    lea      lenq, [4*lend]            ; byte count: 4 bytes per float per plane,
                                       ; and 2 ch * 2 bytes per output frame
    mov     src1q, [src0q+gprsize]     ; src1 = src[1]
    mov     src0q, [src0q        ]     ; src0 = src[0]
    ; Point all three buffers at their ends and walk a negative offset up to
    ; zero, so the loop counter doubles as the index for every access.
    add      dstq, lenq
    add     src0q, lenq
    add     src1q, lenq
    neg      lenq
    mova       m2, [pf_s16_scale]
%if cpuflag(ssse3)
    mova       m3, [pb_interleave_words]
%endif
.loop:
    mulps      m0, m2, [src0q+lenq]    ; m0 =    0,    2,    4,    6
    mulps      m1, m2, [src1q+lenq]    ; m1 =    1,    3,    5,    7
    cvtps2dq   m0, m0                  ; float -> int32
    cvtps2dq   m1, m1
%if cpuflag(ssse3)
    packssdw   m0, m1                  ; m0 = 0, 2, 4, 6, 1, 3, 5, 7 (saturated)
    pshufb     m0, m3                  ; m0 = 0, 1, 2, 3, 4, 5, 6, 7
%else
    packssdw   m0, m0                  ; m0 = 0, 2, 4, 6, x, x, x, x
    packssdw   m1, m1                  ; m1 = 1, 3, 5, 7, x, x, x, x
    punpcklwd  m0, m1                  ; m0 = 0, 1, 2, 3, 4, 5, 6, 7
%endif
    mova  [dstq+lenq], m0
    add      lenq, mmsize
    jl .loop                           ; continue while the offset is negative
    REP_RET
%endmacro

INIT_XMM sse2
CONV_FLTP_TO_S16_2CH
INIT_XMM ssse3
CONV_FLTP_TO_S16_2CH

;-----------------------------------------------------------------------------
; void ff_conv_fltp_to_flt_6ch(float *dst, float *const *src, int len,
; int channels);
...
...
This diff is collapsed.
Click to expand it.
libavresample/x86/audio_convert_init.c
+
9
−
0
View file @
a58a0139
...
...
@@ -66,6 +66,11 @@ extern void ff_conv_s16p_to_flt_6ch_ssse3(float *dst, int16_t *const *src,
extern
void
ff_conv_s16p_to_flt_6ch_avx
(
float
*
dst
,
int16_t
*
const
*
src
,
int
len
,
int
channels
);
/* 2-channel planar-float to int16 converters generated by the
 * CONV_FLTP_TO_S16_2CH macro in audio_convert.asm (SSE2 and SSSE3 builds). */
extern void ff_conv_fltp_to_s16_2ch_sse2 (int16_t *dst, float *const *src,
                                          int len, int channels);
extern void ff_conv_fltp_to_s16_2ch_ssse3(int16_t *dst, float *const *src,
                                          int len, int channels);
extern
void
ff_conv_fltp_to_flt_6ch_mmx
(
float
*
dst
,
float
*
const
*
src
,
int
len
,
int
channels
);
extern
void
ff_conv_fltp_to_flt_6ch_sse4
(
float
*
dst
,
float
*
const
*
src
,
int
len
,
...
...
@@ -110,10 +115,14 @@ av_cold void ff_audio_convert_init_x86(AudioConvert *ac)
2
,
16
,
8
,
"SSE2"
,
ff_conv_s16p_to_flt_2ch_sse2
);
ff_audio_convert_set_func
(
ac
,
AV_SAMPLE_FMT_FLT
,
AV_SAMPLE_FMT_S16P
,
6
,
16
,
4
,
"SSE2"
,
ff_conv_s16p_to_flt_6ch_sse2
);
ff_audio_convert_set_func
(
ac
,
AV_SAMPLE_FMT_S16
,
AV_SAMPLE_FMT_FLTP
,
2
,
16
,
4
,
"SSE2"
,
ff_conv_fltp_to_s16_2ch_sse2
);
}
if
(
mm_flags
&
AV_CPU_FLAG_SSSE3
&&
HAVE_SSE
)
{
ff_audio_convert_set_func
(
ac
,
AV_SAMPLE_FMT_FLT
,
AV_SAMPLE_FMT_S16P
,
6
,
16
,
4
,
"SSSE3"
,
ff_conv_s16p_to_flt_6ch_ssse3
);
ff_audio_convert_set_func
(
ac
,
AV_SAMPLE_FMT_S16
,
AV_SAMPLE_FMT_FLTP
,
2
,
16
,
4
,
"SSSE3"
,
ff_conv_fltp_to_s16_2ch_ssse3
);
}
if
(
mm_flags
&
AV_CPU_FLAG_SSE4
&&
HAVE_SSE
)
{
ff_audio_convert_set_func
(
ac
,
AV_SAMPLE_FMT_FLT
,
AV_SAMPLE_FMT_S16
,
...
...
This diff is collapsed.
Click to expand it.
Preview
0%
Loading
Try again
or
attach a new file
.
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Save comment
Cancel
Please
register
or
sign in
to comment