66 const float *loop_end =
src + count;
77 "lw %[temp0], 0(%[src]) \n\t"
78 "lw %[temp1], 4(%[src]) \n\t"
79 "lw %[temp2], 8(%[src]) \n\t"
80 "lw %[temp3], 12(%[src]) \n\t"
81 "lw %[temp4], 16(%[src]) \n\t"
82 "lw %[temp5], 20(%[src]) \n\t"
83 "lw %[temp6], 24(%[src]) \n\t"
84 "lw %[temp7], 28(%[src]) \n\t"
86 "sw %[temp0], 0(%[dst]) \n\t"
87 "sw %[temp1], 4(%[dst]) \n\t"
88 "sw %[temp2], 8(%[dst]) \n\t"
89 "sw %[temp3], 12(%[dst]) \n\t"
90 "sw %[temp4], 16(%[dst]) \n\t"
91 "sw %[temp5], 20(%[dst]) \n\t"
92 "sw %[temp6], 24(%[dst]) \n\t"
93 "sw %[temp7], 28(%[dst]) \n\t"
94 "bne %[src], %[loop_end], 1b \n\t"
98 : [temp0]
"=&r"(
temp[0]), [temp1]
"=&r"(
temp[1]),
99 [temp2]
"=&r"(
temp[2]), [temp3]
"=&r"(
temp[3]),
100 [temp4]
"=&r"(
temp[4]), [temp5]
"=&r"(
temp[5]),
101 [temp6]
"=&r"(
temp[6]), [temp7]
"=&r"(
temp[7]),
102 [
src]
"+r"(
src), [dst]
"+r"(dst)
103 : [loop_end]
"r"(loop_end)
110 union {
unsigned u;
int s; } v = { previous_val * 1664525u + 1013904223 };
119 float *saved = sce->
saved;
127 for (
i = 0;
i < 1024;
i += 128)
142 float_copy(
out, saved, 448);
149 float temp0, temp1, temp2, temp3;
150 float *dst0 =
out + 448 + 0*128;
151 float *dst1 = dst0 + 64 + 63;
152 float *dst2 = saved + 63;
153 float *win0 = (
float*)swindow;
154 float *win1 = win0 + 64 + 63;
155 float *win0_prev = (
float*)swindow_prev;
156 float *win1_prev = win0_prev + 64 + 63;
157 float *src0_prev = saved + 448;
158 float *src1_prev = buf + 0*128 + 63;
159 float *
src0 = buf + 0*128 + 64;
160 float *
src1 = buf + 1*128 + 63;
162 for(
i = 0;
i < 64;
i++)
164 temp0 = src0_prev[0];
165 temp1 = src1_prev[0];
170 dst0[0] = temp0 * wj - temp1 * wi;
171 dst1[0] = temp0 * wi + temp1 * wj;
178 dst0[128] = temp2 * wj - temp3 * wi;
179 dst1[128] = temp2 * wi + temp3 * wj;
183 dst0[256] = temp0 * wj - temp1 * wi;
184 dst1[256] = temp0 * wi + temp1 * wj;
185 dst0[384] = temp2 * wj - temp3 * wi;
186 dst1[384] = temp2 * wi + temp3 * wj;
190 dst0[512] = temp0 * wj - temp1 * wi;
191 dst2[0] = temp0 * wi + temp1 * wj;
208 float_copy(
out + 576, buf + 64, 448);
217 float_copy(saved + 448, buf + 7*128 + 64, 64);
219 float_copy(saved, buf + 512, 448);
220 float_copy(saved + 448, buf + 7*128 + 64, 64);
222 float_copy(saved, buf + 512, 512);
234 float *predTime = sce->
ret;
237 int16_t num_samples = 2048;
240 num_samples = ltp->
lag + 1024;
241 j = (2048 - num_samples) >> 2;
242 k = (2048 - num_samples) & 3;
243 p_predTime = &predTime[num_samples];
245 for (
i = 0;
i < num_samples;
i++)
251 "sw $0, 0(%[p_predTime]) \n\t"
252 "sw $0, 4(%[p_predTime]) \n\t"
253 "sw $0, 8(%[p_predTime]) \n\t"
254 "sw $0, 12(%[p_predTime]) \n\t"
255 PTR_ADDIU "%[p_predTime], %[p_predTime], 16 \n\t"
257 : [p_predTime]
"+r"(p_predTime)
262 for (
i = 0;
i < k;
i++) {
265 "sw $0, 0(%[p_predTime]) \n\t"
266 PTR_ADDIU "%[p_predTime], %[p_predTime], 4 \n\t"
268 : [p_predTime]
"+r"(p_predTime)
298 for (; count > 0; count -= 4){
303 "lwc1 %[temp0], 0(%[ptr2]) \n\t"
304 "lwc1 %[temp1], -4(%[ptr2]) \n\t"
305 "lwc1 %[temp2], -8(%[ptr2]) \n\t"
306 "lwc1 %[temp3], -12(%[ptr2]) \n\t"
307 "lwc1 %[temp4], 0(%[ptr3]) \n\t"
308 "lwc1 %[temp5], -4(%[ptr3]) \n\t"
309 "lwc1 %[temp6], -8(%[ptr3]) \n\t"
310 "lwc1 %[temp7], -12(%[ptr3]) \n\t"
311 "mul.s %[temp8], %[temp0], %[temp4] \n\t"
312 "mul.s %[temp9], %[temp1], %[temp5] \n\t"
313 "mul.s %[temp10], %[temp2], %[temp6] \n\t"
314 "mul.s %[temp11], %[temp3], %[temp7] \n\t"
315 "swc1 %[temp8], 0(%[ptr1]) \n\t"
316 "swc1 %[temp9], 4(%[ptr1]) \n\t"
317 "swc1 %[temp10], 8(%[ptr1]) \n\t"
318 "swc1 %[temp11], 12(%[ptr1]) \n\t"
323 : [temp0]
"=&f"(
temp[0]), [temp1]
"=&f"(
temp[1]),
324 [temp2]
"=&f"(
temp[2]), [temp3]
"=&f"(
temp[3]),
325 [temp4]
"=&f"(
temp[4]), [temp5]
"=&f"(
temp[5]),
326 [temp6]
"=&f"(
temp[6]), [temp7]
"=&f"(
temp[7]),
327 [temp8]
"=&f"(
temp[8]), [temp9]
"=&f"(
temp[9]),
328 [temp10]
"=&f"(
temp[10]), [temp11]
"=&f"(
temp[11]),
329 [ptr1]
"+r"(dst), [ptr2]
"+r"(
src0), [ptr3]
"+r"(
src1)
339 float *saved = sce->
saved;
340 float *saved_ltp = sce->
coeffs;
343 uint32_t temp0, temp1, temp2, temp3, temp4, temp5, temp6, temp7;
346 float *p_saved_ltp = saved_ltp + 576;
347 float *loop_end1 = p_saved_ltp + 448;
349 float_copy(saved_ltp, saved, 512);
354 "sw $0, 0(%[p_saved_ltp]) \n\t"
355 "sw $0, 4(%[p_saved_ltp]) \n\t"
356 "sw $0, 8(%[p_saved_ltp]) \n\t"
357 "sw $0, 12(%[p_saved_ltp]) \n\t"
358 "sw $0, 16(%[p_saved_ltp]) \n\t"
359 "sw $0, 20(%[p_saved_ltp]) \n\t"
360 "sw $0, 24(%[p_saved_ltp]) \n\t"
361 "sw $0, 28(%[p_saved_ltp]) \n\t"
362 PTR_ADDIU "%[p_saved_ltp],%[p_saved_ltp], 32 \n\t"
363 "bne %[p_saved_ltp], %[loop_end1], 1b \n\t"
365 : [p_saved_ltp]
"+r"(p_saved_ltp)
366 : [loop_end1]
"r"(loop_end1)
371 fmul_and_reverse(saved_ltp + 512, ac->
buf_mdct + 960, swindow, 64);
373 float *buff0 = saved;
374 float *buff1 = saved_ltp;
375 float *loop_end = saved + 448;
380 ".set noreorder \n\t"
382 "lw %[temp0], 0(%[src]) \n\t"
383 "lw %[temp1], 4(%[src]) \n\t"
384 "lw %[temp2], 8(%[src]) \n\t"
385 "lw %[temp3], 12(%[src]) \n\t"
386 "lw %[temp4], 16(%[src]) \n\t"
387 "lw %[temp5], 20(%[src]) \n\t"
388 "lw %[temp6], 24(%[src]) \n\t"
389 "lw %[temp7], 28(%[src]) \n\t"
391 "sw %[temp0], 0(%[dst]) \n\t"
392 "sw %[temp1], 4(%[dst]) \n\t"
393 "sw %[temp2], 8(%[dst]) \n\t"
394 "sw %[temp3], 12(%[dst]) \n\t"
395 "sw %[temp4], 16(%[dst]) \n\t"
396 "sw %[temp5], 20(%[dst]) \n\t"
397 "sw %[temp6], 24(%[dst]) \n\t"
398 "sw %[temp7], 28(%[dst]) \n\t"
399 "sw $0, 2304(%[dst]) \n\t"
400 "sw $0, 2308(%[dst]) \n\t"
401 "sw $0, 2312(%[dst]) \n\t"
402 "sw $0, 2316(%[dst]) \n\t"
403 "sw $0, 2320(%[dst]) \n\t"
404 "sw $0, 2324(%[dst]) \n\t"
405 "sw $0, 2328(%[dst]) \n\t"
406 "sw $0, 2332(%[dst]) \n\t"
407 "bne %[src], %[loop_end], 1b \n\t"
411 : [temp0]
"=&r"(temp0), [temp1]
"=&r"(temp1),
412 [temp2]
"=&r"(temp2), [temp3]
"=&r"(temp3),
413 [temp4]
"=&r"(temp4), [temp5]
"=&r"(temp5),
414 [temp6]
"=&r"(temp6), [temp7]
"=&r"(temp7),
415 [
src]
"+r"(buff0), [dst]
"+r"(buff1)
416 : [loop_end]
"r"(loop_end)
420 fmul_and_reverse(saved_ltp + 512, ac->
buf_mdct + 960, swindow, 64);
423 fmul_and_reverse(saved_ltp + 512, ac->
buf_mdct + 512, lwindow, 512);
428 float_copy(sce->
ltp_state + 2048, saved_ltp, 1024);
437 c->imdct_and_windowing = imdct_and_windowing_mips;
438 c->apply_ltp = apply_ltp_mips;
439 c->update_ltp = update_ltp_mips;
AAC definitions and structures.
void ff_aacdec_init_mips(AACContext *c)
Reference: libavcodec/aacdec.c.
static av_always_inline int lcg_random(unsigned previous_val)
linear congruential pseudorandom number generator
float ff_aac_kbd_long_1024[1024]
float ff_aac_kbd_short_128[128]
MIPS assembly defines from sys/asm.h but rewritten for use with C inline assembly (rather than from w...
__asm__(".macro parse_r var r\n\t" "\\var = -1\n\t" _IFC_REG(0) _IFC_REG(1) _IFC_REG(2) _IFC_REG(3) _IFC_REG(4) _IFC_REG(5) _IFC_REG(6) _IFC_REG(7) _IFC_REG(8) _IFC_REG(9) _IFC_REG(10) _IFC_REG(11) _IFC_REG(12) _IFC_REG(13) _IFC_REG(14) _IFC_REG(15) _IFC_REG(16) _IFC_REG(17) _IFC_REG(18) _IFC_REG(19) _IFC_REG(20) _IFC_REG(21) _IFC_REG(22) _IFC_REG(23) _IFC_REG(24) _IFC_REG(25) _IFC_REG(26) _IFC_REG(27) _IFC_REG(28) _IFC_REG(29) _IFC_REG(30) _IFC_REG(31) ".iflt \\var\n\t" ".error \"Unable to parse register name \\r\"\n\t" ".endif\n\t" ".endm")
uint8_t pi<< 24) CONV_FUNC_GROUP(AV_SAMPLE_FMT_FLT, float, AV_SAMPLE_FMT_U8, uint8_t,(*(const uint8_t *) pi - 0x80) *(1.0f/(1<< 7))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_DBL, double, AV_SAMPLE_FMT_U8, uint8_t,(*(const uint8_t *) pi - 0x80) *(1.0/(1<< 7))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_U8, uint8_t, AV_SAMPLE_FMT_S16, int16_t,(*(const int16_t *) pi >> 8)+0x80) CONV_FUNC_GROUP(AV_SAMPLE_FMT_FLT, float, AV_SAMPLE_FMT_S16, int16_t, *(const int16_t *) pi *(1.0f/(1<< 15))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_DBL, double, AV_SAMPLE_FMT_S16, int16_t, *(const int16_t *) pi *(1.0/(1<< 15))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_U8, uint8_t, AV_SAMPLE_FMT_S32, int32_t,(*(const int32_t *) pi >> 24)+0x80) CONV_FUNC_GROUP(AV_SAMPLE_FMT_FLT, float, AV_SAMPLE_FMT_S32, int32_t, *(const int32_t *) pi *(1.0f/(1U<< 31))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_DBL, double, AV_SAMPLE_FMT_S32, int32_t, *(const int32_t *) pi *(1.0/(1U<< 31))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_U8, uint8_t, AV_SAMPLE_FMT_FLT, float, av_clip_uint8(lrintf(*(const float *) pi *(1<< 7))+0x80)) CONV_FUNC_GROUP(AV_SAMPLE_FMT_S16, int16_t, AV_SAMPLE_FMT_FLT, float, av_clip_int16(lrintf(*(const float *) pi *(1<< 15)))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_S32, int32_t, AV_SAMPLE_FMT_FLT, float, av_clipl_int32(llrintf(*(const float *) pi *(1U<< 31)))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_U8, uint8_t, AV_SAMPLE_FMT_DBL, double, av_clip_uint8(lrint(*(const double *) pi *(1<< 7))+0x80)) CONV_FUNC_GROUP(AV_SAMPLE_FMT_S16, int16_t, AV_SAMPLE_FMT_DBL, double, av_clip_int16(lrint(*(const double *) pi *(1<< 15)))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_S32, int32_t, AV_SAMPLE_FMT_DBL, double, av_clipl_int32(llrint(*(const double *) pi *(1U<< 31)))) #define SET_CONV_FUNC_GROUP(ofmt, ifmt) static void set_generic_function(AudioConvert *ac) { } void ff_audio_convert_free(AudioConvert **ac) { if(! *ac) return;ff_dither_free(&(*ac) ->dc);av_freep(ac);} AudioConvert *ff_audio_convert_alloc(AVAudioResampleContext *avr, enum AVSampleFormat out_fmt, enum AVSampleFormat in_fmt, int channels, int sample_rate, int apply_map) { AudioConvert *ac;int in_planar, out_planar;ac=av_mallocz(sizeof(*ac));if(!ac) return NULL;ac->avr=avr;ac->out_fmt=out_fmt;ac->in_fmt=in_fmt;ac->channels=channels;ac->apply_map=apply_map;if(avr->dither_method !=AV_RESAMPLE_DITHER_NONE &&av_get_packed_sample_fmt(out_fmt)==AV_SAMPLE_FMT_S16 &&av_get_bytes_per_sample(in_fmt) > 2) { ac->dc=ff_dither_alloc(avr, out_fmt, in_fmt, channels, sample_rate, apply_map);if(!ac->dc) { av_free(ac);return NULL;} return ac;} in_planar=ff_sample_fmt_is_planar(in_fmt, channels);out_planar=ff_sample_fmt_is_planar(out_fmt, channels);if(in_planar==out_planar) { ac->func_type=CONV_FUNC_TYPE_FLAT;ac->planes=in_planar ? ac->channels :1;} else if(in_planar) ac->func_type=CONV_FUNC_TYPE_INTERLEAVE;else ac->func_type=CONV_FUNC_TYPE_DEINTERLEAVE;set_generic_function(ac);if(ARCH_AARCH64) ff_audio_convert_init_aarch64(ac);if(ARCH_ARM) ff_audio_convert_init_arm(ac);if(ARCH_X86) ff_audio_convert_init_x86(ac);return ac;} int ff_audio_convert(AudioConvert *ac, AudioData *out, AudioData *in) { int use_generic=1;int len=in->nb_samples;int p;if(ac->dc) { av_log(ac->avr, AV_LOG_TRACE, "%d samples - audio_convert: %s to %s (dithered)\n", len, av_get_sample_fmt_name(ac->in_fmt), av_get_sample_fmt_name(ac->out_fmt));return ff_convert_dither(ac-> in
#define av_assert2(cond)
assert() equivalent, that does lie in speed critical code.
#define u(width, name, range_min, range_max)
static const int offsets[]
void(* apply_tns)(INTFLOAT coef[1024], TemporalNoiseShaping *tns, IndividualChannelStream *ics, int decode)
void(* windowing_and_mdct_ltp)(AACContext *ac, INTFLOAT *out, INTFLOAT *in, IndividualChannelStream *ics)
void(* vector_fmul_reverse)(float *dst, const float *src0, const float *src1, int len)
Calculate the entry wise product of two vectors of floats, and store the result in a vector of floats...
void(* vector_fmul_window)(float *dst, const float *src0, const float *src1, const float *win, int len)
Overlap/add with window function.
void(* imdct_half)(struct FFTContext *s, FFTSample *output, const FFTSample *input)
Individual Channel Stream.
uint8_t max_sfb
number of scalefactor bands per group
uint8_t use_kb_window[2]
If set, use Kaiser-Bessel window, otherwise use a sine window.
enum WindowSequence window_sequence[2]
const uint16_t * swb_offset
table of offsets to the lowest spectral coefficient of a scalefactor band, sfb, for a particular wind...
int8_t used[MAX_LTP_LONG_SFB]
Single Channel Element - used for both SCE and LFE elements.
INTFLOAT * ret
PCM output.
INTFLOAT coeffs[1024]
coefficients for IMDCT, maybe processed
INTFLOAT saved[1536]
overlap
INTFLOAT ltp_state[3072]
time signal for LTP
IndividualChannelStream ics