38 #define AMR_USE_16BIT_TABLES
65 float prediction_error[4];
79 float hpf_31_mem[2], hpf_400_mem[2];
103 for (i = 0; i < 4; i++)
146 for (i = 0; i < 9; i++)
147 isf_q[i] =
dico1_isf[ind[0]][i] * (1.0
f / (1 << 15));
149 for (i = 0; i < 7; i++)
150 isf_q[i + 9] =
dico2_isf[ind[1]][i] * (1.0
f / (1 << 15));
152 for (i = 0; i < 5; i++)
155 for (i = 0; i < 4; i++)
158 for (i = 0; i < 7; i++)
173 for (i = 0; i < 9; i++)
174 isf_q[i] =
dico1_isf[ind[0]][i] * (1.0
f / (1 << 15));
176 for (i = 0; i < 7; i++)
177 isf_q[i + 9] =
dico2_isf[ind[1]][i] * (1.0
f / (1 << 15));
179 for (i = 0; i < 3; i++)
180 isf_q[i] +=
dico21_isf[ind[2]][i] * (1.0
f / (1 << 15));
182 for (i = 0; i < 3; i++)
183 isf_q[i + 3] +=
dico22_isf[ind[3]][i] * (1.0
f / (1 << 15));
185 for (i = 0; i < 3; i++)
186 isf_q[i + 6] +=
dico23_isf[ind[4]][i] * (1.0
f / (1 << 15));
188 for (i = 0; i < 3; i++)
189 isf_q[i + 9] +=
dico24_isf[ind[5]][i] * (1.0
f / (1 << 15));
191 for (i = 0; i < 4; i++)
192 isf_q[i + 12] +=
dico25_isf[ind[6]][i] * (1.0
f / (1 << 15));
210 isf_q[i] +=
isf_mean[i] * (1.0f / (1 << 15));
227 for (k = 0; k < 3; k++) {
230 isp_q[k][i] = (1.0 - c) * isp4_past[i] + c * isp_q[3][i];
246 uint8_t *base_lag_int,
int subframe)
248 if (subframe == 0 || subframe == 2) {
249 if (pitch_index < 376) {
250 *lag_int = (pitch_index + 137) >> 2;
251 *lag_frac = pitch_index - (*lag_int << 2) + 136;
252 }
else if (pitch_index < 440) {
253 *lag_int = (pitch_index + 257 - 376) >> 1;
254 *lag_frac = (pitch_index - (*lag_int << 1) + 256 - 376) << 1;
257 *lag_int = pitch_index - 280;
261 *base_lag_int = av_clip(*lag_int - 8 - (*lag_frac < 0),
267 *lag_int = (pitch_index + 1) >> 2;
268 *lag_frac = pitch_index - (*lag_int << 2);
269 *lag_int += *base_lag_int;
279 uint8_t *base_lag_int,
int subframe,
enum Mode mode)
281 if (subframe == 0 || (subframe == 2 && mode !=
MODE_6k60)) {
282 if (pitch_index < 116) {
283 *lag_int = (pitch_index + 69) >> 1;
284 *lag_frac = (pitch_index - (*lag_int << 1) + 68) << 1;
286 *lag_int = pitch_index - 24;
290 *base_lag_int = av_clip(*lag_int - 8 - (*lag_frac < 0),
293 *lag_int = (pitch_index + 1) >> 1;
294 *lag_frac = (pitch_index - (*lag_int << 1)) << 1;
295 *lag_int += *base_lag_int;
311 int pitch_lag_int, pitch_lag_frac;
324 pitch_lag_int += pitch_lag_frac > 0;
330 pitch_lag_frac + (pitch_lag_frac > 0 ? 0 : 4),
335 if (amr_subframe->
ltp) {
339 ctx->
pitch_vector[i] = 0.18 * exc[i - 1] + 0.64 * exc[i] +
341 memcpy(exc, ctx->
pitch_vector, AMRWB_SFR_SIZE *
sizeof(
float));
346 #define BIT_STR(x,lsb,len) (((x) >> (lsb)) & ((1 << (len)) - 1))
349 #define BIT_POS(x, p) (((x) >> (p)) & 1)
368 out[0] =
BIT_POS(code, m) ? -pos : pos;
376 out[0] =
BIT_POS(code, 2*m) ? -pos0 : pos0;
377 out[1] =
BIT_POS(code, 2*m) ? -pos1 : pos1;
378 out[1] = pos0 > pos1 ? -out[1] : out[1];
383 int half_2p =
BIT_POS(code, 2*m - 1) << (m - 1);
386 m - 1, off + half_2p);
392 int half_4p, subhalf_2p;
393 int b_offset = 1 << (m - 1);
395 switch (
BIT_STR(code, 4*m - 2, 2)) {
397 half_4p =
BIT_POS(code, 4*m - 3) << (m - 1);
398 subhalf_2p =
BIT_POS(code, 2*m - 3) << (m - 2);
401 m - 2, off + half_4p + subhalf_2p);
403 m - 1, off + half_4p);
409 m - 1, off + b_offset);
415 m - 1, off + b_offset);
421 m - 1, off + b_offset);
428 int half_3p =
BIT_POS(code, 5*m - 1) << (m - 1);
431 m - 1, off + half_3p);
438 int b_offset = 1 << (m - 1);
440 int half_more =
BIT_POS(code, 6*m - 5) << (m - 1);
441 int half_other = b_offset - half_more;
443 switch (
BIT_STR(code, 6*m - 4, 2)) {
446 m - 1, off + half_more);
448 m - 1, off + half_more);
452 m - 1, off + half_other);
454 m - 1, off + half_more);
458 m - 1, off + half_other);
460 m - 1, off + half_more);
466 m - 1, off + b_offset);
481 const uint16_t *pulse_lo,
const enum Mode mode)
486 int spacing = (mode ==
MODE_6k60) ? 2 : 4;
491 for (i = 0; i < 2; i++)
495 for (i = 0; i < 4; i++)
499 for (i = 0; i < 4; i++)
503 for (i = 0; i < 2; i++)
505 for (i = 2; i < 4; i++)
509 for (i = 0; i < 4; i++)
513 for (i = 0; i < 4; i++)
515 ((int) pulse_hi[i] << 14), 4, 1);
518 for (i = 0; i < 2; i++)
520 ((int) pulse_hi[i] << 10), 4, 1);
521 for (i = 2; i < 4; i++)
523 ((int) pulse_hi[i] << 14), 4, 1);
527 for (i = 0; i < 4; i++)
529 ((int) pulse_hi[i] << 11), 4, 1);
535 for (i = 0; i < 4; i++)
537 int pos = (
FFABS(sig_pos[i][j]) - 1) * spacing + i;
539 fixed_vector[pos] += sig_pos[i][j] < 0 ? -1.0 : 1.0;
552 float *fixed_gain_factor,
float *pitch_gain)
557 *pitch_gain = gains[0] * (1.0f / (1 << 14));
558 *fixed_gain_factor = gains[1] * (1.0f / (1 << 11));
575 fixed_vector[i] -= fixed_vector[i - 1] * ctx->
tilt_coef;
579 fixed_vector[i] += fixed_vector[i - ctx->
pitch_lag_int] * 0.85;
591 float *f_vector,
float f_gain)
598 return (p_ener - f_ener) / (p_ener + f_ener);
612 float *fixed_vector,
float *buf)
628 if (ir_filter_nr < 2)
633 for (i = 0; i < 6; i++)
649 if (ir_filter_nr < 2) {
681 acc += (isf[i] - isf_past[i]) * (isf[i] - isf_past[i]);
685 return FFMAX(0.0, 1.25 - acc * 0.8 * 512);
700 float voice_fac,
float stab_fac)
702 float sm_fac = 0.5 * (1 - voice_fac) * stab_fac;
708 if (fixed_gain < *prev_tr_gain) {
709 g0 =
FFMIN(*prev_tr_gain, fixed_gain + fixed_gain *
710 (6226 * (1.0
f / (1 << 15))));
712 g0 =
FFMAX(*prev_tr_gain, fixed_gain *
713 (27536 * (1.0
f / (1 << 15))));
717 return sm_fac * g0 + (1 - sm_fac) * fixed_gain;
729 float cpe = 0.125 * (1 + voice_fac);
730 float last = fixed_vector[0];
732 fixed_vector[0] -= cpe * fixed_vector[1];
735 float cur = fixed_vector[i];
737 fixed_vector[i] -= cpe * (last + fixed_vector[i + 1]);
741 fixed_vector[AMRWB_SFR_SIZE - 1] -= cpe * last;
755 float fixed_gain,
const float *fixed_vector,
775 energy, AMRWB_SFR_SIZE);
791 static void de_emphasis(
float *out,
float *in,
float m,
float mem[1])
795 out[0] = in[0] + m * mem[0];
798 out[i] = in[i] + out[i - 1] * m;
800 mem[0] = out[AMRWB_SFR_SIZE - 1];
815 int int_part = 0, frac_part;
818 for (j = 0; j < o_size / 5; j++) {
819 out[i] = in[int_part];
823 for (k = 1; k < 5; k++) {
843 uint16_t hb_idx, uint8_t vad)
855 return av_clipf((1.0 -
FFMAX(0.0, tilt)) * (1.25 - 0.25 * wsp), 0.1, 1.0);
868 const float *synth_exc,
float hb_gain)
878 energy * hb_gain * hb_gain,
890 for (i = 7; i <
LP_ORDER - 2; i++) {
891 float prod = (diff_isf[i] - mean) * (diff_isf[i - lag] - mean);
906 float diff_isf[
LP_ORDER - 2], diff_mean;
907 float *diff_hi = diff_isf -
LP_ORDER + 1;
912 isf[LP_ORDER_16k - 1] = isf[LP_ORDER - 1];
915 for (i = 0; i < LP_ORDER - 2; i++)
916 diff_isf[i] = isf[i + 1] - isf[i];
919 for (i = 2; i < LP_ORDER - 2; i++)
920 diff_mean += diff_isf[i] * (1.0
f / (LP_ORDER - 4));
924 for (i = 0; i < 3; i++) {
927 if (corr_lag[i] > corr_lag[i_max_corr])
932 for (i = LP_ORDER - 1; i < LP_ORDER_16k - 1; i++)
933 isf[i] = isf[i - 1] + isf[i - 1 - i_max_corr]
934 - isf[i - 2 - i_max_corr];
937 est = 7965 + (isf[2] - isf[3] - isf[4]) / 6.0;
938 scale = 0.5 * (
FFMIN(est, 7600) - isf[LP_ORDER - 2]) /
939 (isf[LP_ORDER_16k - 2] - isf[LP_ORDER - 2]);
941 for (i = LP_ORDER - 1; i < LP_ORDER_16k - 1; i++)
942 diff_hi[i] = scale * (isf[i] - isf[i - 1]);
945 for (i = LP_ORDER; i < LP_ORDER_16k - 1; i++)
946 if (diff_hi[i] + diff_hi[i - 1] < 5.0) {
947 if (diff_hi[i] > diff_hi[i - 1]) {
948 diff_hi[i - 1] = 5.0 - diff_hi[i];
950 diff_hi[i] = 5.0 - diff_hi[i - 1];
953 for (i = LP_ORDER - 1; i < LP_ORDER_16k - 1; i++)
954 isf[i] = isf[i - 1] + diff_hi[i] * (1.0
f / (1 << 15));
957 for (i = 0; i < LP_ORDER_16k - 1; i++)
975 for (i = 0; i <
size; i++) {
976 out[i] = lpc[i] * fac;
993 const float *exc,
const float *isf,
const float *isf_past)
1037 memcpy(data, mem, HB_FIR_SIZE *
sizeof(
float));
1043 out[i] += data[i + j] * fir_coef[j];
1046 memcpy(mem, data + AMRWB_SFR_SIZE_16k, HB_FIR_SIZE *
sizeof(
float));
1069 int *got_frame_ptr,
AVPacket *avpkt)
1073 const uint8_t *buf = avpkt->
data;
1074 int buf_size = avpkt->
size;
1075 int expected_fr_size, header_size;
1078 float fixed_gain_factor;
1079 float *synth_fixed_vector;
1080 float synth_fixed_gain;
1081 float voice_fac, stab_fac;
1104 if (buf_size < expected_fr_size) {
1106 "Frame too small (%d bytes). Truncated file?\n", buf_size);
1144 for (sub = 0; sub < 4; sub++)
1147 for (sub = 0; sub < 4; sub++) {
1172 ctx->
tilt_coef = voice_fac * 0.25 + 0.25;
1183 voice_fac, stab_fac);
1202 AMRWB_SFR_SIZE_16k);
1227 sub_buf[i] = (sub_buf[i] + hb_samples[i]) * (1.0f / (1 << 15));
1240 return expected_fr_size;