/****************************************************************************** * * * Copyright (C) 2018 The Android Open Source Project * * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License. * You may obtain a copy of the License at: * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. * ***************************************************************************** * Originally developed and contributed by Ittiam Systems Pvt. Ltd, Bangalore */ #include <float.h> #include <stdlib.h> #include <stdio.h> #include <math.h> #include <string.h> #include <ixheaacd_type_def.h> #include "ixheaacd_bitbuffer.h" #include "ixheaacd_interface.h" #include "ixheaacd_tns_usac.h" #include "ixheaacd_cnst.h" #include "ixheaacd_acelp_info.h" #include "ixheaacd_td_mdct.h" #include "ixheaacd_sbrdecsettings.h" #include "ixheaacd_info.h" #include "ixheaacd_sbr_common.h" #include "ixheaacd_drc_data_struct.h" #include "ixheaacd_drc_dec.h" #include "ixheaacd_sbrdecoder.h" #include "ixheaacd_mps_polyphase.h" #include "ixheaacd_sbr_const.h" #include "ixheaacd_main.h" #include "ixheaacd_arith_dec.h" #include "ixheaacd_func_def.h" #include "ixheaacd_acelp_com.h" #define F_PIT_SHARP 0.85F #define MEAN_ENER 30 extern const FLOAT32 ixheaacd_interpol_filt[INTER_LP_FIL_LEN]; VOID ixheaacd_acelp_pitch_sharpening(FLOAT32 *x, WORD32 pit_lag) { WORD32 i; for (i = pit_lag; i < LEN_SUBFR; i++) { x[i] += x[i - pit_lag] * F_PIT_SHARP; } return; } static VOID ixheaacd_acelp_decode_1sp_per_track(WORD32 idx_1p, WORD32 M, WORD32 ixheaacd_drc_offset, WORD32 track, FLOAT32 code_vec[]) { WORD32 sign_index, mask, m; WORD32 sp_pos; mask = ((1 << M) - 1); sp_pos = (idx_1p & mask) + ixheaacd_drc_offset; sign_index = ((idx_1p >> M) & 1); m = (sp_pos << 2) + track; if (sign_index == 1) code_vec[m] = (code_vec[m] - 1.0f); else code_vec[m] = (code_vec[m] + 1.0f); return; } static VOID ixheaacd_acelp_decode_2sp_per_track(WORD32 idx_2p, WORD32 M, WORD32 ixheaacd_drc_offset, WORD32 track, FLOAT32 code_vec[]) { WORD32 sign_index; WORD32 mask, m0, m1; WORD32 sp_pos[2]; mask = ((1 << M) - 1); sp_pos[0] = (((idx_2p >> M) & mask) + ixheaacd_drc_offset); sp_pos[1] = ((idx_2p & mask) + ixheaacd_drc_offset); sign_index = (idx_2p >> 2 * M) & 1; m0 = (sp_pos[0] << 2) + track; m1 = (sp_pos[1] << 2) + track; if ((sp_pos[1] - sp_pos[0]) < 0) { if (sign_index == 1) { code_vec[m0] = (code_vec[m0] - 1.0f); code_vec[m1] = (code_vec[m1] + 1.0f); } else { code_vec[m0] = (code_vec[m0] + 1.0f); code_vec[m1] = (code_vec[m1] - 1.0f); } } else { if (sign_index == 1) { code_vec[m0] = (code_vec[m0] - 1.0f); code_vec[m1] = (code_vec[m1] - 1.0f); } else { code_vec[m0] = (code_vec[m0] + 1.0f); code_vec[m1] = (code_vec[m1] + 1.0f); } } return; } static VOID ixheaacd_acelp_decode_3sp_per_track(WORD32 idx_3p, WORD32 M, WORD32 ixheaacd_drc_offset, WORD32 track, FLOAT32 code_vec[]) { WORD32 j, mask, idx_2p, idx_1p; mask = ((1 << (2 * M - 1)) - 1); idx_2p = idx_3p & mask; j = ixheaacd_drc_offset; if (((idx_3p >> ((2 * M) - 1)) & 1) == 1) { j += (1 << (M - 1)); } ixheaacd_acelp_decode_2sp_per_track(idx_2p, M - 1, j, track, code_vec); mask = ((1 << (M + 1)) - 1); idx_1p = (idx_3p >> 2 * M) & mask; ixheaacd_acelp_decode_1sp_per_track(idx_1p, M, ixheaacd_drc_offset, track, code_vec); return; } static VOID ixheaacd_d_acelp_decode_4sp_per_track_section( WORD32 index, WORD32 ixheaacd_drc_offset, WORD32 track, FLOAT32 code_vec[]) { WORD32 j, idx_2p; idx_2p = index & 31; j = ixheaacd_drc_offset; if (((index >> 5) & 1) == 1) { j += 4; } ixheaacd_acelp_decode_2sp_per_track(idx_2p, 2, j, track, code_vec); idx_2p = (index >> 6) & 127; ixheaacd_acelp_decode_2sp_per_track(idx_2p, 3, ixheaacd_drc_offset, track, code_vec); return; } static VOID ixheaacd_acelp_decode_4sp_per_track(WORD32 idx_4p, WORD32 track, FLOAT32 code_vec[]) { WORD32 idx_1p, idx_2p, idx_3p; switch ((idx_4p >> 14) & 3) { case 0: if (((idx_4p >> 13) & 1) == 0) ixheaacd_d_acelp_decode_4sp_per_track_section(idx_4p, 0, track, code_vec); else ixheaacd_d_acelp_decode_4sp_per_track_section(idx_4p, 8, track, code_vec); break; case 1: idx_1p = idx_4p >> 10; ixheaacd_acelp_decode_1sp_per_track(idx_1p, 3, 0, track, code_vec); ixheaacd_acelp_decode_3sp_per_track(idx_4p, 3, 8, track, code_vec); break; case 2: idx_2p = idx_4p >> 7; ixheaacd_acelp_decode_2sp_per_track(idx_2p, 3, 0, track, code_vec); ixheaacd_acelp_decode_2sp_per_track(idx_4p, 3, 8, track, code_vec); break; case 3: idx_3p = idx_4p >> 4; ixheaacd_acelp_decode_3sp_per_track(idx_3p, 3, 0, track, code_vec); ixheaacd_acelp_decode_1sp_per_track(idx_4p, 3, 8, track, code_vec); break; } return; } static VOID ixheaacd_d_acelp_add_pulse(WORD32 pos[], WORD32 nb_pulse, WORD32 track, FLOAT32 code[]) { WORD32 i, k; for (k = 0; k < nb_pulse; k++) { i = ((pos[k] & (16 - 1)) << 2) + track; if ((pos[k] & 16) == 0) { code[i] = (WORD16)(code[i] + 1.0f); } else { code[i] = (WORD16)(code[i] - 1.0f); } } return; } static VOID ixheaacd_d_acelp_decode_1p_n1(WORD32 index, WORD32 N, WORD32 ixheaacd_drc_offset, WORD32 pos[]) { WORD32 i, pos1, mask; mask = ((1 << N) - 1); pos1 = ((index & mask) + ixheaacd_drc_offset); i = ((index >> N) & 1); if (i == 1) { pos1 += 16; } pos[0] = pos1; return; } VOID ixheaacd_acelp_decode_pulses_per_track(WORD32 cb_index[], WORD16 code_bits, FLOAT32 code_vec[]) { WORD32 track_idx, index, ixheaacd_drc_offset, pos[6], i; memset(code_vec, 0, 64 * sizeof(FLOAT32)); if (code_bits == 12) { for (track_idx = 0; track_idx < 4; track_idx += 2) { ixheaacd_drc_offset = cb_index[2 * (track_idx / 2)]; index = cb_index[2 * (track_idx / 2) + 1]; ixheaacd_d_acelp_decode_1p_n1(index, 4, 0, pos); ixheaacd_d_acelp_add_pulse( pos, 1, 2 * ixheaacd_drc_offset + track_idx / 2, code_vec); } } else if (code_bits == 16) { i = 0; ixheaacd_drc_offset = cb_index[i++]; ixheaacd_drc_offset = (ixheaacd_drc_offset == 0) ? 1 : 3; for (track_idx = 0; track_idx < 4; track_idx++) { if (track_idx != ixheaacd_drc_offset) { index = cb_index[i++]; ixheaacd_d_acelp_decode_1p_n1(index, 4, 0, pos); ixheaacd_d_acelp_add_pulse(pos, 1, track_idx, code_vec); } } } else if (code_bits == 20) { for (track_idx = 0; track_idx < 4; track_idx++) { index = cb_index[track_idx]; ixheaacd_acelp_decode_1sp_per_track(index, 4, 0, track_idx, code_vec); } } else if (code_bits == 28) { for (track_idx = 0; track_idx < 2; track_idx++) { index = cb_index[track_idx]; ixheaacd_acelp_decode_2sp_per_track(index, 4, 0, track_idx, code_vec); } for (track_idx = 2; track_idx < 4; track_idx++) { index = cb_index[track_idx]; ixheaacd_acelp_decode_1sp_per_track(index, 4, 0, track_idx, code_vec); } } else if (code_bits == 36) { for (track_idx = 0; track_idx < 4; track_idx++) { index = cb_index[track_idx]; ixheaacd_acelp_decode_2sp_per_track(index, 4, 0, track_idx, code_vec); } } else if (code_bits == 44) { for (track_idx = 0; track_idx < 2; track_idx++) { index = cb_index[track_idx]; ixheaacd_acelp_decode_3sp_per_track(index, 4, 0, track_idx, code_vec); } for (track_idx = 2; track_idx < 4; track_idx++) { index = cb_index[track_idx]; ixheaacd_acelp_decode_2sp_per_track(index, 4, 0, track_idx, code_vec); } } else if (code_bits == 52) { for (track_idx = 0; track_idx < 4; track_idx++) { index = cb_index[track_idx]; ixheaacd_acelp_decode_3sp_per_track(index, 4, 0, track_idx, code_vec); } } else if (code_bits == 64) { for (track_idx = 0; track_idx < 4; track_idx++) { index = ((cb_index[track_idx] << 14) + cb_index[track_idx + 4]); ixheaacd_acelp_decode_4sp_per_track(index, track_idx, code_vec); } } return; } static void ixheaacd_acelp_decode_gains(WORD32 index, FLOAT32 code_vec[], FLOAT32 *pitch_gain, FLOAT32 *codebook_gain, FLOAT32 mean_exc_energy, FLOAT32 *energy) { WORD32 i; FLOAT32 avg_innov_energy, est_gain; const FLOAT32 *gain_table = ixheaacd_int_leave_gain_table; avg_innov_energy = 0.01f; for (i = 0; i < LEN_SUBFR; i++) { avg_innov_energy += code_vec[i] * code_vec[i]; } *energy = avg_innov_energy; avg_innov_energy = (FLOAT32)(10.0 * log10(avg_innov_energy / (FLOAT32)LEN_SUBFR)); est_gain = mean_exc_energy - avg_innov_energy; est_gain = (FLOAT32)pow(10.0, 0.05 * est_gain); *pitch_gain = gain_table[index * 2]; *codebook_gain = gain_table[index * 2 + 1] * est_gain; return; } static VOID ixheaacd_cb_exc_calc(FLOAT32 xcitation_curr[], WORD32 pitch_lag, WORD32 frac) { WORD32 i, j; FLOAT32 s, *x0, *x1, *x2; const FLOAT32 *c1, *c2; x0 = &xcitation_curr[-pitch_lag]; frac = -frac; if (frac < 0) { frac += UP_SAMP; x0--; } for (j = 0; j < LEN_SUBFR + 1; j++) { x1 = x0++; x2 = x1 + 1; c1 = &ixheaacd_interpol_filt[frac]; c2 = &ixheaacd_interpol_filt[UP_SAMP - frac]; s = 0.0; for (i = 0; i < INTER_LP_FIL_ORDER; i++, c1 += UP_SAMP, c2 += UP_SAMP) { s += (*x1--) * (*c1) + (*x2++) * (*c2); } xcitation_curr[j] = s; } return; } WORD32 ixheaacd_acelp_alias_cnx(ia_usac_data_struct *usac_data, ia_td_frame_data_struct *pstr_td_frame_data, WORD32 k, FLOAT32 lp_filt_coeff[], FLOAT32 stability_factor, ia_usac_lpd_decoder_handle st) { WORD32 i, subfr_idx; WORD32 pitch_lag, pitch_lag_frac, index, pitch_flag, pitch_lag_max; WORD32 pitch_lag_min = 0; FLOAT32 tmp, pitch_gain, gain_code, voicing_factor, r_v, innov_energy, pitch_energy, mean_ener_code; FLOAT32 gain_smooth, gain_code0, cpe; FLOAT32 code[LEN_SUBFR], synth_temp[128 + 16]; FLOAT32 post_process_exc[LEN_SUBFR]; FLOAT32 gain_smooth_factor; FLOAT32 *ptr_lp_filt_coeff; WORD32 pitch_min; WORD32 pitch_fr2; WORD32 pitch_fr1; WORD32 pitch_max; WORD32 subfr_nb = 0; WORD16 num_codebits_table[8] = {20, 28, 36, 44, 52, 64, 12, 16}; FLOAT32 x[FAC_LENGTH], xn2[2 * FAC_LENGTH + 16]; WORD32 int_x[FAC_LENGTH]; WORD32 TTT; WORD32 len_subfr = usac_data->len_subfrm; WORD32 fac_length; WORD8 shiftp; WORD32 preshift; WORD32 *ptr_scratch = &usac_data->scratch_buffer[0]; WORD32 *int_xn2 = &usac_data->x_ac_dec[0]; WORD32 loop_count = 0; WORD32 core_mode = pstr_td_frame_data->acelp_core_mode; FLOAT32 *synth_signal = &usac_data->synth_buf[len_subfr * k + MAX_PITCH + (((NUM_FRAMES * usac_data->num_subfrm) / 2) - 1) * LEN_SUBFR]; FLOAT32 *xcitation_curr = &usac_data->exc_buf[len_subfr * k + MAX_PITCH + (INTER_LP_FIL_ORDER + 1)]; FLOAT32 *ptr_pitch_gain = &usac_data->pitch_gain[k * usac_data->num_subfrm + (((NUM_FRAMES * usac_data->num_subfrm) / 2) - 1)]; WORD32 *ptr_pitch = &usac_data->pitch[k * usac_data->num_subfrm + (((NUM_FRAMES * usac_data->num_subfrm) / 2) - 1)]; WORD32 err = 0; fac_length = len_subfr / 2; if (st->mode_prev > 0) { for (i = 0; i < fac_length / 2; i++) { x[i] = st->fac_gain * pstr_td_frame_data->fac[k * FAC_LENGTH + 2 * i]; x[fac_length / 2 + i] = st->fac_gain * pstr_td_frame_data->fac[k * FAC_LENGTH + fac_length - 2 * i - 1]; } for (i = 0; i < fac_length / 8; i++) { x[i] *= st->fac_fd_data[2 * i]; x[fac_length - i - 1] *= st->fac_fd_data[2 * i + 1]; } preshift = 0; shiftp = ixheaacd_float2fix(x, int_x, fac_length); err = ixheaacd_acelp_mdct(int_x, int_xn2, &preshift, fac_length, ptr_scratch); if (err == -1) return err; ixheaacd_fix2float(int_xn2, xn2 + fac_length, fac_length, &shiftp, &preshift); ixheaacd_vec_cnst_mul((2.0f / (FLOAT32)fac_length), xn2 + fac_length, xn2 + fac_length, fac_length); memset(xn2, 0, fac_length * sizeof(FLOAT32)); ixheaacd_lpc_wt_synthesis_tool(st->lp_flt_coeff_a_prev, xn2 + fac_length, fac_length); for (i = 0; i < 2 * fac_length; i++) xn2[i] += synth_signal[i - (2 * fac_length)]; memcpy(synth_signal - fac_length, xn2 + fac_length, fac_length * sizeof(FLOAT32)); tmp = 0.0; ixheaacd_preemphsis_tool_float(xn2, PREEMPH_FILT_FAC, 2 * fac_length, tmp); ptr_lp_filt_coeff = st->lp_flt_coeff_a_prev; TTT = fac_length % LEN_SUBFR; if (TTT != 0) { ixheaacd_residual_tool_float( ptr_lp_filt_coeff, &xn2[fac_length], &xcitation_curr[fac_length - (2 * fac_length)], TTT, 1); ptr_lp_filt_coeff += (ORDER + 1); } loop_count = (fac_length + TTT) / LEN_SUBFR; ixheaacd_residual_tool_float(ptr_lp_filt_coeff, &xn2[fac_length + TTT], &xcitation_curr[TTT - fac_length], LEN_SUBFR, loop_count); } for (i = 0; i < ORDER; i++) synth_temp[i] = synth_signal[i - ORDER] - (PREEMPH_FILT_FAC * synth_signal[i - ORDER - 1]); i = (((st->fscale * TMIN) + (FSCALE_DENOM / 2)) / FSCALE_DENOM) - TMIN; pitch_min = TMIN + i; pitch_fr2 = TFR2 - i; pitch_fr1 = TFR1; pitch_max = TMAX + (6 * i); ptr_lp_filt_coeff = lp_filt_coeff; for (subfr_idx = 0; subfr_idx < len_subfr; subfr_idx += LEN_SUBFR) { pitch_flag = subfr_idx; if ((len_subfr == 256) && (subfr_idx == (2 * LEN_SUBFR))) { pitch_flag = 0; } index = pstr_td_frame_data->acb_index[k * 4 + subfr_nb]; if (pitch_flag == 0) { if (index < (pitch_fr2 - pitch_min) * 4) { pitch_lag = pitch_min + (index / 4); pitch_lag_frac = index - (pitch_lag - pitch_min) * 4; } else if (index < ((pitch_fr2 - pitch_min) * 4 + (pitch_fr1 - pitch_fr2) * 2)) { index -= (pitch_fr2 - pitch_min) * 4; pitch_lag = pitch_fr2 + (index / 2); pitch_lag_frac = index - (pitch_lag - pitch_fr2) * 2; pitch_lag_frac *= 2; } else { pitch_lag = index + pitch_fr1 - ((pitch_fr2 - pitch_min) * 4) - ((pitch_fr1 - pitch_fr2) * 2); pitch_lag_frac = 0; } pitch_lag_min = pitch_lag - 8; if (pitch_lag_min < pitch_min) pitch_lag_min = pitch_min; pitch_lag_max = pitch_lag_min + 15; if (pitch_lag_max > pitch_max) { pitch_lag_max = pitch_max; pitch_lag_min = pitch_lag_max - 15; } } else { pitch_lag = pitch_lag_min + index / 4; pitch_lag_frac = index - (pitch_lag - pitch_lag_min) * 4; } ixheaacd_cb_exc_calc(&xcitation_curr[subfr_idx], pitch_lag, pitch_lag_frac); mean_ener_code = (((FLOAT32)pstr_td_frame_data->mean_energy[k]) * 12.0f) + 18.0f; if (pstr_td_frame_data->ltp_filtering_flag[k * 4 + subfr_nb] == 0) { for (i = 0; i < LEN_SUBFR; i++) code[i] = (FLOAT32)(0.18 * xcitation_curr[i - 1 + subfr_idx] + 0.64 * xcitation_curr[i + subfr_idx] + 0.18 * xcitation_curr[i + 1 + subfr_idx]); ixheaacd_mem_cpy(code, &xcitation_curr[subfr_idx], LEN_SUBFR); } ixheaacd_acelp_decode_pulses_per_track( &(pstr_td_frame_data->icb_index[k * 4 + subfr_nb][0]), num_codebits_table[core_mode], code); tmp = 0.0; ixheaacd_preemphsis_tool_float(code, TILT_CODE, LEN_SUBFR, tmp); i = pitch_lag; if (pitch_lag_frac > 2) i++; if (i >= 0) ixheaacd_acelp_pitch_sharpening(code, i); index = pstr_td_frame_data->gains[k * 4 + subfr_nb]; ixheaacd_acelp_decode_gains(index, code, &pitch_gain, &gain_code, mean_ener_code, &innov_energy); pitch_energy = 0.0; for (i = 0; i < LEN_SUBFR; i++) pitch_energy += xcitation_curr[i + subfr_idx] * xcitation_curr[i + subfr_idx]; pitch_energy *= (pitch_gain * pitch_gain); innov_energy *= gain_code * gain_code; r_v = (FLOAT32)((pitch_energy - innov_energy) / (pitch_energy + innov_energy)); for (i = 0; i < LEN_SUBFR; i++) post_process_exc[i] = pitch_gain * xcitation_curr[i + subfr_idx]; for (i = 0; i < LEN_SUBFR; i++) xcitation_curr[i + subfr_idx] = pitch_gain * xcitation_curr[i + subfr_idx] + gain_code * code[i]; i = pitch_lag; if (pitch_lag_frac > 2) i++; if (i > pitch_max) i = pitch_max; *ptr_pitch++ = i; *ptr_pitch_gain++ = pitch_gain; voicing_factor = (FLOAT32)(0.5 * (1.0 - r_v)); gain_smooth_factor = stability_factor * voicing_factor; gain_code0 = gain_code; if (gain_code0 < st->gain_threshold) { gain_code0 = (FLOAT32)(gain_code0 * 1.19); if (gain_code0 > st->gain_threshold) gain_code0 = st->gain_threshold; } else { gain_code0 = (FLOAT32)(gain_code0 / 1.19); if (gain_code0 < st->gain_threshold) gain_code0 = st->gain_threshold; } st->gain_threshold = gain_code0; gain_smooth = (FLOAT32)((gain_smooth_factor * gain_code0) + ((1.0 - gain_smooth_factor) * gain_code)); for (i = 0; i < LEN_SUBFR; i++) code[i] *= gain_smooth; cpe = (FLOAT32)(0.125 * (1.0 + r_v)); post_process_exc[0] += code[0] - (cpe * code[1]); for (i = 1; i < LEN_SUBFR - 1; i++) post_process_exc[i] += code[i] - (cpe * (code[i - 1] + code[i + 1])); post_process_exc[LEN_SUBFR - 1] += code[LEN_SUBFR - 1] - (cpe * code[LEN_SUBFR - 2]); ixheaacd_synthesis_tool_float(ptr_lp_filt_coeff, post_process_exc, &synth_signal[subfr_idx], LEN_SUBFR, synth_temp); memcpy(synth_temp, &synth_signal[subfr_idx + LEN_SUBFR - ORDER], ORDER * sizeof(FLOAT32)); ptr_lp_filt_coeff += (ORDER + 1); subfr_nb++; } ixheaacd_deemphsis_tool(synth_signal, len_subfr, synth_signal[-1]); memset(synth_temp + 16, 0, 128 * sizeof(FLOAT32)); ixheaacd_synthesis_tool_float1(ptr_lp_filt_coeff, synth_temp + 16, 128); ptr_lp_filt_coeff -= (2 * (ORDER + 1)); memcpy(st->lp_flt_coeff_a_prev, ptr_lp_filt_coeff, (2 * (ORDER + 1)) * sizeof(FLOAT32)); memcpy(st->exc_prev, synth_signal + len_subfr - (1 + fac_length), (1 + fac_length) * sizeof(FLOAT32)); memcpy(st->exc_prev + 1 + fac_length, synth_temp + 16, fac_length * sizeof(FLOAT32)); ixheaacd_deemphsis_tool(st->exc_prev + 1 + fac_length, fac_length, synth_signal[len_subfr - 1]); return err; }