mirror of
https://github.com/oxen-io/session-android.git
synced 2025-01-07 22:27:42 +00:00
383 lines
13 KiB
C
383 lines
13 KiB
C
|
/*
|
||
|
* Copyright (c) 2011 The WebRTC project authors. All Rights Reserved.
|
||
|
*
|
||
|
* Use of this source code is governed by a BSD-style license
|
||
|
* that can be found in the LICENSE file in the root of the source
|
||
|
* tree. An additional intellectual property rights grant can be found
|
||
|
* in the file PATENTS. All contributing project authors may
|
||
|
* be found in the AUTHORS file in the root of the source tree.
|
||
|
*/
|
||
|
|
||
|
/******************************************************************
|
||
|
|
||
|
iLBC Speech Coder ANSI-C Source Code
|
||
|
|
||
|
WebRtcIlbcfix_EnhancerInterface.c
|
||
|
|
||
|
******************************************************************/
|
||
|
|
||
|
#include <string.h>
|
||
|
|
||
|
#include "defines.h"
|
||
|
#include "constants.h"
|
||
|
#include "xcorr_coef.h"
|
||
|
#include "enhancer.h"
|
||
|
#include "hp_output.h"
|
||
|
|
||
|
|
||
|
|
||
|
/*----------------------------------------------------------------*
|
||
|
* interface for enhancer
|
||
|
*---------------------------------------------------------------*/
|
||
|
|
||
|
int WebRtcIlbcfix_EnhancerInterface( /* (o) Estimated lag in end of in[] */
|
||
|
int16_t *out, /* (o) enhanced signal */
|
||
|
int16_t *in, /* (i) unenhanced signal */
|
||
|
iLBC_Dec_Inst_t *iLBCdec_inst /* (i) buffers etc */
|
||
|
){
|
||
|
int iblock;
|
||
|
int lag=20, tlag=20;
|
||
|
int inLen=iLBCdec_inst->blockl+120;
|
||
|
int16_t scale, scale1, plc_blockl;
|
||
|
int16_t *enh_buf, *enh_period;
|
||
|
int32_t tmp1, tmp2, max, new_blocks;
|
||
|
int16_t *enh_bufPtr1;
|
||
|
int i, k;
|
||
|
int16_t EnChange;
|
||
|
int16_t SqrtEnChange;
|
||
|
int16_t inc;
|
||
|
int16_t win;
|
||
|
int16_t *tmpW16ptr;
|
||
|
int16_t startPos;
|
||
|
int16_t *plc_pred;
|
||
|
int16_t *target, *regressor;
|
||
|
int16_t max16;
|
||
|
int shifts;
|
||
|
int32_t ener;
|
||
|
int16_t enerSh;
|
||
|
int16_t corrSh;
|
||
|
int16_t ind, sh;
|
||
|
int16_t start, stop;
|
||
|
/* Stack based */
|
||
|
int16_t totsh[3];
|
||
|
int16_t downsampled[(BLOCKL_MAX+120)>>1]; /* length 180 */
|
||
|
int32_t corr32[50];
|
||
|
int32_t corrmax[3];
|
||
|
int16_t corr16[3];
|
||
|
int16_t en16[3];
|
||
|
int16_t lagmax[3];
|
||
|
|
||
|
plc_pred = downsampled; /* Reuse memory since plc_pred[ENH_BLOCKL] and
|
||
|
downsampled are non overlapping */
|
||
|
enh_buf=iLBCdec_inst->enh_buf;
|
||
|
enh_period=iLBCdec_inst->enh_period;
|
||
|
|
||
|
/* Copy in the new data into the enhancer buffer */
|
||
|
memmove(enh_buf, &enh_buf[iLBCdec_inst->blockl],
|
||
|
(ENH_BUFL - iLBCdec_inst->blockl) * sizeof(*enh_buf));
|
||
|
|
||
|
WEBRTC_SPL_MEMCPY_W16(&enh_buf[ENH_BUFL-iLBCdec_inst->blockl], in,
|
||
|
iLBCdec_inst->blockl);
|
||
|
|
||
|
/* Set variables that are dependent on frame size */
|
||
|
if (iLBCdec_inst->mode==30) {
|
||
|
plc_blockl=ENH_BLOCKL;
|
||
|
new_blocks=3;
|
||
|
startPos=320; /* Start position for enhancement
|
||
|
(640-new_blocks*ENH_BLOCKL-80) */
|
||
|
} else {
|
||
|
plc_blockl=40;
|
||
|
new_blocks=2;
|
||
|
startPos=440; /* Start position for enhancement
|
||
|
(640-new_blocks*ENH_BLOCKL-40) */
|
||
|
}
|
||
|
|
||
|
/* Update the pitch prediction for each enhancer block, move the old ones */
|
||
|
memmove(enh_period, &enh_period[new_blocks],
|
||
|
(ENH_NBLOCKS_TOT - new_blocks) * sizeof(*enh_period));
|
||
|
|
||
|
k=WebRtcSpl_DownsampleFast(
|
||
|
enh_buf+ENH_BUFL-inLen, /* Input samples */
|
||
|
(int16_t)(inLen+ENH_BUFL_FILTEROVERHEAD),
|
||
|
downsampled,
|
||
|
(int16_t)WEBRTC_SPL_RSHIFT_W16(inLen, 1),
|
||
|
(int16_t*)WebRtcIlbcfix_kLpFiltCoefs, /* Coefficients in Q12 */
|
||
|
FILTERORDER_DS_PLUS1, /* Length of filter (order-1) */
|
||
|
FACTOR_DS,
|
||
|
DELAY_DS);
|
||
|
|
||
|
/* Estimate the pitch in the down sampled domain. */
|
||
|
for(iblock = 0; iblock<new_blocks; iblock++){
|
||
|
|
||
|
/* references */
|
||
|
i=60+WEBRTC_SPL_MUL_16_16(iblock,ENH_BLOCKL_HALF);
|
||
|
target=downsampled+i;
|
||
|
regressor=downsampled+i-10;
|
||
|
|
||
|
/* scaling */
|
||
|
max16=WebRtcSpl_MaxAbsValueW16(®ressor[-50],
|
||
|
(int16_t)(ENH_BLOCKL_HALF+50-1));
|
||
|
shifts = WebRtcSpl_GetSizeInBits(WEBRTC_SPL_MUL_16_16(max16, max16)) - 25;
|
||
|
shifts = WEBRTC_SPL_MAX(0, shifts);
|
||
|
|
||
|
/* compute cross correlation */
|
||
|
WebRtcSpl_CrossCorrelation(corr32, target, regressor,
|
||
|
ENH_BLOCKL_HALF, 50, (int16_t)shifts, -1);
|
||
|
|
||
|
/* Find 3 highest correlations that should be compared for the
|
||
|
highest (corr*corr)/ener */
|
||
|
|
||
|
for (i=0;i<2;i++) {
|
||
|
lagmax[i] = WebRtcSpl_MaxIndexW32(corr32, 50);
|
||
|
corrmax[i] = corr32[lagmax[i]];
|
||
|
start = lagmax[i] - 2;
|
||
|
stop = lagmax[i] + 2;
|
||
|
start = WEBRTC_SPL_MAX(0, start);
|
||
|
stop = WEBRTC_SPL_MIN(49, stop);
|
||
|
for (k=start; k<=stop; k++) {
|
||
|
corr32[k] = 0;
|
||
|
}
|
||
|
}
|
||
|
lagmax[2] = WebRtcSpl_MaxIndexW32(corr32, 50);
|
||
|
corrmax[2] = corr32[lagmax[2]];
|
||
|
|
||
|
/* Calculate normalized corr^2 and ener */
|
||
|
for (i=0;i<3;i++) {
|
||
|
corrSh = 15-WebRtcSpl_GetSizeInBits(corrmax[i]);
|
||
|
ener = WebRtcSpl_DotProductWithScale(®ressor[-lagmax[i]],
|
||
|
®ressor[-lagmax[i]],
|
||
|
ENH_BLOCKL_HALF, shifts);
|
||
|
enerSh = 15-WebRtcSpl_GetSizeInBits(ener);
|
||
|
corr16[i] = (int16_t)WEBRTC_SPL_SHIFT_W32(corrmax[i], corrSh);
|
||
|
corr16[i] = (int16_t)WEBRTC_SPL_MUL_16_16_RSFT(corr16[i],
|
||
|
corr16[i], 16);
|
||
|
en16[i] = (int16_t)WEBRTC_SPL_SHIFT_W32(ener, enerSh);
|
||
|
totsh[i] = enerSh - WEBRTC_SPL_LSHIFT_W32(corrSh, 1);
|
||
|
}
|
||
|
|
||
|
/* Compare lagmax[0..3] for the (corr^2)/ener criteria */
|
||
|
ind = 0;
|
||
|
for (i=1; i<3; i++) {
|
||
|
if (totsh[ind] > totsh[i]) {
|
||
|
sh = WEBRTC_SPL_MIN(31, totsh[ind]-totsh[i]);
|
||
|
if ( WEBRTC_SPL_MUL_16_16(corr16[ind], en16[i]) <
|
||
|
WEBRTC_SPL_MUL_16_16_RSFT(corr16[i], en16[ind], sh)) {
|
||
|
ind = i;
|
||
|
}
|
||
|
} else {
|
||
|
sh = WEBRTC_SPL_MIN(31, totsh[i]-totsh[ind]);
|
||
|
if (WEBRTC_SPL_MUL_16_16_RSFT(corr16[ind], en16[i], sh) <
|
||
|
WEBRTC_SPL_MUL_16_16(corr16[i], en16[ind])) {
|
||
|
ind = i;
|
||
|
}
|
||
|
}
|
||
|
}
|
||
|
|
||
|
lag = lagmax[ind] + 10;
|
||
|
|
||
|
/* Store the estimated lag in the non-downsampled domain */
|
||
|
enh_period[ENH_NBLOCKS_TOT-new_blocks+iblock] =
|
||
|
(int16_t)WEBRTC_SPL_MUL_16_16(lag, 8);
|
||
|
|
||
|
/* Store the estimated lag for backward PLC */
|
||
|
if (iLBCdec_inst->prev_enh_pl==1) {
|
||
|
if (!iblock) {
|
||
|
tlag = WEBRTC_SPL_MUL_16_16(lag, 2);
|
||
|
}
|
||
|
} else {
|
||
|
if (iblock==1) {
|
||
|
tlag = WEBRTC_SPL_MUL_16_16(lag, 2);
|
||
|
}
|
||
|
}
|
||
|
|
||
|
lag = WEBRTC_SPL_MUL_16_16(lag, 2);
|
||
|
}
|
||
|
|
||
|
if ((iLBCdec_inst->prev_enh_pl==1)||(iLBCdec_inst->prev_enh_pl==2)) {
|
||
|
|
||
|
/* Calculate the best lag of the new frame
|
||
|
This is used to interpolate backwards and mix with the PLC'd data
|
||
|
*/
|
||
|
|
||
|
/* references */
|
||
|
target=in;
|
||
|
regressor=in+tlag-1;
|
||
|
|
||
|
/* scaling */
|
||
|
max16=WebRtcSpl_MaxAbsValueW16(regressor, (int16_t)(plc_blockl+3-1));
|
||
|
if (max16>5000)
|
||
|
shifts=2;
|
||
|
else
|
||
|
shifts=0;
|
||
|
|
||
|
/* compute cross correlation */
|
||
|
WebRtcSpl_CrossCorrelation(corr32, target, regressor,
|
||
|
plc_blockl, 3, (int16_t)shifts, 1);
|
||
|
|
||
|
/* find lag */
|
||
|
lag=WebRtcSpl_MaxIndexW32(corr32, 3);
|
||
|
lag+=tlag-1;
|
||
|
|
||
|
/* Copy the backward PLC to plc_pred */
|
||
|
|
||
|
if (iLBCdec_inst->prev_enh_pl==1) {
|
||
|
if (lag>plc_blockl) {
|
||
|
WEBRTC_SPL_MEMCPY_W16(plc_pred, &in[lag-plc_blockl], plc_blockl);
|
||
|
} else {
|
||
|
WEBRTC_SPL_MEMCPY_W16(&plc_pred[plc_blockl-lag], in, lag);
|
||
|
WEBRTC_SPL_MEMCPY_W16(
|
||
|
plc_pred, &enh_buf[ENH_BUFL-iLBCdec_inst->blockl-plc_blockl+lag],
|
||
|
(plc_blockl-lag));
|
||
|
}
|
||
|
} else {
|
||
|
int pos;
|
||
|
|
||
|
pos = plc_blockl;
|
||
|
|
||
|
while (lag<pos) {
|
||
|
WEBRTC_SPL_MEMCPY_W16(&plc_pred[pos-lag], in, lag);
|
||
|
pos = pos - lag;
|
||
|
}
|
||
|
WEBRTC_SPL_MEMCPY_W16(plc_pred, &in[lag-pos], pos);
|
||
|
|
||
|
}
|
||
|
|
||
|
if (iLBCdec_inst->prev_enh_pl==1) {
|
||
|
/* limit energy change
|
||
|
if energy in backward PLC is more than 4 times higher than the forward
|
||
|
PLC, then reduce the energy in the backward PLC vector:
|
||
|
sample 1...len-16 set energy of the to 4 times forward PLC
|
||
|
sample len-15..len interpolate between 4 times fw PLC and bw PLC energy
|
||
|
|
||
|
Note: Compared to floating point code there is a slight change,
|
||
|
the window is 16 samples long instead of 10 samples to simplify the
|
||
|
calculations
|
||
|
*/
|
||
|
|
||
|
max=WebRtcSpl_MaxAbsValueW16(
|
||
|
&enh_buf[ENH_BUFL-iLBCdec_inst->blockl-plc_blockl], plc_blockl);
|
||
|
max16=WebRtcSpl_MaxAbsValueW16(plc_pred, plc_blockl);
|
||
|
max = WEBRTC_SPL_MAX(max, max16);
|
||
|
scale=22-(int16_t)WebRtcSpl_NormW32(max);
|
||
|
scale=WEBRTC_SPL_MAX(scale,0);
|
||
|
|
||
|
tmp2 = WebRtcSpl_DotProductWithScale(
|
||
|
&enh_buf[ENH_BUFL-iLBCdec_inst->blockl-plc_blockl],
|
||
|
&enh_buf[ENH_BUFL-iLBCdec_inst->blockl-plc_blockl],
|
||
|
plc_blockl, scale);
|
||
|
tmp1 = WebRtcSpl_DotProductWithScale(plc_pred, plc_pred,
|
||
|
plc_blockl, scale);
|
||
|
|
||
|
/* Check the energy difference */
|
||
|
if ((tmp1>0)&&((tmp1>>2)>tmp2)) {
|
||
|
/* EnChange is now guaranteed to be <0.5
|
||
|
Calculate EnChange=tmp2/tmp1 in Q16
|
||
|
*/
|
||
|
|
||
|
scale1=(int16_t)WebRtcSpl_NormW32(tmp1);
|
||
|
tmp1=WEBRTC_SPL_SHIFT_W32(tmp1, (scale1-16)); /* using 15 bits */
|
||
|
|
||
|
tmp2=WEBRTC_SPL_SHIFT_W32(tmp2, (scale1));
|
||
|
EnChange = (int16_t)WebRtcSpl_DivW32W16(tmp2,
|
||
|
(int16_t)tmp1);
|
||
|
|
||
|
/* Calculate the Sqrt of the energy in Q15 ((14+16)/2) */
|
||
|
SqrtEnChange = (int16_t)WebRtcSpl_SqrtFloor(
|
||
|
WEBRTC_SPL_LSHIFT_W32((int32_t)EnChange, 14));
|
||
|
|
||
|
|
||
|
/* Multiply first part of vector with 2*SqrtEnChange */
|
||
|
WebRtcSpl_ScaleVector(plc_pred, plc_pred, SqrtEnChange,
|
||
|
(int16_t)(plc_blockl-16), 14);
|
||
|
|
||
|
/* Calculate increase parameter for window part (16 last samples) */
|
||
|
/* (1-2*SqrtEnChange)/16 in Q15 */
|
||
|
inc=(2048-WEBRTC_SPL_RSHIFT_W16(SqrtEnChange, 3));
|
||
|
|
||
|
win=0;
|
||
|
tmpW16ptr=&plc_pred[plc_blockl-16];
|
||
|
|
||
|
for (i=16;i>0;i--) {
|
||
|
(*tmpW16ptr)=(int16_t)WEBRTC_SPL_MUL_16_16_RSFT(
|
||
|
(*tmpW16ptr), (SqrtEnChange+(win>>1)), 14);
|
||
|
/* multiply by (2.0*SqrtEnChange+win) */
|
||
|
|
||
|
win += inc;
|
||
|
tmpW16ptr++;
|
||
|
}
|
||
|
}
|
||
|
|
||
|
/* Make the linear interpolation between the forward PLC'd data
|
||
|
and the backward PLC'd data (from the new frame)
|
||
|
*/
|
||
|
|
||
|
if (plc_blockl==40) {
|
||
|
inc=400; /* 1/41 in Q14 */
|
||
|
} else { /* plc_blockl==80 */
|
||
|
inc=202; /* 1/81 in Q14 */
|
||
|
}
|
||
|
win=0;
|
||
|
enh_bufPtr1=&enh_buf[ENH_BUFL-1-iLBCdec_inst->blockl];
|
||
|
for (i=0; i<plc_blockl; i++) {
|
||
|
win+=inc;
|
||
|
*enh_bufPtr1 =
|
||
|
(int16_t)WEBRTC_SPL_MUL_16_16_RSFT((*enh_bufPtr1), win, 14);
|
||
|
*enh_bufPtr1 += (int16_t)WEBRTC_SPL_MUL_16_16_RSFT(
|
||
|
(16384-win), plc_pred[plc_blockl-1-i], 14);
|
||
|
enh_bufPtr1--;
|
||
|
}
|
||
|
} else {
|
||
|
int16_t *synt = &downsampled[LPC_FILTERORDER];
|
||
|
|
||
|
enh_bufPtr1=&enh_buf[ENH_BUFL-iLBCdec_inst->blockl-plc_blockl];
|
||
|
WEBRTC_SPL_MEMCPY_W16(enh_bufPtr1, plc_pred, plc_blockl);
|
||
|
|
||
|
/* Clear fileter memory */
|
||
|
WebRtcSpl_MemSetW16(iLBCdec_inst->syntMem, 0, LPC_FILTERORDER);
|
||
|
WebRtcSpl_MemSetW16(iLBCdec_inst->hpimemy, 0, 4);
|
||
|
WebRtcSpl_MemSetW16(iLBCdec_inst->hpimemx, 0, 2);
|
||
|
|
||
|
/* Initialize filter memory by filtering through 2 lags */
|
||
|
WEBRTC_SPL_MEMCPY_W16(&synt[-LPC_FILTERORDER], iLBCdec_inst->syntMem,
|
||
|
LPC_FILTERORDER);
|
||
|
WebRtcSpl_FilterARFastQ12(
|
||
|
enh_bufPtr1,
|
||
|
synt,
|
||
|
&iLBCdec_inst->old_syntdenum[
|
||
|
(iLBCdec_inst->nsub-1)*(LPC_FILTERORDER+1)],
|
||
|
LPC_FILTERORDER+1, (int16_t)lag);
|
||
|
|
||
|
WEBRTC_SPL_MEMCPY_W16(&synt[-LPC_FILTERORDER], &synt[lag-LPC_FILTERORDER],
|
||
|
LPC_FILTERORDER);
|
||
|
WebRtcIlbcfix_HpOutput(synt, (int16_t*)WebRtcIlbcfix_kHpOutCoefs,
|
||
|
iLBCdec_inst->hpimemy, iLBCdec_inst->hpimemx,
|
||
|
(int16_t)lag);
|
||
|
WebRtcSpl_FilterARFastQ12(
|
||
|
enh_bufPtr1, synt,
|
||
|
&iLBCdec_inst->old_syntdenum[
|
||
|
(iLBCdec_inst->nsub-1)*(LPC_FILTERORDER+1)],
|
||
|
LPC_FILTERORDER+1, (int16_t)lag);
|
||
|
|
||
|
WEBRTC_SPL_MEMCPY_W16(iLBCdec_inst->syntMem, &synt[lag-LPC_FILTERORDER],
|
||
|
LPC_FILTERORDER);
|
||
|
WebRtcIlbcfix_HpOutput(synt, (int16_t*)WebRtcIlbcfix_kHpOutCoefs,
|
||
|
iLBCdec_inst->hpimemy, iLBCdec_inst->hpimemx,
|
||
|
(int16_t)lag);
|
||
|
}
|
||
|
}
|
||
|
|
||
|
|
||
|
/* Perform enhancement block by block */
|
||
|
|
||
|
for (iblock = 0; iblock<new_blocks; iblock++) {
|
||
|
WebRtcIlbcfix_Enhancer(out+WEBRTC_SPL_MUL_16_16(iblock, ENH_BLOCKL),
|
||
|
enh_buf,
|
||
|
ENH_BUFL,
|
||
|
(int16_t)(WEBRTC_SPL_MUL_16_16(iblock, ENH_BLOCKL)+startPos),
|
||
|
enh_period,
|
||
|
(int16_t*)WebRtcIlbcfix_kEnhPlocs, ENH_NBLOCKS_TOT);
|
||
|
}
|
||
|
|
||
|
return (lag);
|
||
|
}
|