1120 lines
35 KiB
C
1120 lines
35 KiB
C
/*
|
|
* SpanDSP - a series of DSP components for telephony
|
|
*
|
|
* lpc10_decode.c - LPC10 low bit rate speech codec.
|
|
*
|
|
* Written by Steve Underwood <steveu@coppice.org>
|
|
*
|
|
* Copyright (C) 2006 Steve Underwood
|
|
*
|
|
* All rights reserved.
|
|
*
|
|
* This program is free software; you can redistribute it and/or modify
|
|
* it under the terms of the GNU Lesser General Public License version 2.1,
|
|
* as published by the Free Software Foundation.
|
|
*
|
|
* This program is distributed in the hope that it will be useful,
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
* GNU Lesser General Public License for more details.
|
|
*
|
|
* You should have received a copy of the GNU Lesser General Public
|
|
* License along with this program; if not, write to the Free Software
|
|
* Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
|
|
*
|
|
* This code is based on the U.S. Department of Defense reference
|
|
* implementation of the LPC-10 2400 bps Voice Coder. They do not
|
|
* exert copyright claims on their code, and it may be freely used.
|
|
*/
|
|
|
|
#if defined(HAVE_CONFIG_H)
|
|
#include "config.h"
|
|
#endif
|
|
|
|
#include <stdlib.h>
|
|
#include <stdio.h>
|
|
#include <inttypes.h>
|
|
#if defined(HAVE_TGMATH_H)
|
|
#include <tgmath.h>
|
|
#endif
|
|
#if defined(HAVE_MATH_H)
|
|
#include <math.h>
|
|
#endif
|
|
#include "floating_fudge.h"
|
|
#include <memory.h>
|
|
|
|
#include "spandsp/telephony.h"
|
|
#include "spandsp/fast_convert.h"
|
|
#include "spandsp/dc_restore.h"
|
|
#include "spandsp/lpc10.h"
|
|
#include "spandsp/private/lpc10.h"
|
|
|
|
#define LPC10_ORDER 10
|
|
|
|
#if !defined(min)
|
|
#define min(a,b) ((a) <= (b) ? (a) : (b))
|
|
#endif
|
|
#if !defined(max)
|
|
#define max(a,b) ((a) >= (b) ? (a) : (b))
|
|
#endif
|
|
|
|
/* Pseudo random number generator based on Knuth, Vol 2, p. 27. */
|
|
/* lpc10_random - int32_t variable, uniformly distributed over -32768 to 32767 */
|
|
static int32_t lpc10_random(lpc10_decode_state_t *s)
|
|
{
|
|
int32_t ret_val;
|
|
|
|
/* The following is a 16 bit 2's complement addition,
|
|
with overflow checking disabled */
|
|
s->y[s->k] += s->y[s->j];
|
|
ret_val = s->y[s->k];
|
|
if (--s->k < 0)
|
|
s->k = 4;
|
|
if (--s->j < 0)
|
|
s->j = 4;
|
|
return ret_val;
|
|
}
|
|
/*- End of function --------------------------------------------------------*/
|
|
|
|
static __inline__ int32_t pow_ii(int32_t x, int32_t n)
|
|
{
|
|
int32_t pow;
|
|
uint32_t u;
|
|
|
|
if (n <= 0)
|
|
{
|
|
if (n == 0 || x == 1)
|
|
return 1;
|
|
if (x != -1)
|
|
return (x != 0) ? 1/x : 0;
|
|
n = -n;
|
|
}
|
|
u = n;
|
|
for (pow = 1; ; )
|
|
{
|
|
if ((u & 1))
|
|
pow *= x;
|
|
if ((u >>= 1) == 0)
|
|
break;
|
|
x *= x;
|
|
}
|
|
return pow;
|
|
}
|
|
/*- End of function --------------------------------------------------------*/
|
|
|
|
/* Synthesize one pitch epoch */
|
|
static void bsynz(lpc10_decode_state_t *s,
|
|
float coef[],
|
|
int32_t ip,
|
|
int32_t *iv,
|
|
float sout[],
|
|
float rms,
|
|
float ratio,
|
|
float g2pass)
|
|
{
|
|
static const int32_t kexc[25] =
|
|
{
|
|
8, -16, 26, -48, 86, -162, 294, -502, 718, -728, 184,
|
|
672, -610, -672, 184, 728, 718, 502, 294, 162, 86, 48, 26, 16, 8
|
|
};
|
|
int32_t i;
|
|
int32_t j;
|
|
int32_t k;
|
|
int32_t px;
|
|
float noise[166];
|
|
float pulse;
|
|
float r1;
|
|
float gain;
|
|
float xssq;
|
|
float sscale;
|
|
float xy;
|
|
float sum;
|
|
float ssq;
|
|
float lpi0;
|
|
float hpi0;
|
|
|
|
/* MAXPIT + MAXORD = 166 */
|
|
/* Calculate history scale factor XY and scale filter state */
|
|
/* Computing MIN */
|
|
r1 = s->rmso_bsynz/(rms + 1.0e-6f);
|
|
xy = min(r1, 8.0f);
|
|
s->rmso_bsynz = rms;
|
|
for (i = 0; i < LPC10_ORDER; i++)
|
|
s->exc2[i] = s->exc2[s->ipo + i]*xy;
|
|
s->ipo = ip;
|
|
if (*iv == 0)
|
|
{
|
|
/* Generate white noise for unvoiced */
|
|
for (i = 0; i < ip; i++)
|
|
s->exc[LPC10_ORDER + i] = (float) (lpc10_random(s)/64);
|
|
/* Impulse double excitation for plosives */
|
|
px = (lpc10_random(s) + 32768)*(ip - 1)/65536 + LPC10_ORDER + 1;
|
|
r1 = ratio/4.0f;
|
|
pulse = r1*342;
|
|
if (pulse > 2.0e3f)
|
|
pulse = 2.0e3f;
|
|
s->exc[px - 1] += pulse;
|
|
s->exc[px] -= pulse;
|
|
}
|
|
else
|
|
{
|
|
sscale = sqrtf((float) ip)/6.928f;
|
|
for (i = 0; i < ip; i++)
|
|
{
|
|
s->exc[LPC10_ORDER + i] = 0.0f;
|
|
if (i < 25)
|
|
s->exc[LPC10_ORDER + i] = sscale*kexc[i];
|
|
lpi0 = s->exc[LPC10_ORDER + i];
|
|
s->exc[LPC10_ORDER + i] = s->exc[LPC10_ORDER + i]*0.125f + s->lpi[0]*0.75f + s->lpi[1]*0.125f;
|
|
s->lpi[1] = s->lpi[0];
|
|
s->lpi[0] = lpi0;
|
|
}
|
|
for (i = 0; i < ip; i++)
|
|
{
|
|
noise[LPC10_ORDER + i] = lpc10_random(s)/64.0f;
|
|
hpi0 = noise[LPC10_ORDER + i];
|
|
noise[LPC10_ORDER + i] = noise[LPC10_ORDER + i]*-0.125f + s->hpi[0]*0.25f + s->hpi[1]*-0.125f;
|
|
s->hpi[1] = s->hpi[0];
|
|
s->hpi[0] = hpi0;
|
|
}
|
|
for (i = 0; i < ip; i++)
|
|
s->exc[LPC10_ORDER + i] += noise[LPC10_ORDER + i];
|
|
}
|
|
/* Synthesis filters: */
|
|
/* Modify the excitation with all-zero filter 1 + G*SUM */
|
|
xssq = 0.0f;
|
|
for (i = 0; i < ip; i++)
|
|
{
|
|
k = LPC10_ORDER + i;
|
|
sum = 0.0f;
|
|
for (j = 0; j < LPC10_ORDER; j++)
|
|
sum += coef[j]*s->exc[k - j - 1];
|
|
sum *= g2pass;
|
|
s->exc2[k] = sum + s->exc[k];
|
|
}
|
|
/* Synthesize using the all pole filter 1/(1 - SUM) */
|
|
for (i = 0; i < ip; i++)
|
|
{
|
|
k = LPC10_ORDER + i;
|
|
sum = 0.0f;
|
|
for (j = 0; j < LPC10_ORDER; j++)
|
|
sum += coef[j]*s->exc2[k - j - 1];
|
|
s->exc2[k] = sum + s->exc2[k];
|
|
xssq += s->exc2[k]*s->exc2[k];
|
|
}
|
|
/* Save filter history for next epoch */
|
|
for (i = 0; i < LPC10_ORDER; i++)
|
|
{
|
|
s->exc[i] = s->exc[ip + i];
|
|
s->exc2[i] = s->exc2[ip + i];
|
|
}
|
|
/* Apply gain to match RMS */
|
|
ssq = rms*rms*ip;
|
|
gain = sqrtf(ssq/xssq);
|
|
for (i = 0; i < ip; i++)
|
|
sout[i] = gain*s->exc2[LPC10_ORDER + i];
|
|
}
|
|
/*- End of function --------------------------------------------------------*/
|
|
|
|
/* Synthesize a single pitch epoch */
|
|
static int pitsyn(lpc10_decode_state_t *s,
|
|
int voice[],
|
|
int32_t *pitch,
|
|
float *rms,
|
|
float *rc,
|
|
int32_t ivuv[],
|
|
int32_t ipiti[],
|
|
float *rmsi,
|
|
float *rci,
|
|
int32_t *nout,
|
|
float *ratio)
|
|
{
|
|
int32_t rci_dim1;
|
|
int32_t rci_offset;
|
|
int32_t i1;
|
|
int32_t i;
|
|
int32_t j;
|
|
int32_t vflag;
|
|
int32_t jused;
|
|
int32_t lsamp;
|
|
int32_t ip;
|
|
int32_t nl;
|
|
int32_t ivoice;
|
|
int32_t istart;
|
|
float r1;
|
|
float alrn;
|
|
float alro;
|
|
float yarc[10];
|
|
float prop;
|
|
float slope;
|
|
float uvpit;
|
|
float xxy;
|
|
float msix;
|
|
|
|
rci_dim1 = LPC10_ORDER;
|
|
rci_offset = rci_dim1 + 1;
|
|
rci -= rci_offset;
|
|
|
|
if (*rms < 1.0f)
|
|
*rms = 1.0f;
|
|
if (s->rmso < 1.0f)
|
|
s->rmso = 1.0f;
|
|
uvpit = 0.0f;
|
|
*ratio = *rms/(s->rmso + 8.0f);
|
|
if (s->first_pitsyn)
|
|
{
|
|
lsamp = 0;
|
|
ivoice = voice[1];
|
|
if (ivoice == 0)
|
|
*pitch = LPC10_SAMPLES_PER_FRAME/4;
|
|
*nout = LPC10_SAMPLES_PER_FRAME / *pitch;
|
|
s->jsamp = LPC10_SAMPLES_PER_FRAME - *nout * *pitch;
|
|
|
|
i1 = *nout;
|
|
for (i = 0; i < i1; i++)
|
|
{
|
|
for (j = 0; j < LPC10_ORDER; j++)
|
|
rci[j + (i + 1)*rci_dim1 + 1] = rc[j];
|
|
ivuv[i] = ivoice;
|
|
ipiti[i] = *pitch;
|
|
rmsi[i] = *rms;
|
|
}
|
|
s->first_pitsyn = FALSE;
|
|
}
|
|
else
|
|
{
|
|
vflag = 0;
|
|
lsamp = LPC10_SAMPLES_PER_FRAME + s->jsamp;
|
|
slope = (*pitch - s->ipito)/(float) lsamp;
|
|
*nout = 0;
|
|
jused = 0;
|
|
istart = 1;
|
|
if (voice[0] == s->ivoico && voice[1] == voice[0])
|
|
{
|
|
if (voice[1] == 0)
|
|
{
|
|
/* SSUV - - 0 , 0 , 0 */
|
|
*pitch = LPC10_SAMPLES_PER_FRAME/4;
|
|
s->ipito = *pitch;
|
|
if (*ratio > 8.0f)
|
|
s->rmso = *rms;
|
|
}
|
|
/* SSVC - - 1 , 1 , 1 */
|
|
slope = (*pitch - s->ipito)/(float) lsamp;
|
|
ivoice = voice[1];
|
|
}
|
|
else
|
|
{
|
|
if (s->ivoico != 1)
|
|
{
|
|
if (s->ivoico == voice[0])
|
|
{
|
|
/* UV2VC2 - - 0 , 0 , 1 */
|
|
nl = lsamp - LPC10_SAMPLES_PER_FRAME/4;
|
|
}
|
|
else
|
|
{
|
|
/* UV2VC1 - - 0 , 1 , 1 */
|
|
nl = lsamp - LPC10_SAMPLES_PER_FRAME*3/4;
|
|
}
|
|
ipiti[0] = nl/2;
|
|
ipiti[1] = nl - ipiti[0];
|
|
ivuv[0] = 0;
|
|
ivuv[1] = 0;
|
|
rmsi[0] = s->rmso;
|
|
rmsi[1] = s->rmso;
|
|
for (i = 0; i < LPC10_ORDER; i++)
|
|
{
|
|
rci[i + rci_dim1 + 1] = s->rco[i];
|
|
rci[i + (rci_dim1 << 1) + 1] = s->rco[i];
|
|
s->rco[i] = rc[i];
|
|
}
|
|
slope = 0.0f;
|
|
*nout = 2;
|
|
s->ipito = *pitch;
|
|
jused = nl;
|
|
istart = nl + 1;
|
|
ivoice = 1;
|
|
}
|
|
else
|
|
{
|
|
if (s->ivoico != voice[0])
|
|
{
|
|
/* VC2UV1 - - 1 , 0 , 0 */
|
|
lsamp = LPC10_SAMPLES_PER_FRAME/4 + s->jsamp;
|
|
}
|
|
else
|
|
{
|
|
/* VC2UV2 - - 1 , 1 , 0 */
|
|
lsamp = LPC10_SAMPLES_PER_FRAME*3/4 + s->jsamp;
|
|
}
|
|
for (i = 0; i < LPC10_ORDER; i++)
|
|
{
|
|
yarc[i] = rc[i];
|
|
rc[i] = s->rco[i];
|
|
}
|
|
ivoice = 1;
|
|
slope = 0.0f;
|
|
vflag = 1;
|
|
}
|
|
}
|
|
/* Here is the value of most variables that are used below, depending on */
|
|
/* the values of IVOICO, VOICE(1), and VOICE(2). VOICE(1) and VOICE(2) */
|
|
/* are input arguments, and IVOICO is the value of VOICE(2) on the */
|
|
/* previous call (see notes for the IF (NOUT .NE. 0) statement near the */
|
|
/* end). Each of these three values is either 0 or 1. These three */
|
|
/* values below are given as 3-bit long strings, in the order IVOICO, */
|
|
/* VOICE(1), and VOICE(2). It appears that the code above assumes that */
|
|
/* the bit sequences 010 and 101 never occur, but I wonder whether a */
|
|
/* large enough number of bit errors in the channel could cause such a */
|
|
/* thing to happen, and if so, could that cause NOUT to ever go over 11? */
|
|
|
|
/* Note that all of the 180 values in the table are floatly LFRAME, but */
|
|
/* 180 has fewer characters, and it makes the table a little more */
|
|
/* concrete. If LFRAME is ever changed, keep this in mind. Similarly, */
|
|
/* 135's are 3*LFRAME/4, and 45's are LFRAME/4. If LFRAME is not a */
|
|
/* multiple of 4, then the 135 for NL-JSAMP is actually LFRAME-LFRAME/4, */
|
|
/* and the 45 for NL-JSAMP is actually LFRAME-3*LFRAME/4. */
|
|
|
|
/* Note that LSAMP-JSAMP is given as the variable. This was just for */
|
|
/* brevity, to avoid adding "+JSAMP" to all of the column entries. */
|
|
/* Similarly for NL-JSAMP. */
|
|
|
|
/* Variable | 000 001 011,010 111 110 100,101 */
|
|
/* ------------+-------------------------------------------------- */
|
|
/* ISTART | 1 NL+1 NL+1 1 1 1 */
|
|
/* LSAMP-JSAMP | 180 180 180 180 135 45 */
|
|
/* IPITO | 45 PITCH PITCH oldPITCH oldPITCH oldPITCH */
|
|
/* SLOPE | 0 0 0 seebelow 0 0 */
|
|
/* JUSED | 0 NL NL 0 0 0 */
|
|
/* PITCH | 45 PITCH PITCH PITCH PITCH PITCH */
|
|
/* NL-JSAMP | -- 135 45 -- -- -- */
|
|
/* VFLAG | 0 0 0 0 1 1 */
|
|
/* NOUT | 0 2 2 0 0 0 */
|
|
/* IVOICE | 0 1 1 1 1 1 */
|
|
|
|
/* while_loop | once once once once twice twice */
|
|
|
|
/* ISTART | -- -- -- -- JUSED+1 JUSED+1 */
|
|
/* LSAMP-JSAMP | -- -- -- -- 180 180 */
|
|
/* IPITO | -- -- -- -- oldPITCH oldPITCH */
|
|
/* SLOPE | -- -- -- -- 0 0 */
|
|
/* JUSED | -- -- -- -- ?? ?? */
|
|
/* PITCH | -- -- -- -- PITCH PITCH */
|
|
/* NL-JSAMP | -- -- -- -- -- -- */
|
|
/* VFLAG | -- -- -- -- 0 0 */
|
|
/* NOUT | -- -- -- -- ?? ?? */
|
|
/* IVOICE | -- -- -- -- 0 0 */
|
|
|
|
/* UVPIT is always 0.0 on the first pass through the DO WHILE (TRUE)
|
|
loop below. */
|
|
|
|
/* The only possible non-0 value of SLOPE (in column 111) is
|
|
(PITCH-IPITO)/FLOAT(LSAMP) */
|
|
|
|
/* Column 101 is identical to 100. Any good properties we can prove
|
|
for 100 will also hold for 101. Similarly for 010 and 011. */
|
|
|
|
/* synths() calls this subroutine with PITCH restricted to the range 20 to
|
|
156. IPITO is similarly restricted to this range, after the first
|
|
call. IP below is also restricted to this range, given the
|
|
definitions of IPITO, SLOPE, UVPIT, and that I is in the range ISTART
|
|
to LSAMP. */
|
|
|
|
for (;;)
|
|
{
|
|
for (i = istart; i <= lsamp; i++)
|
|
{
|
|
r1 = s->ipito + slope*i;
|
|
ip = (int32_t) (r1 + 0.5f);
|
|
if (uvpit != 0.0f)
|
|
ip = (int32_t) uvpit;
|
|
if (ip <= i - jused)
|
|
{
|
|
++(*nout);
|
|
ipiti[*nout - 1] = ip;
|
|
*pitch = ip;
|
|
ivuv[*nout - 1] = ivoice;
|
|
jused += ip;
|
|
prop = (jused - ip/2)/(float) lsamp;
|
|
for (j = 0; j < LPC10_ORDER; j++)
|
|
{
|
|
alro = logf((s->rco[j] + 1)/(1 - s->rco[j]));
|
|
alrn = logf((rc[j] + 1)/(1 - rc[j]));
|
|
xxy = alro + prop*(alrn - alro);
|
|
xxy = expf(xxy);
|
|
rci[j + *nout*rci_dim1 + 1] = (xxy - 1.0f)/(xxy + 1.0f);
|
|
}
|
|
msix = logf(*rms) - logf(s->rmso);
|
|
msix = prop*msix;
|
|
msix = logf(s->rmso) + msix;
|
|
rmsi[*nout - 1] = expf(msix);
|
|
}
|
|
}
|
|
if (vflag != 1)
|
|
break;
|
|
|
|
vflag = 0;
|
|
istart = jused + 1;
|
|
lsamp = LPC10_SAMPLES_PER_FRAME + s->jsamp;
|
|
slope = 0.0f;
|
|
ivoice = 0;
|
|
uvpit = (float) ((lsamp - istart)/2);
|
|
if (uvpit > 90.0f)
|
|
uvpit /= 2;
|
|
s->rmso = *rms;
|
|
for (i = 0; i < LPC10_ORDER; i++)
|
|
{
|
|
rc[i] = yarc[i];
|
|
s->rco[i] = yarc[i];
|
|
}
|
|
}
|
|
s->jsamp = lsamp - jused;
|
|
}
|
|
if (*nout != 0)
|
|
{
|
|
s->ivoico = voice[1];
|
|
s->ipito = *pitch;
|
|
s->rmso = *rms;
|
|
for (i = 0; i < LPC10_ORDER; i++)
|
|
s->rco[i] = rc[i];
|
|
}
|
|
return 0;
|
|
}
|
|
/*- End of function --------------------------------------------------------*/
|
|
|
|
static void deemp(lpc10_decode_state_t *s, float x[], int len)
|
|
{
|
|
int i;
|
|
float r1;
|
|
float dei0;
|
|
|
|
for (i = 0; i < len; i++)
|
|
{
|
|
dei0 = x[i];
|
|
r1 = x[i] - s->dei[0]*1.9998f + s->dei[1];
|
|
x[i] = r1 + s->deo[0]*2.5f - s->deo[1]*2.0925f + s->deo[2]*0.585f;
|
|
s->dei[1] = s->dei[0];
|
|
s->dei[0] = dei0;
|
|
s->deo[2] = s->deo[1];
|
|
s->deo[1] = s->deo[0];
|
|
s->deo[0] = x[i];
|
|
}
|
|
}
|
|
/*- End of function --------------------------------------------------------*/
|
|
|
|
/* Convert reflection coefficients to predictor coefficients */
|
|
static float reflection_coeffs_to_predictor_coeffs(float rc[], float pc[], float gprime)
|
|
{
|
|
float temp[10];
|
|
float g2pass;
|
|
int i;
|
|
int j;
|
|
|
|
g2pass = 1.0f;
|
|
for (i = 0; i < LPC10_ORDER; i++)
|
|
g2pass *= 1.0f - rc[i]*rc[i];
|
|
g2pass = gprime*sqrtf(g2pass);
|
|
pc[0] = rc[0];
|
|
for (i = 1; i < LPC10_ORDER; i++)
|
|
{
|
|
for (j = 0; j < i; j++)
|
|
temp[j] = pc[j] - rc[i]*pc[i - j - 1];
|
|
for (j = 0; j < i; j++)
|
|
pc[j] = temp[j];
|
|
pc[i] = rc[i];
|
|
}
|
|
return g2pass;
|
|
}
|
|
/*- End of function --------------------------------------------------------*/
|
|
|
|
static int synths(lpc10_decode_state_t *s,
|
|
int voice[],
|
|
int32_t *pitch,
|
|
float *rms,
|
|
float *rc,
|
|
float speech[])
|
|
{
|
|
int32_t i1;
|
|
int32_t ivuv[16];
|
|
int32_t ipiti[16];
|
|
int32_t nout;
|
|
int32_t i;
|
|
int32_t j;
|
|
float rmsi[16];
|
|
float ratio;
|
|
float g2pass;
|
|
float pc[10];
|
|
float rci[160];
|
|
|
|
i1 = min(*pitch, 156);
|
|
*pitch = max(i1, 20);
|
|
for (i = 0; i < LPC10_ORDER; i++)
|
|
rc[i] = max(min(rc[i], 0.99f), -0.99f);
|
|
pitsyn(s, voice, pitch, rms, rc, ivuv, ipiti, rmsi, rci, &nout, &ratio);
|
|
if (nout > 0)
|
|
{
|
|
for (j = 0; j < nout; j++)
|
|
{
|
|
/* Add synthesized speech for pitch period J to the end of s->buf. */
|
|
g2pass = reflection_coeffs_to_predictor_coeffs(&rci[j*10], pc, 0.7f);
|
|
bsynz(s, pc, ipiti[j], &ivuv[j], &s->buf[s->buflen], rmsi[j], ratio, g2pass);
|
|
deemp(s, &s->buf[s->buflen], ipiti[j]);
|
|
s->buflen += ipiti[j];
|
|
}
|
|
/* Copy first MAXFRM samples from BUF to output array speech (scaling them),
|
|
and then remove them from the beginning of s->buf. */
|
|
|
|
for (i = 0; i < LPC10_SAMPLES_PER_FRAME; i++)
|
|
speech[i] = s->buf[i]/4096.0f;
|
|
s->buflen -= LPC10_SAMPLES_PER_FRAME;
|
|
for (i = 0; i < s->buflen; i++)
|
|
s->buf[i] = s->buf[i + LPC10_SAMPLES_PER_FRAME];
|
|
}
|
|
return 0;
|
|
}
|
|
/*- End of function --------------------------------------------------------*/
|
|
|
|
static void lpc10_unpack(lpc10_frame_t *t, const uint8_t ibits[])
|
|
{
|
|
static const int bit[10] =
|
|
{
|
|
2, 4, 8, 8, 8, 8, 16, 16, 16, 16
|
|
};
|
|
static const int iblist[53] =
|
|
{
|
|
13, 12, 11, 1, 2, 13, 12, 11, 1, 2,
|
|
13, 10, 11, 2, 1, 10, 13, 12, 11, 10,
|
|
2, 13, 12, 11, 10, 2, 1, 12, 7, 6,
|
|
1, 10, 9, 8, 7, 4, 6, 9, 8, 7,
|
|
5, 1, 9, 8, 4, 6, 1, 5, 9, 8,
|
|
7, 5, 6
|
|
};
|
|
int32_t itab[13];
|
|
int x;
|
|
int i;
|
|
|
|
/* ibits is 54 bits of LPC data ordered as follows: */
|
|
/* R1-0, R2-0, R3-0, P-0, A-0, */
|
|
/* R1-1, R2-1, R3-1, P-1, A-1, */
|
|
/* R1-2, R4-0, R3-2, A-2, P-2, R4-1, */
|
|
/* R1-3, R2-2, R3-3, R4-2, A-3, */
|
|
/* R1-4, R2-3, R3-4, R4-3, A-4, */
|
|
/* P-3, R2-4, R7-0, R8-0, P-4, R4-4, */
|
|
/* R5-0, R6-0, R7-1,R10-0, R8-1, */
|
|
/* R5-1, R6-1, R7-2, R9-0, P-5, */
|
|
/* R5-2, R6-2,R10-1, R8-2, P-6, R9-1, */
|
|
/* R5-3, R6-3, R7-3, R9-2, R8-3, SYNC */
|
|
|
|
/* Reconstruct ITAB */
|
|
for (i = 0; i < 13; i++)
|
|
itab[i] = 0;
|
|
for (i = 0; i < 53; i++)
|
|
{
|
|
x = 52 - i;
|
|
x = (ibits[x >> 3] >> (7 - (x & 7))) & 1;
|
|
itab[iblist[52 - i] - 1] = (itab[iblist[52 - i] - 1] << 1) | x;
|
|
}
|
|
/* Sign extend the RC's */
|
|
for (i = 0; i < LPC10_ORDER; i++)
|
|
{
|
|
if ((itab[i + 3] & bit[i]))
|
|
itab[i + 3] -= (bit[i] << 1);
|
|
}
|
|
/* Restore variables */
|
|
t->ipitch = itab[0];
|
|
t->irms = itab[1];
|
|
for (i = 0; i < LPC10_ORDER; i++)
|
|
t->irc[i] = itab[LPC10_ORDER - 1 - i + 3];
|
|
}
|
|
/*- End of function --------------------------------------------------------*/
|
|
|
|
/* Hamming 8, 4 decoder - can correct 1 out of seven bits
|
|
and can detect up to two errors. */
|
|
|
|
/* This subroutine is entered with an eight bit word in INPUT. The 8th */
|
|
/* bit is parity and is stripped off. The remaining 7 bits address the */
|
|
/* hamming 8, 4 table and the output OUTPUT from the table gives the 4 */
|
|
/* bits of corrected data. If bit 4 is set, no error was detected. */
|
|
/* ERRCNT is the number of errors counted. */
|
|
|
|
static int32_t hamming_84_decode(int32_t input, int *errcnt)
|
|
{
|
|
static const uint8_t dactab[128] =
|
|
{
|
|
16, 0, 0, 3, 0, 5, 14, 7, 0, 9, 14, 11, 14, 13, 30, 14,
|
|
0, 9, 2, 7, 4, 7, 7, 23, 9, 25, 10, 9, 12, 9, 14, 7,
|
|
0, 5, 2, 11, 5, 21, 6, 5, 8, 11, 11, 27, 12, 5, 14, 11,
|
|
2, 1, 18, 2, 12, 5, 2, 7, 12, 9, 2, 11, 28, 12, 12, 15,
|
|
0, 3, 3, 19, 4, 13, 6, 3, 8, 13, 10, 3, 13, 29, 14, 13,
|
|
4, 1, 10, 3, 20, 4, 4, 7, 10, 9, 26, 10, 4, 13, 10, 15,
|
|
8, 1, 6, 3, 6, 5, 22, 6, 24, 8, 8, 11, 8, 13, 6, 15,
|
|
1, 17 , 2, 1, 4, 1, 6, 15, 8, 1, 10, 15, 12, 15, 15, 31
|
|
};
|
|
int i;
|
|
int parity;
|
|
int32_t output;
|
|
|
|
parity = input & 255;
|
|
parity ^= parity >> 4;
|
|
parity ^= parity >> 2;
|
|
parity ^= parity >> 1;
|
|
parity &= 1;
|
|
i = dactab[input & 127];
|
|
output = i & 15;
|
|
if ((i & 16))
|
|
{
|
|
/* No errors detected in seven bits */
|
|
if (parity)
|
|
(*errcnt)++;
|
|
}
|
|
else
|
|
{
|
|
/* One or two errors detected */
|
|
(*errcnt)++;
|
|
if (parity == 0)
|
|
{
|
|
/* Two errors detected */
|
|
(*errcnt)++;
|
|
output = -1;
|
|
}
|
|
}
|
|
return output;
|
|
}
|
|
/*- End of function --------------------------------------------------------*/
|
|
|
|
static int32_t median(int32_t d1, int32_t d2, int32_t d3)
|
|
{
|
|
int32_t ret_val;
|
|
|
|
ret_val = d2;
|
|
if (d2 > d1 && d2 > d3)
|
|
{
|
|
ret_val = d1;
|
|
if (d3 > d1)
|
|
ret_val = d3;
|
|
}
|
|
else if (d2 < d1 && d2 < d3)
|
|
{
|
|
ret_val = d1;
|
|
if (d3 < d1)
|
|
ret_val = d3;
|
|
}
|
|
return ret_val;
|
|
}
|
|
/*- End of function --------------------------------------------------------*/
|
|
|
|
static void decode(lpc10_decode_state_t *s,
|
|
lpc10_frame_t *t,
|
|
int voice[],
|
|
int32_t *pitch,
|
|
float *rms,
|
|
float rc[])
|
|
{
|
|
static const int32_t ivtab[32] =
|
|
{
|
|
24960, 24960, 24960, 24960, 25480, 25480, 25483, 25480,
|
|
16640, 1560, 1560, 1560, 16640, 1816, 1563, 1560,
|
|
24960, 24960, 24859, 24856, 26001, 25881, 25915, 25913,
|
|
1560, 1560, 7800, 3640, 1561, 1561, 3643, 3641
|
|
};
|
|
static const float corth[32] =
|
|
{
|
|
32767.0f, 10.0f, 5.0f, 0.0f, 32767.0f, 8.0f, 4.0f, 0.0f,
|
|
32.0f, 6.4f, 3.2f, 0.0f, 32.0f, 6.4f, 3.2f, 0.0f,
|
|
32.0f, 11.2f, 6.4f, 0.0f, 32.0f, 11.2f, 6.4f, 0.0f,
|
|
16.0f, 5.6f, 3.2f, 0.0f, 16.0f, 5.6f, 3.2f, 0.0f
|
|
};
|
|
static const int32_t detau[128] =
|
|
{
|
|
0, 0, 0, 3, 0, 3, 3, 31,
|
|
0, 3, 3, 21, 3, 3, 29, 30,
|
|
0, 3, 3, 20, 3, 25, 27, 26,
|
|
3, 23, 58, 22, 3, 24, 28, 3,
|
|
0, 3, 3, 3, 3, 39, 33, 32,
|
|
3, 37, 35, 36, 3, 38, 34, 3,
|
|
3, 42, 46, 44, 50, 40, 48, 3,
|
|
54, 3, 56, 3, 52, 3, 3, 1,
|
|
0, 3, 3, 108, 3, 78, 100, 104,
|
|
3, 84, 92, 88, 156, 80, 96, 3,
|
|
3, 74, 70, 72, 66, 76, 68, 3,
|
|
62, 3, 60, 3, 64, 3, 3, 1,
|
|
3, 116, 132, 112, 148, 152, 3, 3,
|
|
140, 3, 136, 3, 144, 3, 3, 1,
|
|
124, 120, 128, 3, 3, 3, 3, 1,
|
|
3, 3, 3, 1, 3, 1, 1, 1
|
|
};
|
|
static const int32_t rmst[64] =
|
|
{
|
|
1024, 936, 856, 784, 718, 656, 600, 550,
|
|
502, 460, 420, 384, 352, 328, 294, 270,
|
|
246, 226, 206, 188, 172, 158, 144, 132,
|
|
120, 110, 102, 92, 84, 78, 70, 64,
|
|
60, 54, 50, 46, 42, 38, 34, 32,
|
|
30, 26, 24, 22, 20, 18, 17, 16,
|
|
15, 14, 13, 12, 11, 10, 9, 8,
|
|
7, 6, 5, 4, 3, 2, 1, 0
|
|
};
|
|
static const int32_t detab7[32] =
|
|
{
|
|
4, 11, 18, 25, 32, 39, 46, 53,
|
|
60, 66, 72, 77, 82, 87, 92, 96,
|
|
101, 104, 108, 111, 114, 115, 117, 119,
|
|
121, 122, 123, 124, 125, 126, 127, 127
|
|
};
|
|
static const float descl[8] =
|
|
{
|
|
0.6953f, 0.625f, 0.5781f, 0.5469f, 0.5312f, 0.5391f, 0.4688f, 0.3828f
|
|
};
|
|
static const int32_t deadd[8] =
|
|
{
|
|
1152, -2816, -1536, -3584, -1280, -2432, 768, -1920
|
|
};
|
|
static const int32_t qb[8] =
|
|
{
|
|
511, 511, 1023, 1023, 1023, 1023, 2047, 4095
|
|
};
|
|
static const int32_t nbit[10] =
|
|
{
|
|
8, 8, 5, 5, 4, 4, 4, 4, 3, 2
|
|
};
|
|
static const int32_t zrc[10] =
|
|
{
|
|
0, 0, 0, 0, 0, 3, 0, 2, 0, 0
|
|
};
|
|
static const int32_t bit[5] =
|
|
{
|
|
2, 4, 8, 16, 32
|
|
};
|
|
int32_t ipit;
|
|
int32_t iout;
|
|
int32_t i;
|
|
int32_t icorf;
|
|
int32_t index;
|
|
int32_t ivoic;
|
|
int32_t ixcor;
|
|
int32_t i1;
|
|
int32_t i2;
|
|
int32_t i4;
|
|
int32_t ishift;
|
|
int32_t lsb;
|
|
int errcnt;
|
|
|
|
/* If no error correction, do pitch and voicing then jump to decode */
|
|
i4 = detau[t->ipitch];
|
|
if (!s->error_correction)
|
|
{
|
|
voice[0] = 1;
|
|
voice[1] = 1;
|
|
if (t->ipitch <= 1)
|
|
voice[0] = 0;
|
|
if (t->ipitch == 0 || t->ipitch == 2)
|
|
voice[1] = 0;
|
|
if (i4 <= 4)
|
|
i4 = s->iptold;
|
|
*pitch = i4;
|
|
if (voice[0] == 1 && voice[1] == 1)
|
|
s->iptold = *pitch;
|
|
if (voice[0] != voice[1])
|
|
*pitch = s->iptold;
|
|
}
|
|
else
|
|
{
|
|
/* Do error correction pitch and voicing */
|
|
if (i4 > 4)
|
|
{
|
|
s->dpit[0] = i4;
|
|
ivoic = 2;
|
|
s->iavgp = (s->iavgp*15 + i4 + 8)/16;
|
|
}
|
|
else
|
|
{
|
|
s->dpit[0] = s->iavgp;
|
|
ivoic = i4;
|
|
}
|
|
s->drms[0] = t->irms;
|
|
for (i = 0; i < LPC10_ORDER; i++)
|
|
s->drc[i][0] = t->irc[i];
|
|
/* Determine index to IVTAB from V/UV decision */
|
|
/* If error rate is high then use alternate table */
|
|
index = (s->ivp2h << 4) + (s->iovoic << 2) + ivoic + 1;
|
|
i1 = ivtab[index - 1];
|
|
ipit = i1 & 3;
|
|
icorf = i1 >> 3;
|
|
if (s->erate < 2048)
|
|
icorf /= 64;
|
|
/* Determine error rate: 4=high 1=low */
|
|
ixcor = 4;
|
|
if (s->erate < 2048)
|
|
ixcor = 3;
|
|
if (s->erate < 1024)
|
|
ixcor = 2;
|
|
if (s->erate < 128)
|
|
ixcor = 1;
|
|
/* Voice/unvoice decision determined from bits 0 and 1 of IVTAB */
|
|
voice[0] = icorf/2 & 1;
|
|
voice[1] = icorf & 1;
|
|
/* Skip decoding on first frame because present data not yet available */
|
|
if (s->first)
|
|
{
|
|
s->first = FALSE;
|
|
/* Assign PITCH a "default" value on the first call, since */
|
|
/* otherwise it would be left uninitialized. The two lines */
|
|
/* below were copied from above, since it seemed like a */
|
|
/* reasonable thing to do for the first call. */
|
|
if (i4 <= 4)
|
|
i4 = s->iptold;
|
|
*pitch = i4;
|
|
}
|
|
else
|
|
{
|
|
/* If bit 4 of ICORF is set then correct RMS and RC(1) - RC(4). */
|
|
/* Determine error rate and correct errors using a Hamming 8,4 code */
|
|
/* during transition of unvoiced frames. If IOUT is negative, */
|
|
/* more than 1 error occurred, use previous frame's parameters. */
|
|
if ((icorf & bit[3]) != 0)
|
|
{
|
|
errcnt = 0;
|
|
lsb = s->drms[1] & 1;
|
|
index = (s->drc[7][1] << 4) + s->drms[1]/2;
|
|
iout = hamming_84_decode(index, &errcnt);
|
|
s->drms[1] = s->drms[2];
|
|
if (iout >= 0)
|
|
s->drms[1] = (iout << 1) + lsb;
|
|
for (i = 1; i <= 4; i++)
|
|
{
|
|
if (i == 1)
|
|
i1 = ((s->drc[8][1] & 7) << 1) + (s->drc[9][1] & 1);
|
|
else
|
|
i1 = s->drc[8 - i][1] & 15;
|
|
i2 = s->drc[4 - i][1] & 31;
|
|
lsb = i2 & 1;
|
|
index = (i1 << 4) + (i2 >> 1);
|
|
iout = hamming_84_decode(index, &errcnt);
|
|
if (iout >= 0)
|
|
{
|
|
iout = (iout << 1) + lsb;
|
|
if ((iout & 16) == 16)
|
|
iout -= 32;
|
|
}
|
|
else
|
|
{
|
|
iout = s->drc[4 - i][2];
|
|
}
|
|
s->drc[4 - i][1] = iout;
|
|
}
|
|
/* Determine error rate */
|
|
s->erate = (int32_t) (s->erate*0.96875f + errcnt*102.0f);
|
|
}
|
|
/* Get unsmoothed RMS, RC's, and PITCH */
|
|
t->irms = s->drms[1];
|
|
for (i = 0; i < LPC10_ORDER; i++)
|
|
t->irc[i] = s->drc[i][1];
|
|
if (ipit == 1)
|
|
s->dpit[1] = s->dpit[2];
|
|
if (ipit == 3)
|
|
s->dpit[1] = s->dpit[0];
|
|
*pitch = s->dpit[1];
|
|
/* If bit 2 of ICORF is set then smooth RMS and RC's, */
|
|
if ((icorf & bit[1]) != 0)
|
|
{
|
|
if ((float) abs(s->drms[1] - s->drms[0]) >= corth[ixcor + 3]
|
|
&&
|
|
(float) abs(s->drms[1] - s->drms[2]) >= corth[ixcor + 3])
|
|
{
|
|
t->irms = median(s->drms[2], s->drms[1], s->drms[0]);
|
|
}
|
|
for (i = 0; i < 6; i++)
|
|
{
|
|
if ((float) abs(s->drc[i][1] - s->drc[i][0]) >= corth[ixcor + ((i + 3) << 2) - 5]
|
|
&&
|
|
(float) abs(s->drc[i][1] - s->drc[i][2]) >= corth[ixcor + ((i + 3) << 2) - 5])
|
|
{
|
|
t->irc[i] = median(s->drc[i][2], s->drc[i][1], s->drc[i][0]);
|
|
}
|
|
}
|
|
}
|
|
/* If bit 3 of ICORF is set then smooth pitch */
|
|
if ((icorf & bit[2]) != 0)
|
|
{
|
|
if ((float) abs(s->dpit[1] - s->dpit[0]) >= corth[ixcor - 1]
|
|
&&
|
|
(float) abs(s->dpit[1] - s->dpit[2]) >= corth[ixcor - 1])
|
|
{
|
|
*pitch = median(s->dpit[2], s->dpit[1], s->dpit[0]);
|
|
}
|
|
}
|
|
/* If bit 5 of ICORF is set then RC(5) - RC(10) are loaded with
|
|
values so that after quantization bias is removed in decode
|
|
the values will be zero. */
|
|
}
|
|
if ((icorf & bit[4]) != 0)
|
|
{
|
|
for (i = 4; i < LPC10_ORDER; i++)
|
|
t->irc[i] = zrc[i];
|
|
}
|
|
/* Housekeeping - one frame delay */
|
|
s->iovoic = ivoic;
|
|
s->ivp2h = voice[1];
|
|
s->dpit[2] = s->dpit[1];
|
|
s->dpit[1] = s->dpit[0];
|
|
s->drms[2] = s->drms[1];
|
|
s->drms[1] = s->drms[0];
|
|
for (i = 0; i < LPC10_ORDER; i++)
|
|
{
|
|
s->drc[i][2] = s->drc[i][1];
|
|
s->drc[i][1] = s->drc[i][0];
|
|
}
|
|
}
|
|
/* Decode RMS */
|
|
t->irms = rmst[(31 - t->irms)*2];
|
|
/* Decode RC(1) and RC(2) from log-area-ratios */
|
|
/* Protect from illegal coded value (-16) caused by bit errors */
|
|
for (i = 0; i < 2; i++)
|
|
{
|
|
i2 = t->irc[i];
|
|
i1 = 0;
|
|
if (i2 < 0)
|
|
{
|
|
i1 = 1;
|
|
i2 = -i2;
|
|
if (i2 > 15)
|
|
i2 = 0;
|
|
}
|
|
i2 = detab7[i2*2];
|
|
if (i1 == 1)
|
|
i2 = -i2;
|
|
ishift = 15 - nbit[i];
|
|
t->irc[i] = i2*pow_ii(2, ishift);
|
|
}
|
|
/* Decode RC(3)-RC(10) to sign plus 14 bits */
|
|
for (i = 2; i < LPC10_ORDER; i++)
|
|
{
|
|
ishift = 15 - nbit[i];
|
|
i2 = t->irc[i]*pow_ii(2, ishift) + qb[i - 2];
|
|
t->irc[i] = (int32_t) (i2*descl[i - 2] + deadd[i - 2]);
|
|
}
|
|
/* Scale RMS and RC's to floats */
|
|
*rms = (float) t->irms;
|
|
for (i = 0; i < LPC10_ORDER; i++)
|
|
rc[i] = t->irc[i]/16384.0f;
|
|
}
|
|
/*- End of function --------------------------------------------------------*/
|
|
|
|
SPAN_DECLARE(lpc10_decode_state_t *) lpc10_decode_init(lpc10_decode_state_t *s, int error_correction)
|
|
{
|
|
static const int16_t rand_init[] =
|
|
{
|
|
-21161,
|
|
-8478,
|
|
30892,
|
|
-10216,
|
|
16950
|
|
};
|
|
int i;
|
|
int j;
|
|
|
|
if (s == NULL)
|
|
{
|
|
if ((s = (lpc10_decode_state_t *) malloc(sizeof(*s))) == NULL)
|
|
return NULL;
|
|
}
|
|
|
|
s->error_correction = error_correction;
|
|
|
|
/* State used by function decode */
|
|
s->iptold = 60;
|
|
s->first = TRUE;
|
|
s->ivp2h = 0;
|
|
s->iovoic = 0;
|
|
s->iavgp = 60;
|
|
s->erate = 0;
|
|
for (i = 0; i < 3; i++)
|
|
{
|
|
for (j = 0; j < 10; j++)
|
|
s->drc[j][i] = 0;
|
|
s->dpit[i] = 0;
|
|
s->drms[i] = 0;
|
|
}
|
|
|
|
/* State used by function synths */
|
|
for (i = 0; i < 360; i++)
|
|
s->buf[i] = 0.0f;
|
|
s->buflen = LPC10_SAMPLES_PER_FRAME;
|
|
|
|
/* State used by function pitsyn */
|
|
s->rmso = 1.0f;
|
|
s->first_pitsyn = TRUE;
|
|
|
|
/* State used by function bsynz */
|
|
s->ipo = 0;
|
|
for (i = 0; i < 166; i++)
|
|
{
|
|
s->exc[i] = 0.0f;
|
|
s->exc2[i] = 0.0f;
|
|
}
|
|
for (i = 0; i < 3; i++)
|
|
{
|
|
s->lpi[i] = 0.0f;
|
|
s->hpi[i] = 0.0f;
|
|
}
|
|
s->rmso_bsynz = 0.0f;
|
|
|
|
/* State used by function lpc10_random */
|
|
s->j = 1;
|
|
s->k = 4;
|
|
for (i = 0; i < 5; i++)
|
|
s->y[i] = rand_init[i];
|
|
|
|
/* State used by function deemp */
|
|
for (i = 0; i < 2; i++)
|
|
s->dei[i] = 0.0f;
|
|
for (i = 0; i < 3; i++)
|
|
s->deo[i] = 0.0f;
|
|
|
|
return s;
|
|
}
|
|
/*- End of function --------------------------------------------------------*/
|
|
|
|
SPAN_DECLARE(int) lpc10_decode_release(lpc10_decode_state_t *s)
|
|
{
|
|
return 0;
|
|
}
|
|
/*- End of function --------------------------------------------------------*/
|
|
|
|
SPAN_DECLARE(int) lpc10_decode_free(lpc10_decode_state_t *s)
|
|
{
|
|
free(s);
|
|
return 0;
|
|
}
|
|
/*- End of function --------------------------------------------------------*/
|
|
|
|
SPAN_DECLARE(int) lpc10_decode(lpc10_decode_state_t *s, int16_t amp[], const uint8_t code[], int len)
|
|
{
|
|
int voice[2];
|
|
int32_t pitch;
|
|
float speech[LPC10_SAMPLES_PER_FRAME];
|
|
float rc[LPC10_ORDER];
|
|
lpc10_frame_t frame;
|
|
float rms;
|
|
int i;
|
|
int j;
|
|
int base;
|
|
|
|
/* Decode 54 bits in 7 bytes to LPC10_SAMPLES_PER_FRAME speech samples. */
|
|
len /= 7;
|
|
for (i = 0; i < len; i++)
|
|
{
|
|
lpc10_unpack(&frame, &code[i*7]);
|
|
decode(s, &frame, voice, &pitch, &rms, rc);
|
|
synths(s, voice, &pitch, &rms, rc, speech);
|
|
base = i*LPC10_SAMPLES_PER_FRAME;
|
|
for (j = 0; j < LPC10_SAMPLES_PER_FRAME; j++)
|
|
amp[base + j] = (int16_t) lfastrintf(32768.0f*speech[j]);
|
|
}
|
|
|
|
return len*LPC10_SAMPLES_PER_FRAME;
|
|
}
|
|
/*- End of function --------------------------------------------------------*/
|
|
/*- End of file ------------------------------------------------------------*/
|