232 lines
5.9 KiB
C
232 lines
5.9 KiB
C
|
/*
|
||
|
* DCA ADPCM engine
|
||
|
* Copyright (C) 2017 Daniil Cherednik
|
||
|
*
|
||
|
* This file is part of FFmpeg.
|
||
|
*
|
||
|
* FFmpeg is free software; you can redistribute it and/or
|
||
|
* modify it under the terms of the GNU Lesser General Public
|
||
|
* License as published by the Free Software Foundation; either
|
||
|
* version 2.1 of the License, or (at your option) any later version.
|
||
|
*
|
||
|
* FFmpeg is distributed in the hope that it will be useful,
|
||
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
||
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
||
|
* Lesser General Public License for more details.
|
||
|
*
|
||
|
* You should have received a copy of the GNU Lesser General Public
|
||
|
* License along with FFmpeg; if not, write to the Free Software
|
||
|
* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
|
||
|
*/
|
||
|
|
||
|
|
||
|
#include "dcaadpcm.h"
|
||
|
#include "dcaenc.h"
|
||
|
#include "dca_core.h"
|
||
|
#include "mathops.h"
|
||
|
|
||
|
typedef int32_t premultiplied_coeffs[10];
|
||
|
|
||
|
//assume we have DCA_ADPCM_COEFFS values before x
|
||
|
static inline int64_t calc_corr(const int32_t *x, int len, int j, int k)
|
||
|
{
|
||
|
int n;
|
||
|
int64_t s = 0;
|
||
|
for (n = 0; n < len; n++)
|
||
|
s += MUL64(x[n-j], x[n-k]);
|
||
|
return s;
|
||
|
}
|
||
|
|
||
|
static inline int64_t apply_filter(const int16_t a[DCA_ADPCM_COEFFS], const int64_t corr[15], const int32_t aa[10])
|
||
|
{
|
||
|
int64_t err = 0;
|
||
|
int64_t tmp = 0;
|
||
|
|
||
|
err = corr[0];
|
||
|
|
||
|
tmp += MUL64(a[0], corr[1]);
|
||
|
tmp += MUL64(a[1], corr[2]);
|
||
|
tmp += MUL64(a[2], corr[3]);
|
||
|
tmp += MUL64(a[3], corr[4]);
|
||
|
|
||
|
tmp = norm__(tmp, 13);
|
||
|
tmp += tmp;
|
||
|
|
||
|
err -= tmp;
|
||
|
tmp = 0;
|
||
|
|
||
|
tmp += MUL64(corr[5], aa[0]);
|
||
|
tmp += MUL64(corr[6], aa[1]);
|
||
|
tmp += MUL64(corr[7], aa[2]);
|
||
|
tmp += MUL64(corr[8], aa[3]);
|
||
|
|
||
|
tmp += MUL64(corr[9], aa[4]);
|
||
|
tmp += MUL64(corr[10], aa[5]);
|
||
|
tmp += MUL64(corr[11], aa[6]);
|
||
|
|
||
|
tmp += MUL64(corr[12], aa[7]);
|
||
|
tmp += MUL64(corr[13], aa[8]);
|
||
|
|
||
|
tmp += MUL64(corr[14], aa[9]);
|
||
|
|
||
|
tmp = norm__(tmp, 26);
|
||
|
|
||
|
err += tmp;
|
||
|
|
||
|
return llabs(err);
|
||
|
}
|
||
|
|
||
|
static int64_t find_best_filter(const DCAADPCMEncContext *s, const int32_t *in, int len)
|
||
|
{
|
||
|
const premultiplied_coeffs *precalc_data = s->private_data;
|
||
|
int i, j, k = 0;
|
||
|
int vq = -1;
|
||
|
int64_t err;
|
||
|
int64_t min_err = 1ll << 62;
|
||
|
int64_t corr[15];
|
||
|
|
||
|
for (i = 0; i <= DCA_ADPCM_COEFFS; i++)
|
||
|
for (j = i; j <= DCA_ADPCM_COEFFS; j++)
|
||
|
corr[k++] = calc_corr(in+4, len, i, j);
|
||
|
|
||
|
for (i = 0; i < DCA_ADPCM_VQCODEBOOK_SZ; i++) {
|
||
|
err = apply_filter(ff_dca_adpcm_vb[i], corr, *precalc_data);
|
||
|
if (err < min_err) {
|
||
|
min_err = err;
|
||
|
vq = i;
|
||
|
}
|
||
|
precalc_data++;
|
||
|
}
|
||
|
|
||
|
return vq;
|
||
|
}
|
||
|
|
||
|
static inline int64_t calc_prediction_gain(int pred_vq, const int32_t *in, int32_t *out, int len)
|
||
|
{
|
||
|
int i;
|
||
|
int32_t error;
|
||
|
|
||
|
int64_t signal_energy = 0;
|
||
|
int64_t error_energy = 0;
|
||
|
|
||
|
for (i = 0; i < len; i++) {
|
||
|
error = in[DCA_ADPCM_COEFFS + i] - ff_dcaadpcm_predict(pred_vq, in + i);
|
||
|
out[i] = error;
|
||
|
signal_energy += MUL64(in[DCA_ADPCM_COEFFS + i], in[DCA_ADPCM_COEFFS + i]);
|
||
|
error_energy += MUL64(error, error);
|
||
|
}
|
||
|
|
||
|
if (!error_energy)
|
||
|
return -1;
|
||
|
|
||
|
return signal_energy / error_energy;
|
||
|
}
|
||
|
|
||
|
int ff_dcaadpcm_subband_analysis(const DCAADPCMEncContext *s, const int32_t *in, int len, int *diff)
|
||
|
{
|
||
|
int pred_vq, i;
|
||
|
int32_t input_buffer[16 + DCA_ADPCM_COEFFS];
|
||
|
int32_t input_buffer2[16 + DCA_ADPCM_COEFFS];
|
||
|
|
||
|
int32_t max = 0;
|
||
|
int shift_bits;
|
||
|
uint64_t pg = 0;
|
||
|
|
||
|
for (i = 0; i < len + DCA_ADPCM_COEFFS; i++)
|
||
|
max |= FFABS(in[i]);
|
||
|
|
||
|
// normalize input to simplify apply_filter
|
||
|
shift_bits = av_log2(max) - 11;
|
||
|
|
||
|
for (i = 0; i < len + DCA_ADPCM_COEFFS; i++) {
|
||
|
input_buffer[i] = norm__(in[i], 7);
|
||
|
input_buffer2[i] = norm__(in[i], shift_bits);
|
||
|
}
|
||
|
|
||
|
pred_vq = find_best_filter(s, input_buffer2, len);
|
||
|
|
||
|
if (pred_vq < 0)
|
||
|
return -1;
|
||
|
|
||
|
pg = calc_prediction_gain(pred_vq, input_buffer, diff, len);
|
||
|
|
||
|
// Greater than 10db (10*log(10)) prediction gain to use ADPCM.
|
||
|
// TODO: Tune it.
|
||
|
if (pg < 10)
|
||
|
return -1;
|
||
|
|
||
|
for (i = 0; i < len; i++)
|
||
|
diff[i] <<= 7;
|
||
|
|
||
|
return pred_vq;
|
||
|
}
|
||
|
|
||
|
static void precalc(premultiplied_coeffs *data)
|
||
|
{
|
||
|
int i, j, k;
|
||
|
|
||
|
for (i = 0; i < DCA_ADPCM_VQCODEBOOK_SZ; i++) {
|
||
|
int id = 0;
|
||
|
int32_t t = 0;
|
||
|
for (j = 0; j < DCA_ADPCM_COEFFS; j++) {
|
||
|
for (k = j; k < DCA_ADPCM_COEFFS; k++) {
|
||
|
t = (int32_t)ff_dca_adpcm_vb[i][j] * (int32_t)ff_dca_adpcm_vb[i][k];
|
||
|
if (j != k)
|
||
|
t *= 2;
|
||
|
(*data)[id++] = t;
|
||
|
}
|
||
|
}
|
||
|
data++;
|
||
|
}
|
||
|
}
|
||
|
|
||
|
int ff_dcaadpcm_do_real(int pred_vq_index,
|
||
|
softfloat quant, int32_t scale_factor, int32_t step_size,
|
||
|
const int32_t *prev_hist, const int32_t *in, int32_t *next_hist, int32_t *out,
|
||
|
int len, int32_t peak)
|
||
|
{
|
||
|
int i;
|
||
|
int64_t delta;
|
||
|
int32_t dequant_delta;
|
||
|
int32_t work_bufer[16 + DCA_ADPCM_COEFFS];
|
||
|
|
||
|
memcpy(work_bufer, prev_hist, sizeof(int32_t) * DCA_ADPCM_COEFFS);
|
||
|
|
||
|
for (i = 0; i < len; i++) {
|
||
|
work_bufer[DCA_ADPCM_COEFFS + i] = ff_dcaadpcm_predict(pred_vq_index, &work_bufer[i]);
|
||
|
|
||
|
delta = (int64_t)in[i] - ((int64_t)work_bufer[DCA_ADPCM_COEFFS + i] << 7);
|
||
|
|
||
|
out[i] = quantize_value(av_clip64(delta, -peak, peak), quant);
|
||
|
|
||
|
ff_dca_core_dequantize(&dequant_delta, &out[i], step_size, scale_factor, 0, 1);
|
||
|
|
||
|
work_bufer[DCA_ADPCM_COEFFS+i] += dequant_delta;
|
||
|
}
|
||
|
|
||
|
memcpy(next_hist, &work_bufer[len], sizeof(int32_t) * DCA_ADPCM_COEFFS);
|
||
|
|
||
|
return 0;
|
||
|
}
|
||
|
|
||
|
av_cold int ff_dcaadpcm_init(DCAADPCMEncContext *s)
|
||
|
{
|
||
|
if (!s)
|
||
|
return -1;
|
||
|
|
||
|
s->private_data = av_malloc(sizeof(premultiplied_coeffs) * DCA_ADPCM_VQCODEBOOK_SZ);
|
||
|
if (!s->private_data)
|
||
|
return AVERROR(ENOMEM);
|
||
|
|
||
|
precalc(s->private_data);
|
||
|
return 0;
|
||
|
}
|
||
|
|
||
|
av_cold void ff_dcaadpcm_free(DCAADPCMEncContext *s)
|
||
|
{
|
||
|
if (!s)
|
||
|
return;
|
||
|
|
||
|
av_freep(&s->private_data);
|
||
|
}
|