/*
 * Opus decoder/demuxer common functions
 * Copyright (c) 2012 Andrew D'Addesio
 * Copyright (c) 2013-2014 Mozilla Corporation
 *
 * This file is part of FFmpeg.
 *
 * FFmpeg is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * FFmpeg is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with FFmpeg; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
 */
|
||
|
|
||
|
#ifndef AVCODEC_OPUS_H
|
||
|
#define AVCODEC_OPUS_H
|
||
|
|
||
|
#include <stdint.h>
|
||
|
|
||
|
#include "libavutil/audio_fifo.h"
|
||
|
#include "libavutil/float_dsp.h"
|
||
|
#include "libavutil/frame.h"
|
||
|
|
||
|
#include "libswresample/swresample.h"
|
||
|
|
||
|
#include "avcodec.h"
|
||
|
#include "opus_rc.h"
|
||
|
|
||
|
/*
 * Opus packet limits.
 * NOTE(review): the units below are inferred from the Opus specification
 * (RFC 6716), not from this header -- confirm before relying on them.
 */
#define MAX_FRAME_SIZE               1275   /* presumably the largest size of one frame, in bytes */
#define MAX_FRAMES                   48     /* bound of the per-packet frame_offset[] / frame_size[] arrays */
#define MAX_PACKET_DUR               5760   /* presumably the longest packet, in samples @ 48kHz */
|
||
|
|
||
|
/*
 * CELT layer dimensions.
 * CELT_MAX_FRAME_SIZE is the short block size scaled by
 * 2^CELT_MAX_LOG_BLOCKS, i.e. 120 * 8 = 960.
 */
#define CELT_SHORT_BLOCKSIZE         120
#define CELT_OVERLAP                 CELT_SHORT_BLOCKSIZE   /* overlap equals one short block */
#define CELT_MAX_LOG_BLOCKS          3
#define CELT_MAX_FRAME_SIZE          (CELT_SHORT_BLOCKSIZE * (1 << CELT_MAX_LOG_BLOCKS))
#define CELT_MAX_BANDS               21
|
||
|
|
||
|
/*
 * SILK layer dimensions.
 * NOTE(review): presumably the length of the retained sample history and the
 * maximum LPC filter order -- confirm against the SILK decoder sources.
 */
#define SILK_HISTORY                 322
#define SILK_MAX_LPC                 16
|
||
|
|
||
|
/*
 * Fixed-point multiply helpers with rounding.
 * MUL64() and MUL16() are not defined in this header; they are expected to
 * be supplied by another header included before these macros are used.
 */

/*
 * Multiply a by b through MUL64(), then shift the product right by s bits,
 * rounding to nearest. The shift is done in two steps ((s) - 1 bits, add 1,
 * then one more bit), so s must be at least 1: s == 0 would shift by -1.
 */
#define ROUND_MULL(a,b,s) (((MUL64(a, b) >> ((s) - 1)) + 1) >> 1)

/*
 * Multiply a by b through MUL16(), add half of 2^15 (16384) and shift right
 * by 15 bits, i.e. a rounded product scaled down by 2^15.
 */
#define ROUND_MUL16(a,b)  ((MUL16(a, b) + 16384) >> 15)
|
||
|
|
||
|
/*
 * Header pattern and mask for a 16-bit word.
 * OPUS_TS_MASK selects the top 11 bits of the word; OPUS_TS_HEADER is the
 * 11-bit value 0x3ff placed in those bits (0x3ff << 5).
 * NOTE(review): the "TS" prefix suggests MPEG-TS encapsulation -- confirm
 * against the users of these macros.
 */
#define OPUS_TS_HEADER     0x7FE0        // 0x3ff in the top 11 bits
#define OPUS_TS_MASK       0xFFE0        // top 11 bits
|
||
|
|
||
|
/**
 * Default 30-byte extradata blob: the ASCII tag "OpusHead", one byte of
 * value 1, and 21 zero bytes.
 * NOTE(review): byte 8 is presumably the OpusHead version field -- confirm
 * against the Ogg Opus identification header layout (RFC 7845).
 */
static const uint8_t opus_default_extradata[30] = {
    'O', 'p', 'u', 's', 'H', 'e', 'a', 'd',
    1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
    0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
};
|
||
|
|
||
|
/**
 * Coding mode of an Opus packet.
 * The values are implicit and start at 0, so OPUS_MODE_NB equals the number
 * of real modes.
 */
enum OpusMode {
    OPUS_MODE_SILK,
    OPUS_MODE_HYBRID,
    OPUS_MODE_CELT,

    OPUS_MODE_NB        /* count of the modes above; must stay last */
};
|
||
|
|
||
|
/**
 * Audio bandwidth of an Opus packet, ordered from narrowest to widest.
 * The values are implicit and start at 0, so the final enumerator equals the
 * number of real bandwidths.
 */
enum OpusBandwidth {
    OPUS_BANDWIDTH_NARROWBAND,
    OPUS_BANDWIDTH_MEDIUMBAND,
    OPUS_BANDWIDTH_WIDEBAND,
    OPUS_BANDWIDTH_SUPERWIDEBAND,
    OPUS_BANDWIDTH_FULLBAND,

    /* Count of the bandwidths above; must stay last. The spelling
     * ("BANDWITH") is part of the existing interface and is kept as is. */
    OPUS_BANDWITH_NB
};
|
||
|
|
||
|
/*
 * Opaque decoder states. Only pointers to these types are used in this
 * header; the structures themselves are defined elsewhere.
 */
typedef struct SilkContext SilkContext;

typedef struct CeltFrame CeltFrame;
|
||
|
|
||
|
typedef struct OpusPacket {
|
||
|
int packet_size; /**< packet size */
|
||
|
int data_size; /**< size of the useful data -- packet size - padding */
|
||
|
int code; /**< packet code: specifies the frame layout */
|
||
|
int stereo; /**< whether this packet is mono or stereo */
|
||
|
int vbr; /**< vbr flag */
|
||
|
int config; /**< configuration: tells the audio mode,
|
||
|
** bandwidth, and frame duration */
|
||
|
int frame_count; /**< frame count */
|
||
|
int frame_offset[MAX_FRAMES]; /**< frame offsets */
|
||
|
int frame_size[MAX_FRAMES]; /**< frame sizes */
|
||
|
int frame_duration; /**< frame duration, in samples @ 48kHz */
|
||
|
enum OpusMode mode; /**< mode */
|
||
|
enum OpusBandwidth bandwidth; /**< bandwidth */
|
||
|
} OpusPacket;
|
||
|
|
||
|
typedef struct OpusStreamContext {
|
||
|
AVCodecContext *avctx;
|
||
|
int output_channels;
|
||
|
|
||
|
OpusRangeCoder rc;
|
||
|
OpusRangeCoder redundancy_rc;
|
||
|
SilkContext *silk;
|
||
|
CeltFrame *celt;
|
||
|
AVFloatDSPContext *fdsp;
|
||
|
|
||
|
float silk_buf[2][960];
|
||
|
float *silk_output[2];
|
||
|
DECLARE_ALIGNED(32, float, celt_buf)[2][960];
|
||
|
float *celt_output[2];
|
||
|
|
||
|
DECLARE_ALIGNED(32, float, redundancy_buf)[2][960];
|
||
|
float *redundancy_output[2];
|
||
|
|
||
|
/* data buffers for the final output data */
|
||
|
float *out[2];
|
||
|
int out_size;
|
||
|
|
||
|
float *out_dummy;
|
||
|
int out_dummy_allocated_size;
|
||
|
|
||
|
SwrContext *swr;
|
||
|
AVAudioFifo *celt_delay;
|
||
|
int silk_samplerate;
|
||
|
/* number of samples we still want to get from the resampler */
|
||
|
int delayed_samples;
|
||
|
|
||
|
OpusPacket packet;
|
||
|
|
||
|
int redundancy_idx;
|
||
|
} OpusStreamContext;
|
||
|
|
||
|
// a mapping between an opus stream and an output channel
typedef struct ChannelMap {
    int stream_idx;
    int channel_idx;

    // when a single decoded channel is mapped to multiple output channels, we
    // write to the first output directly and copy from it to the others
    // this field is set to 1 for those copied output channels
    int copy;
    // this is the index of the output channel to copy from
    int copy_idx;

    // this channel is silent
    int silence;
} ChannelMap;
|
||
|
|
||
|
typedef struct OpusContext {
|
||
|
AVClass *av_class;
|
||
|
OpusStreamContext *streams;
|
||
|
int apply_phase_inv;
|
||
|
|
||
|
/* current output buffers for each streams */
|
||
|
float **out;
|
||
|
int *out_size;
|
||
|
/* Buffers for synchronizing the streams when they have different
|
||
|
* resampling delays */
|
||
|
AVAudioFifo **sync_buffers;
|
||
|
/* number of decoded samples for each stream */
|
||
|
int *decoded_samples;
|
||
|
|
||
|
int nb_streams;
|
||
|
int nb_stereo_streams;
|
||
|
|
||
|
AVFloatDSPContext *fdsp;
|
||
|
int16_t gain_i;
|
||
|
float gain;
|
||
|
|
||
|
ChannelMap *channel_maps;
|
||
|
} OpusContext;
|
||
|
|
||
|
/**
 * Parse an Opus packet held in a byte buffer into an OpusPacket description.
 *
 * @param pkt            packet description to fill in
 * @param buf            input bytes (read-only)
 * @param buf_size       number of bytes available in buf
 * @param self_delimited NOTE(review): presumably non-zero when the packet
 *                       uses Opus self-delimiting framing -- confirm against
 *                       the implementation
 * @return NOTE(review): presumably 0 on success and a negative error code on
 *         failure -- the definition is not in this header
 */
int ff_opus_parse_packet(OpusPacket *pkt, const uint8_t *buf, int buf_size,
                         int self_delimited);
|
||
|
|
||
|
/**
 * Parse the codec extradata for an Opus context.
 *
 * NOTE(review): the definition is not in this header. Presumably this reads
 * the extradata attached to avctx and fills in s, returning 0 on success and
 * a negative error code on failure -- confirm against the implementation.
 */
int ff_opus_parse_extradata(AVCodecContext *avctx, OpusContext *s);
|
||
|
|
||
|
/*
 * SILK decoder state management. SilkContext is opaque in this header, so
 * callers only ever hold a pointer to it; init and free take the address of
 * that pointer.
 * NOTE(review): presumably init allocates *ps and free releases it and
 * resets it to NULL -- confirm against the SILK implementation.
 */
int  ff_silk_init(AVCodecContext *avctx, SilkContext **ps, int output_channels);
void ff_silk_free(SilkContext **ps);
void ff_silk_flush(SilkContext *s);
|
||
|
|
||
|
/**
|
||
|
* Decode the LP layer of one Opus frame (which may correspond to several SILK
|
||
|
* frames).
|
||
|
*/
|
||
|
int ff_silk_decode_superframe(SilkContext *s, OpusRangeCoder *rc,
|
||
|
float *output[2],
|
||
|
enum OpusBandwidth bandwidth, int coded_channels,
|
||
|
int duration_ms);
|
||
|
|
||
|
/* Encode or decode CELT bands */
|
||
|
void ff_celt_quant_bands(CeltFrame *f, OpusRangeCoder *rc);
|
||
|
|
||
|
/* Encode or decode CELT bitallocation */
|
||
|
void ff_celt_bitalloc(CeltFrame *f, OpusRangeCoder *rc, int encode);
|
||
|
|
||
|
#endif /* AVCODEC_OPUS_H */
|