220 lines
7.5 KiB
C
220 lines
7.5 KiB
C
|
/*
 * RTP Depacketization of QCELP/PureVoice, RFC 2658
 * Copyright (c) 2010 Martin Storsjo
 *
 * This file is part of FFmpeg.
 *
 * FFmpeg is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * FFmpeg is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with FFmpeg; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
 */
|
||
|
|
||
|
#include "rtpdec_formats.h"
|
||
|
|
||
|
/* Frame length in bytes, indexed by the leading byte of each frame.
 * The length is used as the full copy size starting at that byte, so
 * it covers the indexing byte itself. Values outside this table are
 * rejected by the parsers below. */
static const uint8_t frame_sizes[] = { 1, 4, 8, 17, 35 };
|
||
|
|
||
|
/* Leftover frames of one RTP packet inside an interleaving group. */
typedef struct InterleavePacket {
    int pos;   /* read offset of the next unreturned frame in data[] */
    int size;  /* number of valid bytes in data[]; 0 means nothing stored */
    /* A packet carries at most 10 frames of at most 35 bytes each. The
     * first frame is handed out right away, so only the remaining
     * 9 frames ever need to be buffered here. */
    uint8_t data[9 * 35];
} InterleavePacket;
|
||
|
|
||
|
struct PayloadContext {
|
||
|
int interleave_size;
|
||
|
int interleave_index;
|
||
|
InterleavePacket group[6];
|
||
|
int group_finished;
|
||
|
|
||
|
/* The maximum packet size, 10 frames of 35 bytes each, and one
|
||
|
* packet header byte. */
|
||
|
uint8_t next_data[1 + 35*10];
|
||
|
int next_size;
|
||
|
uint32_t next_timestamp;
|
||
|
};
|
||
|
|
||
|
static int return_stored_frame(AVFormatContext *ctx, PayloadContext *data,
|
||
|
AVStream *st, AVPacket *pkt, uint32_t *timestamp,
|
||
|
const uint8_t *buf, int len);
|
||
|
|
||
|
static int store_packet(AVFormatContext *ctx, PayloadContext *data,
|
||
|
AVStream *st, AVPacket *pkt, uint32_t *timestamp,
|
||
|
const uint8_t *buf, int len)
|
||
|
{
|
||
|
int interleave_size, interleave_index;
|
||
|
int frame_size, ret;
|
||
|
InterleavePacket* ip;
|
||
|
|
||
|
if (len < 2)
|
||
|
return AVERROR_INVALIDDATA;
|
||
|
|
||
|
interleave_size = buf[0] >> 3 & 7;
|
||
|
interleave_index = buf[0] & 7;
|
||
|
|
||
|
if (interleave_size > 5) {
|
||
|
av_log(ctx, AV_LOG_ERROR, "Invalid interleave size %d\n",
|
||
|
interleave_size);
|
||
|
return AVERROR_INVALIDDATA;
|
||
|
}
|
||
|
if (interleave_index > interleave_size) {
|
||
|
av_log(ctx, AV_LOG_ERROR, "Invalid interleave index %d/%d\n",
|
||
|
interleave_index, interleave_size);
|
||
|
return AVERROR_INVALIDDATA;
|
||
|
}
|
||
|
if (interleave_size != data->interleave_size) {
|
||
|
int i;
|
||
|
/* First packet, or changed interleave size */
|
||
|
data->interleave_size = interleave_size;
|
||
|
data->interleave_index = 0;
|
||
|
for (i = 0; i < 6; i++)
|
||
|
data->group[i].size = 0;
|
||
|
}
|
||
|
|
||
|
if (interleave_index < data->interleave_index) {
|
||
|
/* Wrapped around - missed the last packet of the previous group. */
|
||
|
if (data->group_finished) {
|
||
|
/* No more data in the packets in this interleaving group, just
|
||
|
* start processing the next one */
|
||
|
data->interleave_index = 0;
|
||
|
} else {
|
||
|
/* Stash away the current packet, emit everything we have of the
|
||
|
* previous group. */
|
||
|
for (; data->interleave_index <= interleave_size;
|
||
|
data->interleave_index++)
|
||
|
data->group[data->interleave_index].size = 0;
|
||
|
|
||
|
if (len > sizeof(data->next_data))
|
||
|
return AVERROR_INVALIDDATA;
|
||
|
memcpy(data->next_data, buf, len);
|
||
|
data->next_size = len;
|
||
|
data->next_timestamp = *timestamp;
|
||
|
*timestamp = RTP_NOTS_VALUE;
|
||
|
|
||
|
data->interleave_index = 0;
|
||
|
return return_stored_frame(ctx, data, st, pkt, timestamp, buf, len);
|
||
|
}
|
||
|
}
|
||
|
if (interleave_index > data->interleave_index) {
|
||
|
/* We missed a packet */
|
||
|
for (; data->interleave_index < interleave_index;
|
||
|
data->interleave_index++)
|
||
|
data->group[data->interleave_index].size = 0;
|
||
|
}
|
||
|
data->interleave_index = interleave_index;
|
||
|
|
||
|
if (buf[1] >= FF_ARRAY_ELEMS(frame_sizes))
|
||
|
return AVERROR_INVALIDDATA;
|
||
|
frame_size = frame_sizes[buf[1]];
|
||
|
if (1 + frame_size > len)
|
||
|
return AVERROR_INVALIDDATA;
|
||
|
|
||
|
if (len - 1 - frame_size > sizeof(data->group[0].data))
|
||
|
return AVERROR_INVALIDDATA;
|
||
|
|
||
|
if ((ret = av_new_packet(pkt, frame_size)) < 0)
|
||
|
return ret;
|
||
|
memcpy(pkt->data, &buf[1], frame_size);
|
||
|
pkt->stream_index = st->index;
|
||
|
|
||
|
ip = &data->group[data->interleave_index];
|
||
|
ip->size = len - 1 - frame_size;
|
||
|
ip->pos = 0;
|
||
|
memcpy(ip->data, &buf[1 + frame_size], ip->size);
|
||
|
/* Each packet must contain the same number of frames according to the
|
||
|
* RFC. If there's no data left in this packet, there shouldn't be any
|
||
|
* in any of the other frames in the interleaving group either. */
|
||
|
data->group_finished = ip->size == 0;
|
||
|
|
||
|
if (interleave_index == interleave_size) {
|
||
|
data->interleave_index = 0;
|
||
|
return !data->group_finished;
|
||
|
} else {
|
||
|
data->interleave_index++;
|
||
|
return 0;
|
||
|
}
|
||
|
}
|
||
|
|
||
|
static int return_stored_frame(AVFormatContext *ctx, PayloadContext *data,
|
||
|
AVStream *st, AVPacket *pkt, uint32_t *timestamp,
|
||
|
const uint8_t *buf, int len)
|
||
|
{
|
||
|
InterleavePacket* ip = &data->group[data->interleave_index];
|
||
|
int frame_size, ret;
|
||
|
|
||
|
if (data->group_finished && data->interleave_index == 0) {
|
||
|
*timestamp = data->next_timestamp;
|
||
|
ret = store_packet(ctx, data, st, pkt, timestamp, data->next_data,
|
||
|
data->next_size);
|
||
|
data->next_size = 0;
|
||
|
return ret;
|
||
|
}
|
||
|
|
||
|
if (ip->size == 0) {
|
||
|
/* No stored data for this interleave block, output an empty packet */
|
||
|
if ((ret = av_new_packet(pkt, 1)) < 0)
|
||
|
return ret;
|
||
|
pkt->data[0] = 0; // Blank - could also be 14, Erasure
|
||
|
} else {
|
||
|
if (ip->pos >= ip->size)
|
||
|
return AVERROR_INVALIDDATA;
|
||
|
if (ip->data[ip->pos] >= FF_ARRAY_ELEMS(frame_sizes))
|
||
|
return AVERROR_INVALIDDATA;
|
||
|
frame_size = frame_sizes[ip->data[ip->pos]];
|
||
|
if (ip->pos + frame_size > ip->size)
|
||
|
return AVERROR_INVALIDDATA;
|
||
|
|
||
|
if ((ret = av_new_packet(pkt, frame_size)) < 0)
|
||
|
return ret;
|
||
|
memcpy(pkt->data, &ip->data[ip->pos], frame_size);
|
||
|
|
||
|
ip->pos += frame_size;
|
||
|
data->group_finished = ip->pos >= ip->size;
|
||
|
}
|
||
|
pkt->stream_index = st->index;
|
||
|
|
||
|
if (data->interleave_index == data->interleave_size) {
|
||
|
data->interleave_index = 0;
|
||
|
if (!data->group_finished)
|
||
|
return 1;
|
||
|
else
|
||
|
return data->next_size > 0;
|
||
|
} else {
|
||
|
data->interleave_index++;
|
||
|
return 1;
|
||
|
}
|
||
|
}
|
||
|
|
||
|
static int qcelp_parse_packet(AVFormatContext *ctx, PayloadContext *data,
|
||
|
AVStream *st, AVPacket *pkt, uint32_t *timestamp,
|
||
|
const uint8_t *buf, int len, uint16_t seq,
|
||
|
int flags)
|
||
|
{
|
||
|
if (buf)
|
||
|
return store_packet(ctx, data, st, pkt, timestamp, buf, len);
|
||
|
else
|
||
|
return return_stored_frame(ctx, data, st, pkt, timestamp, buf, len);
|
||
|
}
|
||
|
|
||
|
const RTPDynamicProtocolHandler ff_qcelp_dynamic_handler = {
|
||
|
.enc_name = "x-Purevoice",
|
||
|
.codec_type = AVMEDIA_TYPE_AUDIO,
|
||
|
.codec_id = AV_CODEC_ID_QCELP,
|
||
|
.priv_data_size = sizeof(PayloadContext),
|
||
|
.static_payload_id = 12,
|
||
|
.parse_packet = qcelp_parse_packet,
|
||
|
};
|