/*
 * Copyright (c) 2012 Clément Bœsch
 *
 * This file is part of FFmpeg.
 *
 * FFmpeg is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * FFmpeg is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with FFmpeg; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
 */
|
||
|
|
||
|
#ifndef AVFORMAT_SUBTITLES_H
|
||
|
#define AVFORMAT_SUBTITLES_H
|
||
|
|
||
|
#include <stddef.h>
#include <stdint.h>
#include <string.h>

#include "avformat.h"
#include "libavutil/bprint.h"
|
||
|
|
||
|
/**
 * Ordering criteria that can be applied to queued subtitle events.
 */
enum sub_sort {
    SUB_SORT_TS_POS = 0,    ///< sort by timestamps, then position
    SUB_SORT_POS_TS,        ///< sort by position, then timestamps
};
|
||
|
|
||
|
/**
 * Source text encodings.
 * NOTE(review): presumably the values stored in FFTextReader.type - confirm.
 */
enum ff_utf_type {
    FF_UTF_8,       ///< UTF-8, or other 8 bit encodings
    FF_UTF16LE,     ///< UTF-16, little endian
    FF_UTF16BE,     ///< UTF-16, big endian
};
|
||
|
|
||
|
typedef struct {
|
||
|
int type;
|
||
|
AVIOContext *pb;
|
||
|
unsigned char buf[8];
|
||
|
int buf_pos, buf_len;
|
||
|
AVIOContext buf_pb;
|
||
|
} FFTextReader;
|
||
|
|
||
|
/**
|
||
|
* Initialize the FFTextReader from the given AVIOContext. This function will
|
||
|
* read some bytes from pb, and test for UTF-8 or UTF-16 BOMs. Further accesses
|
||
|
* to FFTextReader will read more data from pb.
|
||
|
* If s is not NULL, the user will be warned if a UTF-16 conversion takes place.
|
||
|
*
|
||
|
* The purpose of FFTextReader is to transparently convert read data to UTF-8
|
||
|
* if the stream had a UTF-16 BOM.
|
||
|
*
|
||
|
* @param s Pointer to provide av_log context
|
||
|
* @param r object which will be initialized
|
||
|
* @param pb stream to read from (referenced as long as FFTextReader is in use)
|
||
|
*/
|
||
|
void ff_text_init_avio(void *s, FFTextReader *r, AVIOContext *pb);
|
||
|
|
||
|
/**
|
||
|
* Similar to ff_text_init_avio(), but sets it up to read from a bounded buffer.
|
||
|
*
|
||
|
* @param r object which will be initialized
|
||
|
* @param buf buffer to read from (referenced as long as FFTextReader is in use)
|
||
|
* @param size size of buf
|
||
|
*/
|
||
|
void ff_text_init_buf(FFTextReader *r, void *buf, size_t size);
|
||
|
|
||
|
/**
|
||
|
* Return the byte position of the next byte returned by ff_text_r8(). For
|
||
|
* UTF-16 source streams, this will return the original position, but it will
|
||
|
* be incorrect if a codepoint was only partially read with ff_text_r8().
|
||
|
*/
|
||
|
int64_t ff_text_pos(FFTextReader *r);
|
||
|
|
||
|
/**
|
||
|
* Return the next byte. The return value is always 0 - 255. Returns 0 on EOF.
|
||
|
* If the source stream is UTF-16, this reads from the stream converted to
|
||
|
* UTF-8. On invalid UTF-16, 0 is returned.
|
||
|
*/
|
||
|
int ff_text_r8(FFTextReader *r);
|
||
|
|
||
|
/**
|
||
|
* Return non-zero if EOF was reached.
|
||
|
*/
|
||
|
int ff_text_eof(FFTextReader *r);
|
||
|
|
||
|
/**
|
||
|
* Like ff_text_r8(), but don't remove the byte from the buffer.
|
||
|
*/
|
||
|
int ff_text_peek_r8(FFTextReader *r);
|
||
|
|
||
|
/**
|
||
|
* Read the given number of bytes (in UTF-8). On error or EOF, \0 bytes are
|
||
|
* written.
|
||
|
*/
|
||
|
void ff_text_read(FFTextReader *r, char *buf, size_t size);
|
||
|
|
||
|
typedef struct {
|
||
|
AVPacket *subs; ///< array of subtitles packets
|
||
|
int nb_subs; ///< number of subtitles packets
|
||
|
int allocated_size; ///< allocated size for subs
|
||
|
int current_sub_idx; ///< current position for the read packet callback
|
||
|
enum sub_sort sort; ///< sort method to use when finalizing subtitles
|
||
|
int keep_duplicates; ///< set to 1 to keep duplicated subtitle events
|
||
|
} FFDemuxSubtitlesQueue;
|
||
|
|
||
|
/**
|
||
|
* Insert a new subtitle event.
|
||
|
*
|
||
|
* @param event the subtitle line, may not be zero terminated
|
||
|
* @param len the length of the event (in strlen() sense, so without '\0')
|
||
|
* @param merge set to 1 if the current event should be concatenated with the
|
||
|
* previous one instead of adding a new entry, 0 otherwise
|
||
|
*/
|
||
|
AVPacket *ff_subtitles_queue_insert(FFDemuxSubtitlesQueue *q,
|
||
|
const uint8_t *event, size_t len, int merge);
|
||
|
|
||
|
/**
|
||
|
* Set missing durations, sort subtitles by PTS (and then byte position), and
|
||
|
* drop duplicated events.
|
||
|
*/
|
||
|
void ff_subtitles_queue_finalize(void *log_ctx, FFDemuxSubtitlesQueue *q);
|
||
|
|
||
|
/**
|
||
|
* Generic read_packet() callback for subtitles demuxers using this queue
|
||
|
* system.
|
||
|
*/
|
||
|
int ff_subtitles_queue_read_packet(FFDemuxSubtitlesQueue *q, AVPacket *pkt);
|
||
|
|
||
|
/**
|
||
|
* Update current_sub_idx to emulate a seek. Except the first parameter, it
|
||
|
* matches AVInputFormat->read_seek2 prototypes.
|
||
|
*/
|
||
|
int ff_subtitles_queue_seek(FFDemuxSubtitlesQueue *q, AVFormatContext *s, int stream_index,
|
||
|
int64_t min_ts, int64_t ts, int64_t max_ts, int flags);
|
||
|
|
||
|
/**
|
||
|
* Remove and destroy all the subtitles packets.
|
||
|
*/
|
||
|
void ff_subtitles_queue_clean(FFDemuxSubtitlesQueue *q);
|
||
|
|
||
|
/**
|
||
|
* SMIL helper to load next chunk ("<...>" or untagged content) in buf.
|
||
|
*
|
||
|
* @param c cached character, to avoid a backward seek
|
||
|
*/
|
||
|
int ff_smil_extract_next_text_chunk(FFTextReader *tr, AVBPrint *buf, char *c);
|
||
|
|
||
|
/**
 * SMIL helper to point on the value of an attribute in the given tag.
 *
 * @param s    SMIL tag ("<...>")
 * @param attr the attribute to look for
 */
const char *ff_smil_get_attr_ptr(const char *s, const char *attr);
|
||
|
|
||
|
/**
|
||
|
* @brief Same as ff_subtitles_read_text_chunk(), but read from an AVIOContext.
|
||
|
*/
|
||
|
void ff_subtitles_read_chunk(AVIOContext *pb, AVBPrint *buf);
|
||
|
|
||
|
/**
|
||
|
* @brief Read a subtitles chunk from FFTextReader.
|
||
|
*
|
||
|
* A chunk is defined by a multiline "event", ending with a second line break.
|
||
|
* The trailing line breaks are trimmed. CRLF are supported.
|
||
|
* Example: "foo\r\nbar\r\n\r\nnext" will print "foo\r\nbar" into buf, and pb
|
||
|
* will focus on the 'n' of the "next" string.
|
||
|
*
|
||
|
* @param tr I/O context
|
||
|
* @param buf an initialized buf where the chunk is written
|
||
|
*
|
||
|
* @note buf is cleared before writing into it.
|
||
|
*/
|
||
|
void ff_subtitles_read_text_chunk(FFTextReader *tr, AVBPrint *buf);
|
||
|
|
||
|
/**
 * Get the number of characters to increment to jump to the next line, or to
 * the end of the string.
 * The function handles the following line breaks schemes:
 * LF, CRLF (MS), or standalone CR (old MacOS).
 * A run of several consecutive CR characters (optionally followed by one LF)
 * is consumed as a single line break.
 *
 * @param ptr zero terminated string, positioned anywhere inside a line
 * @return offset from ptr to the first character after the line break, or to
 *         the terminating '\0' if the string holds no line break
 */
static av_always_inline int ff_subtitles_next_line(const char *ptr)
{
    /* Length of the line content, stopping at the first CR, LF or '\0'. */
    int n = (int)strcspn(ptr, "\r\n");

    ptr += n;
    /* Skip every CR in a row ... */
    while (*ptr == '\r') {
        ptr++;
        n++;
    }
    /* ... and at most one LF after them. */
    if (*ptr == '\n')
        n++;
    return n;
}
|
||
|
|
||
|
/**
|
||
|
* Read a line of text. Discards line ending characters.
|
||
|
* The function handles the following line breaks schemes:
|
||
|
* LF, CRLF (MS), or standalone CR (old MacOS).
|
||
|
*
|
||
|
* Returns the number of bytes written to buf. Always writes a terminating 0,
|
||
|
* similar as with snprintf.
|
||
|
*
|
||
|
* @note returns a negative error code if a \0 byte is found
|
||
|
*/
|
||
|
ptrdiff_t ff_subtitles_read_line(FFTextReader *tr, char *buf, size_t size);
|
||
|
|
||
|
#endif /* AVFORMAT_SUBTITLES_H */
|