mirror of
https://github.com/nyanmisaka/ffmpeg-rockchip.git
synced 2025-10-24 17:32:22 +08:00

Signed-off-by: Vittorio Giovara <vittorio.giovara@gmail.com> Signed-off-by: James Almer <jamrial@gmail.com>
409 lines
13 KiB
C
409 lines
13 KiB
C
/*
|
|
* 4X Technologies .4xm File Demuxer (no muxer)
|
|
* Copyright (c) 2003 The FFmpeg project
|
|
*
|
|
* This file is part of FFmpeg.
|
|
*
|
|
* FFmpeg is free software; you can redistribute it and/or
|
|
* modify it under the terms of the GNU Lesser General Public
|
|
* License as published by the Free Software Foundation; either
|
|
* version 2.1 of the License, or (at your option) any later version.
|
|
*
|
|
* FFmpeg is distributed in the hope that it will be useful,
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
|
* Lesser General Public License for more details.
|
|
*
|
|
* You should have received a copy of the GNU Lesser General Public
|
|
* License along with FFmpeg; if not, write to the Free Software
|
|
* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
|
|
*/
|
|
|
|
/**
|
|
* @file
|
|
* 4X Technologies file demuxer
|
|
* by Mike Melanson (melanson@pcisys.net)
|
|
* for more information on the .4xm file format, visit:
|
|
* http://www.pcisys.net/~melanson/codecs/
|
|
*/
|
|
|
|
#include "libavutil/intreadwrite.h"
|
|
#include "libavutil/intfloat.h"
|
|
#include "libavcodec/internal.h"
|
|
#include "avformat.h"
|
|
#include "internal.h"
|
|
|
|
#define RIFF_TAG MKTAG('R', 'I', 'F', 'F')
|
|
#define FOURXMV_TAG MKTAG('4', 'X', 'M', 'V')
|
|
#define LIST_TAG MKTAG('L', 'I', 'S', 'T')
|
|
#define HEAD_TAG MKTAG('H', 'E', 'A', 'D')
|
|
#define TRK__TAG MKTAG('T', 'R', 'K', '_')
|
|
#define MOVI_TAG MKTAG('M', 'O', 'V', 'I')
|
|
#define VTRK_TAG MKTAG('V', 'T', 'R', 'K')
|
|
#define STRK_TAG MKTAG('S', 'T', 'R', 'K')
|
|
#define std__TAG MKTAG('s', 't', 'd', '_')
|
|
#define name_TAG MKTAG('n', 'a', 'm', 'e')
|
|
#define vtrk_TAG MKTAG('v', 't', 'r', 'k')
|
|
#define strk_TAG MKTAG('s', 't', 'r', 'k')
|
|
#define ifrm_TAG MKTAG('i', 'f', 'r', 'm')
|
|
#define pfrm_TAG MKTAG('p', 'f', 'r', 'm')
|
|
#define cfrm_TAG MKTAG('c', 'f', 'r', 'm')
|
|
#define ifr2_TAG MKTAG('i', 'f', 'r', '2')
|
|
#define pfr2_TAG MKTAG('p', 'f', 'r', '2')
|
|
#define cfr2_TAG MKTAG('c', 'f', 'r', '2')
|
|
#define snd__TAG MKTAG('s', 'n', 'd', '_')
|
|
|
|
#define vtrk_SIZE 0x44
|
|
#define strk_SIZE 0x28
|
|
|
|
#define GET_LIST_HEADER() \
|
|
fourcc_tag = avio_rl32(pb); \
|
|
size = avio_rl32(pb); \
|
|
if (fourcc_tag != LIST_TAG) { \
|
|
ret = AVERROR_INVALIDDATA; \
|
|
goto fail; \
|
|
} \
|
|
fourcc_tag = avio_rl32(pb);
|
|
|
|
typedef struct AudioTrack {
|
|
int sample_rate;
|
|
int bits;
|
|
int channels;
|
|
int stream_index;
|
|
int adpcm;
|
|
int64_t audio_pts;
|
|
} AudioTrack;
|
|
|
|
typedef struct FourxmDemuxContext {
|
|
int video_stream_index;
|
|
int track_count;
|
|
AudioTrack *tracks;
|
|
|
|
int64_t video_pts;
|
|
AVRational fps;
|
|
} FourxmDemuxContext;
|
|
|
|
static int fourxm_probe(const AVProbeData *p)
|
|
{
|
|
if ((AV_RL32(&p->buf[0]) != RIFF_TAG) ||
|
|
(AV_RL32(&p->buf[8]) != FOURXMV_TAG))
|
|
return 0;
|
|
|
|
return AVPROBE_SCORE_MAX;
|
|
}
|
|
|
|
static int parse_vtrk(AVFormatContext *s,
|
|
FourxmDemuxContext *fourxm, uint8_t *buf, int size,
|
|
int left)
|
|
{
|
|
AVStream *st;
|
|
/* check that there is enough data */
|
|
if (size != vtrk_SIZE || left < size + 8) {
|
|
return AVERROR_INVALIDDATA;
|
|
}
|
|
|
|
/* allocate a new AVStream */
|
|
st = avformat_new_stream(s, NULL);
|
|
if (!st)
|
|
return AVERROR(ENOMEM);
|
|
|
|
avpriv_set_pts_info(st, 60, fourxm->fps.den, fourxm->fps.num);
|
|
|
|
fourxm->video_stream_index = st->index;
|
|
|
|
st->codecpar->codec_type = AVMEDIA_TYPE_VIDEO;
|
|
st->codecpar->codec_id = AV_CODEC_ID_4XM;
|
|
|
|
st->codecpar->extradata = av_mallocz(4 + AV_INPUT_BUFFER_PADDING_SIZE);
|
|
if (!st->codecpar->extradata)
|
|
return AVERROR(ENOMEM);
|
|
st->codecpar->extradata_size = 4;
|
|
AV_WL32(st->codecpar->extradata, AV_RL32(buf + 16));
|
|
st->codecpar->width = AV_RL32(buf + 36);
|
|
st->codecpar->height = AV_RL32(buf + 40);
|
|
|
|
return 0;
|
|
}
|
|
|
|
|
|
static int parse_strk(AVFormatContext *s,
|
|
FourxmDemuxContext *fourxm, uint8_t *buf, int size,
|
|
int left)
|
|
{
|
|
AVStream *st;
|
|
int track;
|
|
/* check that there is enough data */
|
|
if (size != strk_SIZE || left < size + 8)
|
|
return AVERROR_INVALIDDATA;
|
|
|
|
track = AV_RL32(buf + 8);
|
|
if ((unsigned)track >= UINT_MAX / sizeof(AudioTrack) - 1 ||
|
|
track >= s->max_streams) {
|
|
av_log(s, AV_LOG_ERROR, "current_track too large\n");
|
|
return AVERROR_INVALIDDATA;
|
|
}
|
|
|
|
if (track + 1 > fourxm->track_count) {
|
|
if (av_reallocp_array(&fourxm->tracks, track + 1, sizeof(AudioTrack)))
|
|
return AVERROR(ENOMEM);
|
|
memset(&fourxm->tracks[fourxm->track_count], 0,
|
|
sizeof(AudioTrack) * (track + 1 - fourxm->track_count));
|
|
fourxm->track_count = track + 1;
|
|
} else {
|
|
if (fourxm->tracks[track].bits)
|
|
return AVERROR_INVALIDDATA;
|
|
}
|
|
fourxm->tracks[track].adpcm = AV_RL32(buf + 12);
|
|
fourxm->tracks[track].channels = AV_RL32(buf + 36);
|
|
fourxm->tracks[track].sample_rate = AV_RL32(buf + 40);
|
|
fourxm->tracks[track].bits = AV_RL32(buf + 44);
|
|
fourxm->tracks[track].audio_pts = 0;
|
|
|
|
if (fourxm->tracks[track].channels <= 0 ||
|
|
fourxm->tracks[track].channels > FF_SANE_NB_CHANNELS ||
|
|
fourxm->tracks[track].sample_rate <= 0 ||
|
|
fourxm->tracks[track].bits <= 0 ||
|
|
fourxm->tracks[track].bits > INT_MAX / FF_SANE_NB_CHANNELS) {
|
|
av_log(s, AV_LOG_ERROR, "audio header invalid\n");
|
|
return AVERROR_INVALIDDATA;
|
|
}
|
|
if (!fourxm->tracks[track].adpcm && fourxm->tracks[track].bits<8) {
|
|
av_log(s, AV_LOG_ERROR, "bits unspecified for non ADPCM\n");
|
|
return AVERROR_INVALIDDATA;
|
|
}
|
|
|
|
if (fourxm->tracks[track].sample_rate > INT64_MAX / fourxm->tracks[track].bits / fourxm->tracks[track].channels) {
|
|
av_log(s, AV_LOG_ERROR, "Overflow during bit rate calculation %d * %d * %d\n",
|
|
fourxm->tracks[track].sample_rate, fourxm->tracks[track].bits, fourxm->tracks[track].channels);
|
|
return AVERROR_INVALIDDATA;
|
|
}
|
|
|
|
/* allocate a new AVStream */
|
|
st = avformat_new_stream(s, NULL);
|
|
if (!st)
|
|
return AVERROR(ENOMEM);
|
|
|
|
st->id = track;
|
|
avpriv_set_pts_info(st, 60, 1, fourxm->tracks[track].sample_rate);
|
|
|
|
fourxm->tracks[track].stream_index = st->index;
|
|
|
|
st->codecpar->codec_type = AVMEDIA_TYPE_AUDIO;
|
|
st->codecpar->codec_tag = 0;
|
|
st->codecpar->ch_layout.nb_channels = fourxm->tracks[track].channels;
|
|
st->codecpar->sample_rate = fourxm->tracks[track].sample_rate;
|
|
st->codecpar->bits_per_coded_sample = fourxm->tracks[track].bits;
|
|
st->codecpar->bit_rate = (int64_t)st->codecpar->ch_layout.nb_channels *
|
|
st->codecpar->sample_rate *
|
|
st->codecpar->bits_per_coded_sample;
|
|
st->codecpar->block_align = st->codecpar->ch_layout.nb_channels *
|
|
st->codecpar->bits_per_coded_sample;
|
|
|
|
if (fourxm->tracks[track].adpcm){
|
|
st->codecpar->codec_id = AV_CODEC_ID_ADPCM_4XM;
|
|
} else if (st->codecpar->bits_per_coded_sample == 8) {
|
|
st->codecpar->codec_id = AV_CODEC_ID_PCM_U8;
|
|
} else
|
|
st->codecpar->codec_id = AV_CODEC_ID_PCM_S16LE;
|
|
|
|
return 0;
|
|
}
|
|
|
|
static int fourxm_read_header(AVFormatContext *s)
|
|
{
|
|
AVIOContext *pb = s->pb;
|
|
unsigned int fourcc_tag;
|
|
unsigned int size;
|
|
int header_size;
|
|
FourxmDemuxContext *fourxm = s->priv_data;
|
|
unsigned char *header = NULL;
|
|
int i, ret;
|
|
|
|
fourxm->track_count = 0;
|
|
fourxm->tracks = NULL;
|
|
fourxm->fps = (AVRational){1,1};
|
|
fourxm->video_stream_index = -1;
|
|
|
|
/* skip the first 3 32-bit numbers */
|
|
avio_skip(pb, 12);
|
|
|
|
/* check for LIST-HEAD */
|
|
GET_LIST_HEADER();
|
|
header_size = size - 4;
|
|
if (fourcc_tag != HEAD_TAG || header_size < 0)
|
|
return AVERROR_INVALIDDATA;
|
|
|
|
/* allocate space for the header and load the whole thing */
|
|
header = av_malloc(header_size);
|
|
if (!header)
|
|
return AVERROR(ENOMEM);
|
|
if (avio_read(pb, header, header_size) != header_size) {
|
|
av_free(header);
|
|
return AVERROR(EIO);
|
|
}
|
|
|
|
/* take the lazy approach and search for any and all vtrk and strk chunks */
|
|
for (i = 0; i < header_size - 8; i++) {
|
|
fourcc_tag = AV_RL32(&header[i]);
|
|
size = AV_RL32(&header[i + 4]);
|
|
if (size > header_size - i - 8 && (fourcc_tag == vtrk_TAG || fourcc_tag == strk_TAG)) {
|
|
av_log(s, AV_LOG_ERROR, "chunk larger than array %d>%d\n", size, header_size - i - 8);
|
|
ret = AVERROR_INVALIDDATA;
|
|
goto fail;
|
|
}
|
|
|
|
if (fourcc_tag == std__TAG) {
|
|
if (header_size - i < 16) {
|
|
av_log(s, AV_LOG_ERROR, "std TAG truncated\n");
|
|
ret = AVERROR_INVALIDDATA;
|
|
goto fail;
|
|
}
|
|
fourxm->fps = av_d2q(av_int2float(AV_RL32(&header[i + 12])), 10000);
|
|
} else if (fourcc_tag == vtrk_TAG) {
|
|
if ((ret = parse_vtrk(s, fourxm, header + i, size,
|
|
header_size - i)) < 0)
|
|
goto fail;
|
|
|
|
i += 8 + size;
|
|
} else if (fourcc_tag == strk_TAG) {
|
|
if ((ret = parse_strk(s, fourxm, header + i, size,
|
|
header_size - i)) < 0)
|
|
goto fail;
|
|
|
|
i += 8 + size;
|
|
}
|
|
}
|
|
|
|
/* skip over the LIST-MOVI chunk (which is where the stream should be */
|
|
GET_LIST_HEADER();
|
|
if (fourcc_tag != MOVI_TAG) {
|
|
ret = AVERROR_INVALIDDATA;
|
|
goto fail;
|
|
}
|
|
|
|
av_free(header);
|
|
/* initialize context members */
|
|
fourxm->video_pts = -1; /* first frame will push to 0 */
|
|
|
|
return 0;
|
|
fail:
|
|
av_free(header);
|
|
return ret;
|
|
}
|
|
|
|
static int fourxm_read_packet(AVFormatContext *s,
|
|
AVPacket *pkt)
|
|
{
|
|
FourxmDemuxContext *fourxm = s->priv_data;
|
|
AVIOContext *pb = s->pb;
|
|
unsigned int fourcc_tag;
|
|
unsigned int size;
|
|
int ret = 0;
|
|
unsigned int track_number;
|
|
int packet_read = 0;
|
|
unsigned char header[8];
|
|
int64_t audio_frame_count;
|
|
|
|
while (!packet_read) {
|
|
if ((ret = avio_read(s->pb, header, 8)) < 0)
|
|
return ret;
|
|
fourcc_tag = AV_RL32(&header[0]);
|
|
size = AV_RL32(&header[4]);
|
|
if (avio_feof(pb))
|
|
return AVERROR(EIO);
|
|
switch (fourcc_tag) {
|
|
case LIST_TAG:
|
|
/* this is a good time to bump the video pts */
|
|
fourxm->video_pts++;
|
|
|
|
/* skip the LIST-* tag and move on to the next fourcc */
|
|
avio_rl32(pb);
|
|
break;
|
|
|
|
case ifrm_TAG:
|
|
case pfrm_TAG:
|
|
case cfrm_TAG:
|
|
case ifr2_TAG:
|
|
case pfr2_TAG:
|
|
case cfr2_TAG:
|
|
/* allocate 8 more bytes than 'size' to account for fourcc
|
|
* and size */
|
|
if (size > INT_MAX - AV_INPUT_BUFFER_PADDING_SIZE - 8)
|
|
return AVERROR_INVALIDDATA;
|
|
if (fourxm->video_stream_index < 0)
|
|
return AVERROR_INVALIDDATA;
|
|
if ((ret = av_new_packet(pkt, size + 8)) < 0)
|
|
return ret;
|
|
pkt->stream_index = fourxm->video_stream_index;
|
|
pkt->pts = fourxm->video_pts;
|
|
pkt->pos = avio_tell(s->pb);
|
|
memcpy(pkt->data, header, 8);
|
|
ret = avio_read(s->pb, &pkt->data[8], size);
|
|
|
|
if (ret < 0) {
|
|
av_packet_unref(pkt);
|
|
} else {
|
|
packet_read = 1;
|
|
av_shrink_packet(pkt, ret + 8);
|
|
}
|
|
break;
|
|
|
|
case snd__TAG:
|
|
track_number = avio_rl32(pb);
|
|
avio_skip(pb, 4);
|
|
size -= 8;
|
|
|
|
if (track_number < fourxm->track_count &&
|
|
fourxm->tracks[track_number].channels > 0) {
|
|
ret = av_get_packet(s->pb, pkt, size);
|
|
if (ret < 0)
|
|
return ret;
|
|
pkt->stream_index =
|
|
fourxm->tracks[track_number].stream_index;
|
|
pkt->pts = fourxm->tracks[track_number].audio_pts;
|
|
packet_read = 1;
|
|
|
|
/* pts accounting */
|
|
audio_frame_count = size;
|
|
if (fourxm->tracks[track_number].adpcm)
|
|
audio_frame_count -= 2 * (fourxm->tracks[track_number].channels);
|
|
audio_frame_count /= fourxm->tracks[track_number].channels;
|
|
if (fourxm->tracks[track_number].adpcm) {
|
|
audio_frame_count *= 2;
|
|
} else
|
|
audio_frame_count /=
|
|
(fourxm->tracks[track_number].bits / 8);
|
|
fourxm->tracks[track_number].audio_pts += audio_frame_count;
|
|
} else {
|
|
avio_skip(pb, size);
|
|
}
|
|
break;
|
|
|
|
default:
|
|
avio_skip(pb, size);
|
|
break;
|
|
}
|
|
}
|
|
return ret;
|
|
}
|
|
|
|
static int fourxm_read_close(AVFormatContext *s)
|
|
{
|
|
FourxmDemuxContext *fourxm = s->priv_data;
|
|
|
|
av_freep(&fourxm->tracks);
|
|
|
|
return 0;
|
|
}
|
|
|
|
const AVInputFormat ff_fourxm_demuxer = {
|
|
.name = "4xm",
|
|
.long_name = NULL_IF_CONFIG_SMALL("4X Technologies"),
|
|
.priv_data_size = sizeof(FourxmDemuxContext),
|
|
.flags_internal = FF_FMT_INIT_CLEANUP,
|
|
.read_probe = fourxm_probe,
|
|
.read_header = fourxm_read_header,
|
|
.read_packet = fourxm_read_packet,
|
|
.read_close = fourxm_read_close,
|
|
};
|