You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
 
 
 
 
 
 

423 lines
11 KiB

#include "decoder.h"
#include <libavcodec/avcodec.h>
#include <libavformat/avformat.h>
#include <libavutil/audio_fifo.h>
#include <libavutil/channel_layout.h>
#include <glib.h>
#include <stdint.h>
#include "types.h"
#include "log.h"
#include "str.h"
struct decoder_s {
AVCodecContext *avcctx;
AVPacket avpkt;
AVFrame *frame;
unsigned long rtp_ts;
uint64_t pts;
};
struct output_s {
char *filename;
// format params
int clockrate;
int channels;
AVCodecContext *avcctx;
AVFormatContext *fmtctx;
AVStream *avst;
AVPacket avpkt;
AVAudioFifo *fifo;
int64_t fifo_pts; // pts of first data in fifo
int64_t mux_dts; // last dts passed to muxer
AVFrame *frame;
};
struct decoder_def_s {
const char *rtpname;
int clockrate_mult;
int avcodec_id;
const char *avcodec_name;
};
#define DECODER_DEF_MULT_NAME(ref, id, mult, name) { \
.rtpname = #ref, \
.avcodec_id = AV_CODEC_ID_ ## id, \
.clockrate_mult = mult, \
.avcodec_name = #name, \
}
#define DECODER_DEF_MULT(ref, id, mult) DECODER_DEF_MULT_NAME(ref, id, mult, NULL)
#define DECODER_DEF_NAME(ref, id, name) DECODER_DEF_MULT_NAME(ref, id, 1, name)
#define DECODER_DEF(ref, id) DECODER_DEF_MULT(ref, id, 1)
static const struct decoder_def_s decoders[] = {
DECODER_DEF(PCMA, PCM_ALAW),
DECODER_DEF(PCMU, PCM_MULAW),
DECODER_DEF(G723, G723_1),
DECODER_DEF_MULT(G722, ADPCM_G722, 2),
DECODER_DEF(QCELP, QCELP),
DECODER_DEF(G729, G729),
DECODER_DEF(speex, SPEEX),
DECODER_DEF(GSM, GSM),
DECODER_DEF(iLBC, ILBC),
DECODER_DEF_NAME(opus, OPUS, libopus),
DECODER_DEF_NAME(vorbis, VORBIS, libvorbis),
DECODER_DEF(ac3, AC3),
DECODER_DEF(eac3, EAC3),
DECODER_DEF(ATRAC3, ATRAC3),
DECODER_DEF(ATRAC-X, ATRAC3P),
#if LIBAVCODEC_VERSION_INT >= AV_VERSION_INT(57, 0, 0)
DECODER_DEF(EVRC, EVRC),
DECODER_DEF(EVRC0, EVRC),
DECODER_DEF(EVRC1, EVRC),
#endif
DECODER_DEF(AMR, AMR_NB),
DECODER_DEF(AMR-WB, AMR_WB),
};
typedef struct decoder_def_s decoder_def_t;
static int output_codec_id;
static const char *output_file_format;
static void output_shutdown(output_t *output);
static int output_config(output_t *output, unsigned int clockrate, unsigned int channels);
static const decoder_def_t *decoder_find(const str *name) {
for (int i = 0; i < G_N_ELEMENTS(decoders); i++) {
if (!str_cmp(name, decoders[i].rtpname))
return &decoders[i];
}
return NULL;
}
decoder_t *decoder_new(const char *payload_str) {
str name;
char *slash = strchr(payload_str, '/');
if (!slash) {
ilog(LOG_WARN, "Invalid payload format: %s", payload_str);
return NULL;
}
str_init_len(&name, (char *) payload_str, slash - payload_str);
int clockrate = atoi(slash + 1);
int channels = 1;
slash = strchr(slash + 1, '/');
if (slash) {
channels = atoi(slash + 1);
if (!channels)
channels = 1;
}
const decoder_def_t *def = decoder_find(&name);
if (!def) {
ilog(LOG_WARN, "No decoder for payload %s", payload_str);
return NULL;
}
clockrate *= def->clockrate_mult;
decoder_t *ret = g_slice_alloc0(sizeof(*ret));
// XXX error reporting
AVCodec *codec = NULL;
if (def->avcodec_name)
codec = avcodec_find_decoder_by_name(def->avcodec_name);
if (!codec)
codec = avcodec_find_decoder(def->avcodec_id);
ret->avcctx = avcodec_alloc_context3(codec);
if (!ret->avcctx)
goto err;
ret->avcctx->channels = channels;
ret->avcctx->sample_rate = clockrate;
int i = avcodec_open2(ret->avcctx, codec, NULL);
if (i)
goto err;
av_init_packet(&ret->avpkt);
ret->frame = av_frame_alloc();
if (!ret->frame)
goto err;
ret->pts = (uint64_t) -1LL;
ret->rtp_ts = (unsigned long) -1L;
return ret;
err:
decoder_close(ret);
return NULL;
}
static int output_flush(output_t *output) {
while (av_audio_fifo_size(output->fifo) >= output->frame->nb_samples) {
if (av_audio_fifo_read(output->fifo, (void **) output->frame->data,
output->frame->nb_samples) <= 0)
abort();
dbg("%p output fifo pts %lu", output, (unsigned long) output->fifo_pts);
output->frame->pts = output->fifo_pts;
#if LIBAVCODEC_VERSION_INT >= AV_VERSION_INT(57, 0, 0)
int ret = avcodec_send_frame(output->avcctx, output->frame);
dbg("%p send frame ret %i", output, ret);
if (ret)
return -1;
ret = avcodec_receive_packet(output->avcctx, &output->avpkt);
dbg("%p receive packet ret %i", output, ret);
if (ret)
return -1;
#else
int got_packet = 0;
int ret = avcodec_encode_audio2(output->avcctx, &output->avpkt, output->frame, &got_packet);
dbg("%p encode frame ret %i, got packet %i", output, ret, got_packet);
if (!got_packet)
return 0;
#endif
dbg("%p output avpkt size is %i", output, (int) output->avpkt.size);
dbg("%p output pkt pts/dts is %li/%li", output, (long) output->avpkt.pts,
(long) output->avpkt.dts);
dbg("%p output dts %li", output, (long) output->mux_dts);
// the encoder may return frames with the same dts multiple consecutive times.
// the muxer may not like this, so ensure monotonically increasing dts.
if (output->mux_dts > output->avpkt.dts)
output->avpkt.dts = output->mux_dts;
if (output->avpkt.pts < output->avpkt.dts)
output->avpkt.pts = output->avpkt.dts;
av_write_frame(output->fmtctx, &output->avpkt);
output->fifo_pts += output->frame->nb_samples;
output->mux_dts = output->avpkt.dts + 1; // min next expected dts
}
return 0;
}
static int output_add(output_t *output, AVFrame *frame) {
if (!output)
return -1;
dbg("%p output fifo size %u fifo_pts %lu", output, (unsigned int) av_audio_fifo_size(output->fifo),
(unsigned long) output->fifo_pts);
// fix up output pts
if (av_audio_fifo_size(output->fifo) == 0)
output->fifo_pts = frame->pts;
if (av_audio_fifo_write(output->fifo, (void **) frame->extended_data, frame->nb_samples) < 0)
return -1;
return output_flush(output);
}
int decoder_input(decoder_t *dec, const str *data, unsigned long ts, output_t *output) {
if (G_UNLIKELY(!dec))
return -1;
dbg("%p dec pts %lu rtp_ts %lu incoming ts %lu", dec, (unsigned long) dec->pts,
(unsigned long) dec->rtp_ts, (unsigned long) ts);
if (G_UNLIKELY(dec->rtp_ts == (unsigned long) -1L)) {
// initialize pts
dec->pts = 0;
}
else {
// shift pts according to rtp ts shift
dec->pts += (ts - dec->rtp_ts) /* * output->avst->time_base.num * 8000 / output->avst->time_base.den */ ;
// XXX handle lost packets here if timestamps don't line up?
}
dec->rtp_ts = ts;
dec->avpkt.data = (unsigned char *) data->s;
dec->avpkt.size = data->len;
dec->avpkt.pts = dec->pts;
#if LIBAVCODEC_VERSION_INT >= AV_VERSION_INT(57, 0, 0)
int ret = avcodec_send_packet(dec->avcctx, &dec->avpkt);
dbg("send packet ret %i", ret);
if (ret)
return -1;
ret = avcodec_receive_frame(dec->avcctx, dec->frame);
dbg("receive frame ret %i", ret);
if (ret)
return -1;
#else
int got_frame = 0;
int ret = avcodec_decode_audio4(dec->avcctx, dec->frame, &got_frame, &dec->avpkt);
dbg("decode frame ret %i, got frame %i", ret, got_frame);
if (!got_frame)
return 0;
#endif
dec->frame->pts = dec->frame->pkt_pts;
dbg("%p dec frame pts %lu pkt_pts %lu", dec, (unsigned long) dec->frame->pts,
(unsigned long) dec->frame->pkt_dts);
output_config(output, dec->avcctx->sample_rate, dec->avcctx->channels);
if (output_add(output, dec->frame))
return -1;
return 0;
}
output_t *output_new(const char *filename) {
output_t *ret = g_slice_alloc0(sizeof(*ret));
if (asprintf(&ret->filename, "%s.%s", filename, output_file_format) <= 0)
abort();
ret->clockrate = -1;
ret->channels = -1;
ret->frame = av_frame_alloc();
return ret;
}
static int output_config(output_t *output, unsigned int clockrate, unsigned int channels) {
// anything to do?
if (G_UNLIKELY(output->clockrate != clockrate))
goto format_mismatch;
if (G_UNLIKELY(output->channels != channels))
goto format_mismatch;
// all good
return 0;
format_mismatch:
// XXX support reset/config change
// copy params
output->clockrate = clockrate;
output->channels = channels;
// XXX error reporting
output->fmtctx = avformat_alloc_context();
if (!output->fmtctx)
goto err;
output->fmtctx->oformat = av_guess_format(output_file_format, NULL, NULL);
if (!output->fmtctx->oformat)
goto err;
AVCodec *codec = avcodec_find_encoder(output_codec_id);
// XXX error handling
output->avst = avformat_new_stream(output->fmtctx, codec);
if (!output->avst)
goto err;
#if LIBAVCODEC_VERSION_INT >= AV_VERSION_INT(57, 0, 0)
output->avcctx = avcodec_alloc_context3(codec);
if (!output->avcctx)
goto err;
#else
output->avcctx = output->avst->codec;
#endif
output->avcctx->channels = output->channels;
output->avcctx->channel_layout = av_get_default_channel_layout(output->channels);
output->avcctx->sample_rate = output->clockrate;
output->avcctx->sample_fmt = AV_SAMPLE_FMT_S16;
output->avcctx->time_base = (AVRational){output->clockrate,1};
output->avst->time_base = output->avcctx->time_base;
#if LIBAVCODEC_VERSION_INT >= AV_VERSION_INT(57, 0, 0)
avcodec_parameters_from_context(output->avst->codecpar, output->avcctx);
#endif
int i = avcodec_open2(output->avcctx, codec, NULL);
if (i)
goto err;
i = avio_open(&output->fmtctx->pb, output->filename, AVIO_FLAG_WRITE);
if (i < 0)
goto err;
i = avformat_write_header(output->fmtctx, NULL);
if (i)
goto err;
av_init_packet(&output->avpkt);
// output frame and fifo
output->frame->nb_samples = output->avcctx->frame_size ? : 256;
output->frame->format = output->avcctx->sample_fmt;
output->frame->sample_rate = output->avcctx->sample_rate;
output->frame->channel_layout = output->avcctx->channel_layout;
if (!output->frame->channel_layout)
output->frame->channel_layout = av_get_default_channel_layout(output->avcctx->channels);
if (av_frame_get_buffer(output->frame, 0) < 0)
abort();
output->fifo = av_audio_fifo_alloc(output->avcctx->sample_fmt, output->avcctx->channels,
output->frame->nb_samples);
return 0;
err:
output_shutdown(output);
return -1;
}
void decoder_close(decoder_t *dec) {
if (!dec)
return;
avcodec_free_context(&dec->avcctx);
av_frame_free(&dec->frame);
g_slice_free1(sizeof(*dec), dec);
}
static void output_shutdown(output_t *output) {
if (!output)
return;
av_write_trailer(output->fmtctx);
avcodec_close(output->avcctx);
avio_closep(&output->fmtctx->pb);
avformat_free_context(output->fmtctx);
av_audio_fifo_free(output->fifo);
av_frame_free(&output->frame);
output->avcctx = NULL;
output->fmtctx = NULL;
output->avst = NULL;
output->fifo = NULL;
}
void output_close(output_t *output) {
if (!output)
return;
output_shutdown(output);
free(output->filename);
g_slice_free1(sizeof(*output), output);
}
void output_init(const char *format) {
if (!strcmp(format, "wav")) {
output_codec_id = AV_CODEC_ID_PCM_S16LE;
output_file_format = "wav";
}
else if (!strcmp(format, "mp3")) {
output_codec_id = AV_CODEC_ID_MP3;
output_file_format = "mp3";
}
else
die("Unknown output format '%s'", format);
}