使用ffmpeg实现转码样例(代码实现)

分类： C/C++

使用ffmpeg转码主要工作如下:

Demux -> Decoding -> Encoding -> Muxing

其中接口调用如下：

点击(此处)折叠或打开

av_register_all();

avformat_open_input

avformat_find_stream_info

open_codec_context

av_image_alloc

avcodec_alloc_frame

avformat_alloc_output_context2

avcodec_open2

avcodec_alloc_frame

avpicture_alloc

avformat_write_header

av_init_packet

av_read_frame

avcodec_decode_video2

av_image_copy

avcodec_encode_video2

av_interleaved_write_frame

av_write_trailer

下面的代码为主要将视频转码，封装为h264编码格式的mp4文件，音频为mp3，但是主要操作并不处理音频文件。代码如下

点击(此处)折叠或打开

#include <stdlib.h>

#include <stdio.h>

#include <string.h>

#include <math.h>

#include <libavutil/opt.h>

#include <libavutil/mathematics.h>

#include <libavformat/avformat.h>

#include <libswscale/swscale.h>

#include <libswresample/swresample.h>

/* 5 seconds stream duration */

#define STREAM_DURATION 200.0

#define STREAM_FRAME_RATE 25 /* 25 images/s */

#define STREAM_NB_FRAMES ((int)(STREAM_DURATION * STREAM_FRAME_RATE))

#define STREAM_PIX_FMT AV_PIX_FMT_YUV420P /* default pix_fmt */

static AVFormatContext *input_fmt_ctx = NULL;

static int sws_flags = SWS_BICUBIC;

static AVPacket input_pkt;

static int video_stream_idx = -1;

static uint8_t *video_dst_data[4] = {NULL};

static int video_dst_linesize[4];

static AVStream *input_video_stream;

static AVFrame *input_frame;

static AVCodecContext *video_dec_ctx = NULL;

static int video_dst_bufsize;

static int open_codec_context(int *stream_idx,

AVFormatContext *fmt_ctx, enum AVMediaType type)

{

int ret;

AVStream *st;

AVCodecContext *dec_ctx = NULL;

AVCodec *dec = NULL;

ret = av_find_best_stream(fmt_ctx, type, -1, -1, NULL, 0);

if (ret < 0) {

return ret;

} else {

*stream_idx = ret;

st = fmt_ctx->streams[*stream_idx];

/* find decoder for the stream */

dec_ctx = st->codec;

dec = avcodec_find_decoder(dec_ctx->codec_id);

if (!dec) {

fprintf(stderr, "Failed to find %s codec ",

av_get_media_type_string(type));

return ret;

}

if ((ret = avcodec_open2(dec_ctx, dec, NULL)) < 0) {

fprintf(stderr, "Failed to open %s codec ",

av_get_media_type_string(type));

return ret;

}

return 0;

}

/* Add an output stream. */

static AVStream *add_stream(AVFormatContext *oc, AVCodec **codec,

enum AVCodecID codec_id)

{

AVCodecContext *c;

AVStream *st;

/* find the encoder */

*codec = avcodec_find_encoder(codec_id);

if (!(*codec)) {

fprintf(stderr, "Could not find encoder for '%s' ",

avcodec_get_name(codec_id));

exit(1);

}

st = avformat_new_stream(oc, *codec);

if (!st) {

fprintf(stderr, "Could not allocate stream ");

exit(1);

}

st->id = oc->nb_streams-1;

c = st->codec;

switch ((*codec)->type) {

case AVMEDIA_TYPE_AUDIO:

c->sample_fmt = AV_SAMPLE_FMT_FLTP;

c->bit_rate = 64000;

c->sample_rate = 44100;

c->channels = 2;

break;

case AVMEDIA_TYPE_VIDEO:

c->codec_id = codec_id;

c->bit_rate = 400000;

c->time_base.den = STREAM_FRAME_RATE;

c->time_base.num = 1;

c->gop_size = 12;

c->pix_fmt = STREAM_PIX_FMT;

break;

default:

break;

}

/* Some formats want stream headers to be separate. */

if (oc->oformat->flags & AVFMT_GLOBALHEADER)

c->flags |= CODEC_FLAG_GLOBAL_HEADER;

return st;

}

/**************************************************************/

/* audio output */

static float t, tincr, tincr2;

static uint8_t **src_samples_data;

static int src_samples_linesize;

static int src_nb_samples;

static int max_dst_nb_samples;

uint8_t **dst_samples_data;

int dst_samples_linesize;

int dst_samples_size;

struct SwrContext *swr_ctx = NULL;

static void open_audio(AVFormatContext *oc, AVCodec *codec, AVStream *st)

{

AVCodecContext *c;

int ret;

c = st->codec;

/* open it */

ret = avcodec_open2(c, codec, NULL);

if (ret < 0) {

fprintf(stderr, "Could not open audio codec: %s ", av_err2str(ret));

exit(1);

}

/* init signal generator */

t = 0;

tincr = 2 * M_PI * 110.0 / c->sample_rate;

/* increment frequency by 110 Hz per second */

tincr2 = 2 * M_PI * 110.0 / c->sample_rate / c->sample_rate;

src_nb_samples = c->codec->capabilities & CODEC_CAP_VARIABLE_FRAME_SIZE ?

10000 : c->frame_size;

ret = av_samples_alloc_array_and_samples(&src_samples_data, &src_samples_linesize, c->channels,

src_nb_samples, c->sample_fmt, 0);

if (ret < 0) {

fprintf(stderr, "Could not allocate source samples ");

exit(1);

}

/* create resampler context */

if (c->sample_fmt != AV_SAMPLE_FMT_S16) {

swr_ctx = swr_alloc();

if (!swr_ctx) {

fprintf(stderr, "Could not allocate resampler context ");

exit(1);

}

/* set options */

av_opt_set_int (swr_ctx, "in_channel_count", c->channels, 0);

av_opt_set_int (swr_ctx, "in_sample_rate", c->sample_rate, 0);

av_opt_set_sample_fmt(swr_ctx, "in_sample_fmt", AV_SAMPLE_FMT_S16, 0);

av_opt_set_int (swr_ctx, "out_channel_count", c->channels, 0);

av_opt_set_int (swr_ctx, "out_sample_rate", c->sample_rate, 0);

av_opt_set_sample_fmt(swr_ctx, "out_sample_fmt", c->sample_fmt, 0);

/* initialize the resampling context */

if ((ret = swr_init(swr_ctx)) < 0) {

fprintf(stderr, "Failed to initialize the resampling context ");

exit(1);

}

/* compute the number of converted samples: buffering is avoided

* ensuring that the output buffer will contain at least all the

* converted input samples */

max_dst_nb_samples = src_nb_samples;

ret = av_samples_alloc_array_and_samples(&dst_samples_data, &dst_samples_linesize, c->channels,

max_dst_nb_samples, c->sample_fmt, 0);

if (ret < 0) {

fprintf(stderr, "Could not allocate destination samples ");

exit(1);

}

dst_samples_size = av_samples_get_buffer_size(NULL, c->channels, max_dst_nb_samples,

c->sample_fmt, 0);

}

/* Prepare a 16 bit dummy audio frame of 'frame_size' samples and

* 'nb_channels' channels. */

static void get_audio_frame(int16_t *samples, int frame_size, int nb_channels)

{

int j, i, v;

int16_t *q;

q = samples;

for (j = 0; j < frame_size; j++) {

v = (int)(sin(t) * 10000);

for (i = 0; i < nb_channels; i++)

*q++ = v;

t += tincr;

tincr += tincr2;

}

static void write_audio_frame(AVFormatContext *oc, AVStream *st)

{

AVCodecContext *c;

AVPacket pkt = { 0 }; // data and size must be 0;

AVFrame *frame = avcodec_alloc_frame();

int got_packet, ret, dst_nb_samples;

av_init_packet(&pkt);

c = st->codec;

get_audio_frame((int16_t *)src_samples_data[0], src_nb_samples, c->channels);

/* convert samples from native format to destination codec format, using the resampler */

if (swr_ctx) {

/* compute destination number of samples */

dst_nb_samples = av_rescale_rnd(swr_get_delay(swr_ctx, c->sample_rate) + src_nb_samples,

c->sample_rate, c->sample_rate, AV_ROUND_UP);

if (dst_nb_samples > max_dst_nb_samples) {

av_free(dst_samples_data[0]);

ret = av_samples_alloc(dst_samples_data, &dst_samples_linesize, c->channels,

dst_nb_samples, c->sample_fmt, 0);

if (ret < 0)

exit(1);

max_dst_nb_samples = dst_nb_samples;

dst_samples_size = av_samples_get_buffer_size(NULL, c->channels, dst_nb_samples,

c->sample_fmt, 0);

}

/* convert to destination format */

ret = swr_convert(swr_ctx,

dst_samples_data, dst_nb_samples,

(const uint8_t **)src_samples_data, src_nb_samples);

if (ret < 0) {

fprintf(stderr, "Error while converting ");

exit(1);

}

} else {

dst_samples_data[0] = src_samples_data[0];

dst_nb_samples = src_nb_samples;

}

frame->nb_samples = dst_nb_samples;

avcodec_fill_audio_frame(frame, c->channels, c->sample_fmt,

dst_samples_data[0], dst_samples_size, 0);

ret = avcodec_encode_audio2(c, &pkt, frame, &got_packet);

if (ret < 0) {

fprintf(stderr, "Error encoding audio frame: %s ", av_err2str(ret));

exit(1);

}

if (!got_packet)

return;

pkt.stream_index = st->index;

/* Write the compressed frame to the media file. */

ret = av_interleaved_write_frame(oc, &pkt);

if (ret != 0) {

fprintf(stderr, "Error while writing audio frame: %s ",

av_err2str(ret));

exit(1);

}

avcodec_free_frame(&frame);

}

static void close_audio(AVFormatContext *oc, AVStream *st)

{

avcodec_close(st->codec);

av_free(src_samples_data[0]);

av_free(dst_samples_data[0]);

}

/***********************bbs.ChinaFFmpeg.com****孙悟空***********************/

/* video output */

static AVFrame *frame;

static AVPicture src_picture, dst_picture;

static int frame_count;

static void open_video(AVFormatContext *oc, AVCodec *codec, AVStream *st)

{

int ret;

AVCodecContext *c = st->codec;

/* open the codec */

ret = avcodec_open2(c, codec, NULL);

if (ret < 0) {

fprintf(stderr, "Could not open video codec: %s ", av_err2str(ret));

exit(1);

}

/* allocate and init a re-usable frame */

frame = avcodec_alloc_frame();

if (!frame) {

fprintf(stderr, "Could not allocate video frame ");

exit(1);

}

/* Allocate the encoded raw picture. */

ret = avpicture_alloc(&dst_picture, c->pix_fmt, c->width, c->height);

if (ret < 0) {

fprintf(stderr, "Could not allocate picture: %s ", av_err2str(ret));

exit(1);

}

/* If the output format is not YUV420P, then a temporary YUV420P

* picture is needed too. It is then converted to the required

* output format. */

if (c->pix_fmt != AV_PIX_FMT_YUV420P) {

ret = avpicture_alloc(&src_picture, AV_PIX_FMT_YUV420P, c->width, c->height);

if (ret < 0) {

fprintf(stderr, "Could not allocate temporary picture: %s ",

av_err2str(ret));

exit(1);

}

/* copy data and linesize picture pointers to frame */

*((AVPicture *)frame) = dst_picture;

}

static void write_video_frame(AVFormatContext *oc, AVStream *st)

{

int ret;

static struct SwsContext *sws_ctx;

AVCodecContext *c = st->codec;

// fill_yuv_image(&dst_picture, frame_count, c->width, c->height);

if (oc->oformat->flags & AVFMT_RAWPICTURE) {

/* Raw video case - directly store the picture in the packet */

AVPacket pkt;

av_init_packet(&pkt);

pkt.flags |= AV_PKT_FLAG_KEY;

pkt.stream_index = st->index;

pkt.data = dst_picture.data[0];

pkt.size = sizeof(AVPicture);

ret = av_interleaved_write_frame(oc, &pkt);

} else {

AVPacket pkt = { 0 };

int got_packet;

av_init_packet(&pkt);

/* encode the image */

ret = avcodec_encode_video2(c, &pkt, frame, &got_packet);

if (ret < 0) {

fprintf(stderr, "Error encoding video frame: %s ", av_err2str(ret));

exit(1);

}

/* If size is zero, it means the image was buffered. */

if (!ret && got_packet && pkt.size) {

pkt.stream_index = st->index;

/* Write the compressed frame to the media file. */

ret = av_interleaved_write_frame(oc, &pkt);

} else {

ret = 0;

}

if (ret != 0) {

fprintf(stderr, "Error while writing video frame: %s ", av_err2str(ret));

exit(1);

}

frame_count++;

}

static void close_video(AVFormatContext *oc, AVStream *st)

{

avcodec_close(st->codec);

av_free(src_picture.data[0]);

av_free(dst_picture.data[0]);

av_free(frame);

}

/**************************************************************/

/* media file output */

int main(int argc, char **argv)

{

const char *filename;

const char *input_file;

AVOutputFormat *fmt;

AVFormatContext *oc;

AVStream *audio_st, *video_st;

AVCodec *audio_codec, *video_codec;

double audio_time, video_time;

int ret;

int decoded;

int got_frame;

/* Initialize libavcodec, and register all codecs and formats. */

av_register_all();

if (argc != 3) {

printf("usage: %s output_file inputfile "

"API example program to output a media file with libavformat. "

"This program generates a synthetic audio and video stream, encodes and "

"muxes them into a file named output_file. "

"The output format is automatically guessed according to the file extension. "

"Raw images can also be output by using '%%d' in the filename. "

" ", argv[0]);

return 1;

}

input_file = argv[2];

filename = argv[1];

if (avformat_open_input( &input_fmt_ctx, input_file, NULL, NULL) < 0) {

fprintf(stderr, "Could not open source file %s ", input_file);

exit(-1);

}

/* retrieve stream information */

if (avformat_find_stream_info(input_fmt_ctx, NULL) < 0) {

fprintf(stderr, "Could not find stream information ");

exit(1);

}

if (open_codec_context(&video_stream_idx, input_fmt_ctx, AVMEDIA_TYPE_VIDEO) >= 0) {

input_video_stream = input_fmt_ctx->streams[video_stream_idx];

video_dec_ctx = input_video_stream->codec;

ret = av_image_alloc(video_dst_data, video_dst_linesize,

video_dec_ctx->width, video_dec_ctx->height,

video_dec_ctx->pix_fmt, 1);

if (ret < 0) {

fprintf(stderr, "Could not allocate raw video buffer ");

}

video_dst_bufsize = ret;

}

input_frame = avcodec_alloc_frame();

if (!input_frame) {

fprintf(stderr, "Could not allocate frame ");

ret = AVERROR(ENOMEM);

exit(-1);

}

/* allocate the output media context */

avformat_alloc_output_context2(&oc, NULL, NULL, filename);

if (!oc) {

printf("Could not deduce output format from file extension: using MPEG. ");

avformat_alloc_output_context2(&oc, NULL, "mpeg", filename);

}

if (!oc) {

return 1;

}

fmt = oc->oformat;

video_st = NULL;

audio_st = NULL;

fmt->video_codec = AV_CODEC_ID_H264;

if (fmt->video_codec != AV_CODEC_ID_NONE) {

video_st = add_stream(oc, &video_codec, AV_CODEC_ID_H264);

}

if (video_st->codec) {

video_st->codec->width = video_dec_ctx->width;

video_st->codec->height = video_dec_ctx->height;

}

fmt->audio_codec = AV_CODEC_ID_MP3;

if (fmt->audio_codec != AV_CODEC_ID_NONE) {

audio_st = add_stream(oc, &audio_codec, AV_CODEC_ID_MP3);

}

/* Now that all the parameters are set, we can open the audio and

* video codecs and allocate the necessary encode buffers. */

if (video_st)

open_video(oc, video_codec, video_st);

if (audio_st)

open_audio(oc, audio_codec, audio_st);

av_dump_format(oc, 0, filename, 1);

/* open the output file, if needed */

if (!(fmt->flags & AVFMT_NOFILE)) {

ret = avio_open(&oc->pb, filename, AVIO_FLAG_WRITE);

if (ret < 0) {

fprintf(stderr, "Could not open '%s': %s ", filename,

av_err2str(ret));

return 1;

}

/* Write the stream header, if any. */

ret = avformat_write_header(oc, NULL);

if (ret < 0) {

fprintf(stderr, "Error occurred when opening output file: %s ",

av_err2str(ret));

return 1;

}

av_init_packet(&input_pkt);

input_pkt.data = NULL;

input_pkt.size = 0;

if (frame)

frame->pts = 0;

for (;;) {

/* Compute current audio and video time. */

audio_time = audio_st ? audio_st->pts.val * av_q2d(audio_st->time_base) : 0.0;

video_time = video_st ? video_st->pts.val * av_q2d(video_st->time_base) : 0.0;

if ((!audio_st || audio_time >= STREAM_DURATION) &&

(!video_st || video_time >= STREAM_DURATION))

break;

/* write interleaved audio and video frames */

if (!video_st || (video_st && audio_st && audio_time < video_time)) {

write_audio_frame(oc, audio_st);

} else {

av_read_frame(input_fmt_ctx, &input_pkt);

decoded = input_pkt.size;

if (input_pkt.stream_index == video_stream_idx) {

/* decode video frame */

ret = avcodec_decode_video2(video_dec_ctx, input_frame, &got_frame, &input_pkt);

if (ret < 0) {

fprintf(stderr, "Error decoding video frame ");

return ret;

}

if (got_frame) {

av_image_copy(&dst_picture, video_dst_linesize,

(const uint8_t **)(input_frame->data), input_frame->linesize,

video_dec_ctx->pix_fmt, video_dec_ctx->width, video_dec_ctx->height);

}

write_video_frame(oc, video_st);

frame->pts += av_rescale_q(1, video_st->codec->time_base, video_st->time_base);

}

av_write_trailer(oc);

/* Close each codec. */

if (video_st)

close_video(oc, video_st);

if (audio_st)

close_audio(oc, audio_st);

if (!(fmt->flags & AVFMT_NOFILE))

avio_close(oc->pb);

avformat_free_context(oc);

av_free(input_frame);

av_free(video_dst_data[0]);

avcodec_close(video_dec_ctx);

return 0;

}

以上代码为从dox/example/muxing.c中修改得到

编译命令如下：

点击(此处)折叠或打开

gcc -g doc/examples/muxing.c -o muxing -lavcodec -lavdevice -lavfilter -lavformat -lavutil -lswscale -lswresample -lpostproc -lx264 -lmp3lame -lz -liconv -lbz2

执行命令如下：

点击(此处)折叠或打开

执行后效果如下：

查看转码完成后的多媒体文件的信息：
使用ffmpeg实现转码样例(代码实现)

查看转码后的文件的视频:
使用ffmpeg实现转码样例(代码实现)

使用ffmpeg实现转码样例(代码实现)

相关推荐