使用ffmpeg介面解封裝解碼為YUV

阿新 • • 發佈：2019-02-15

第一步: 相關結構的初始化

第一步: 通過開啟檔案獲取 AVFormatContext(解封裝輸入檔案格式)

第二步: 通過開啟檔案的 AVFormatContext,獲取音訊和視訊AVStream

第三步: 獲取音訊和視訊解碼器上下文和解碼器例項

avcodec_find_decoder和avcodec_open2開啟解碼器準備解碼音視訊流。該部分的程式碼實現如：

static int open_codec_context(IOFileName &files, DemuxingVideoAudioContex &va_ctx, enum AVMediaType type)
{
int ret, stream_index;
AVStream *st;
AVCodecContext *dec_ctx = NULL;
AVCodec *dec = NULL;
AVDictionary *opts = NULL;

ret = av_find_best_stream(va_ctx.fmt_ctx, type, -1, -1, NULL, 0);
if (ret < 0)
{
fprintf(stderr, “Could not find %s stream in input file ‘%s’\n”, av_get_media_type_string(type), files.src_filename);
return ret;
}
else
{
stream_index = ret;
st = va_ctx.fmt_ctx->streams[stream_index];

* find decoder for the stream *
dec_ctx = st->codec;
dec = avcodec_find_decoder(dec_ctx->codec_id);
if (!dec)
{
fprintf(stderr, “Failed to find %s codec\n”, av_get_media_type_string(type));
return AVERROR(EINVAL);
}

* Init the decoders, with or without reference counting *
av_dict_set(&opts, “refcounted_frames”, files.refcount ? “1” : “0”, 0);
if ((ret = avcodec_open2(dec_ctx, dec, &opts)) < 0)
{
fprintf(stderr, “Failed to open %s codec\n”, av_get_media_type_string(type));
return ret;
}

switch (type)  
{  
case AVMEDIA\_TYPE\_VIDEO:  
    va\_ctx.video\_stream\_idx = stream\_index;  
    va\_ctx.video\_stream = va\_ctx.fmt\_ctx->streams[stream\_index];  
    va\_ctx.video\_dec\_ctx = va\_ctx.video\_stream->codec;  
    break;  
case AVMEDIA\_TYPE\_AUDIO:  
    va\_ctx.audio\_stream\_idx = stream\_index;  
    va\_ctx.audio\_stream = va\_ctx.fmt\_ctx->streams[stream\_index];  
    va\_ctx.audio\_dec\_ctx = va\_ctx.audio\_stream->codec;  
    break;  
default:  
    fprintf(stderr, "Error: unsupported MediaType: %s\n", av\_get\_media\_type\_string(type));  
    return -1;  
}

}

return 0;

}

整體初始化的函式程式碼為

int InitDemuxContext(IOFileName &files, DemuxingVideoAudioContex &va_ctx)
{
int ret = 0, width, height;

* register all formats and codecs *
av_register_all();

* open input file, and allocate format context *
if (avformat_open_input(&(va_ctx.fmt_ctx), files.src_filename, NULL, NULL) < 0)
{
fprintf(stderr, “Could not open source file %s\n”, files.src_filename);
return -1;
}

* retrieve stream information *
if (avformat_find_stream_info(va_ctx.fmt_ctx, NULL) < 0)
{
fprintf(stderr, “Could not find stream information\n”);
return -1;
}

if (open_codec_context(files, va_ctx, AVMEDIA_TYPE_VIDEO) >= 0)
{
files.video_dst_file = fopen(files.video_dst_filename, “wb”);
if (!files.video_dst_file)
{
fprintf(stderr, “Could not open destination file %s\n”, files.video_dst_filename);
return -1;
}

*\* allocate image where the decoded image will be put \**  
va\_ctx.width = va\_ctx.video\_dec\_ctx->width;  
va\_ctx.height = va\_ctx.video\_dec\_ctx->height;  
va\_ctx.pix\_fmt = va\_ctx.video\_dec\_ctx->pix\_fmt;  
ret = av\_image\_alloc(va\_ctx.video\_dst\_data, va\_ctx.video\_dst\_linesize, va\_ctx.width, va\_ctx.height, va\_ctx.pix\_fmt, 1);  
if (ret < 0)  
{  
    fprintf(stderr, "Could not allocate raw video buffer\n");  
    return -1;  
}  
va\_ctx.video\_dst\_bufsize = ret;

}

if (open_codec_context(files, va_ctx, AVMEDIA_TYPE_AUDIO) >= 0)
{
files.audio_dst_file = fopen(files.audio_dst_filename, “wb”);
if (!files.audio_dst_file)
{
fprintf(stderr, “Could not open destination file %s\n”, files.audio_dst_filename);
return -1;
}
}

if (va_ctx.video_stream)
{
printf(“Demuxing video from file ‘%s’ into ‘%s’\n”, files.src_filename, files.video_dst_filename);
}

if (va_ctx.audio_stream)
{
printf(“Demuxing audio from file ‘%s’ into ‘%s’\n”, files.src_filename, files.audio_dst_filename);
}

* dump input information to stderr *
av_dump_format(va_ctx.fmt_ctx, 0, files.src_filename, 0);

if (!va_ctx.audio_stream && !va_ctx.video_stream)
{
fprintf(stderr, “Could not find audio or video stream in the input, aborting\n”);
return -1;
}

return 0;

}

分配AVFrame和初始化AVPacket物件：

va_ctx.frame = av_frame_alloc(); //分配AVFrame結構物件
if (!va_ctx.frame)
{
fprintf(stderr, “Could not allocate frame\n”);
ret = AVERROR(ENOMEM);
goto end;
}

* initialize packet, set data to NULL, let the demuxer fill it *
av_init_packet(&va_ctx.pkt); //初始化AVPacket物件
va_ctx.pkt.data = NULL;
va_ctx.pkt.size = 0;

第二步: 迴圈解析視訊檔案的包資料

解析視訊檔案的迴圈程式碼段為：

* read frames from the file *
while (av_read_frame(va_ctx.fmt_ctx, &va_ctx.pkt) >= 0) //從輸入程式中讀取一個包的資料
{
AVPacket orig_pkt = va_ctx.pkt;
do
{
ret = Decode_packet(files, va_ctx, &got_frame, 0); //解碼這個包
if (ret < 0)
break;
va_ctx.pkt.data += ret;
va_ctx.pkt.size -= ret;
} while (va_ctx.pkt.size > 0);
av_packet_unref(&orig_pkt);
}

這部分程式碼邏輯上非常簡單，首先呼叫av_read_frame函式，從檔案中讀取一個packet的資料，並實現了一個Decode_packet對這個packet進行解碼。Decode_packet函式的實現如下：

int Decode_packet(IOFileName &files, DemuxingVideoAudioContex &va_ctx, int *got_frame, int cached)
{
int ret = 0;
int decoded = va_ctx.pkt.size;
static int video_frame_count = 0;
static int audio_frame_count = 0;

*got_frame = 0;

if (va_ctx.pkt.stream_index == va_ctx.video_stream_idx)
{
* decode video frame *
ret = avcodec_decode_video2(va_ctx.video_dec_ctx, va_ctx.frame, got_frame, &va_ctx.pkt);
if (ret < 0)
{
printf(“Error decoding video frame (%d)\n”, ret);
return ret;
}

if (*got_frame)
{
if (va_ctx.frame->width != va_ctx.width || va_ctx.frame->height != va_ctx.height ||
va_ctx.frame->format != va_ctx.pix_fmt)
{
/* To handle this change, one could call av_image_alloc again and

decode the following frames into another rawvideo file. */

printf(“Error: Width, height and pixel format have to be ”
“constant in a rawvideo file, but the width, height or ”
“pixel format of the input video changed:\n”
“old: width = %d, height = %d, format = %s\n”
“new: width = %d, height = %d, format = %s\n”,
va_ctx.width, va_ctx.height, av_get_pix_fmt_name((AVPixelFormat)(va_ctx.pix_fmt)),
va_ctx.frame->width, va_ctx.frame->height,
av_get_pix_fmt_name((AVPixelFormat)va_ctx.frame->format));
return -1;
}

printf(“video_frame%s n:%d coded_n:%d pts:%s\n”, cached ? “(cached)” : “”, video_frame_count++, va_ctx.frame->coded_picture_number, va_ctx.frame->pts);

/* copy decoded frame to destination buffer:

this is required since rawvideo expects non aligned data */

av_image_copy(va_ctx.video_dst_data, va_ctx.video_dst_linesize,
(const uint8_t **)(va_ctx.frame->data), va_ctx.frame->linesize,
va_ctx.pix_fmt, va_ctx.width, va_ctx.height);

    *\* write to rawvideo file \**  
    fwrite(va\_ctx.video\_dst\_data[0], 1, va\_ctx.video\_dst\_bufsize, files.video\_dst\_file);  
}

}
else if (va_ctx.pkt.stream_index == va_ctx.audio_stream_idx)
{
* decode audio frame *
ret = avcodec_decode_audio4(va_ctx.audio_dec_ctx, va_ctx.frame, got_frame, &va_ctx.pkt);
if (ret < 0)
{
printf(“Error decoding audio frame (%s)\n”, ret);
return ret;
}
/* Some audio decoders decode only part of the packet, and have to be

called again with the remainder of the packet data.
Sample: fate-suite/lossless-audio/luckynight-partial.shn
Also, some decoders might over-read the packet. */

decoded = FFMIN(ret, va_ctx.pkt.size);

if (*got_frame)
{
size_t unpadded_linesize = va_ctx.frame->nb_samples * av_get_bytes_per_sample((AVSampleFormat)va_ctx.frame->format);
printf(“audio_frame%s n:%d nb_samples:%d pts:%s\n”,
cached ? “(cached)” : “”,
audio_frame_count++, va_ctx.frame->nb_samples,
va_ctx.frame->pts);

/* Write the raw audio data samples of the first plane. This works

fine for packed formats (e.g. AV_SAMPLE_FMT_S16). However,
most audio decoders output planar audio, which uses a separate
plane of audio samples for each channel (e.g. AV_SAMPLE_FMT_S16P).
In other words, this code will write only the first audio channel
in these cases.
You should use libswresample or libavfilter to convert the frame

to packed data. */

fwrite(va\_ctx.frame->extended\_data[0], 1, unpadded\_linesize, files.audio\_dst\_file);

}
}

/* If we use frame reference counting, we own the data and need

to de-reference it when we don’t use it anymore */

if (*got_frame && files.refcount)
av_frame_unref(va_ctx.frame);

    return decoded;

}

在該函式中，首先對讀取到的packet中的stream_index分別於先前獲取的音訊和視訊的stream_index進行對比來確定是音訊還是視訊流。而後分別呼叫相應的解碼函式進行解碼，以視訊流為例，判斷當前stream為視訊流後，呼叫avcodec_decode_video2函式將流資料解碼為畫素資料，並在獲取完整的一幀之後，將其寫出到輸出檔案中。

使用ffmpeg介面解封裝解碼為YUV

第一步: 相關結構的初始化

第一步: 通過開啟檔案獲取 AVFormatContext(解封裝輸入檔案格式)

第二步: 通過開啟檔案的 AVFormatContext,獲取音訊和視訊AVStream

第三步: 獲取音訊和視訊解碼器上下文和解碼器例項

整體初始化的函式程式碼為

分配AVFrame和初始化AVPacket物件：

第二步: 迴圈解析視訊檔案的包資料

使用ffmpeg介面解封裝解碼為YUV

FFmpeg In Android - 多媒體檔案解封裝/解碼/儲存Yuv

FFmpeg把MP4檔案解碼為YUV，然後通過SDL播放

使用ffmpeg介面將h.264解碼為YUV

7.基於FFMPEG將video解碼為YUV

使用 ffmpeg 進行網路推流：拉流->解封裝->解碼->處理原始資料（音訊、視訊）->編碼->編碼->推流

利用ffmpeg將H264流解碼為RGB

使用FFMPEG3.4.2版本進行視訊的解碼為YUV格式

Delphi 中，基於介面，封裝類為 BPL 包動態載入的程式架構之一

javacpp-FFmpeg系列之2：通用拉流解碼器，支持視頻拉流解碼並轉換為YUV、BGR24或RGB24等圖像像素數據

FFmpeg 4.0.2 解碼h264為YUV

從零實現簡易播放器:4.ffmpeg 解碼視訊為yuv資料-使用avcodec_send_packet與avcodec_receive_frame

ffmpeg實戰教程（一）Mp4，mkv等格式解碼為h264和yuv資料

ffmpeg最簡單的解碼保存YUV數據 <轉>

04 ffmpeg 從媒體文件解封裝，輸出YUV420圖像

FFMPEG實現對AAC解碼(不採用封裝格式實現)

FFMPEG實現對AAC解碼(採用封裝格式實現)

FFmpeg In Android - H264碼流解碼/儲存Yuv

4.基於FFMPEG將音訊解碼為PCM

呼叫FFmpeg SDK解析封裝格式的視訊為音訊流和視訊流

使用ffmpeg介面解封裝解碼為YUV

第一步: 相關結構的初始化

第一步: 通過開啟檔案獲取 AVFormatContext(解封裝輸入檔案格式)

第二步: 通過開啟檔案的 AVFormatContext,獲取音訊和視訊AVStream

第三步: 獲取音訊和視訊解碼器上下文和解碼器例項

整體初始化的函式程式碼為

分配AVFrame和初始化AVPacket物件：

第二步: 迴圈解析視訊檔案的包資料

相關推薦