使用 liavformat 和 libavcodec 實現編碼器

阿新 • • 發佈：2018-11-25

使用ffmpeg 的liavformat 封裝，使用libavcodec encodec，實現個編碼器，封裝yuv 檔案為flv/mp4等格式檔案。

視訊編碼的過程是解碼的逆過程，編碼的流程，從資料結構上看就是AVFrame-> AVPacket->AVCodecContext->AVFormatContext。生成AVPacket 為封裝，生成AVFrame 為encodec。其中，AVFormatContext:封裝格式上下文結構體，也是統領全域性的結構體，儲存了視訊檔案封裝格式相關資訊；AVCodecContext:編碼器上下文結構體，儲存了視訊(音訊)編解碼相關資訊；AVPacket:儲存一幀壓縮編碼資料;AVFrame:儲存一幀解碼後像素(取樣)資料。

編碼過程相對於解碼過程複雜點，因為解碼不需要關注各種引數，而編碼要設定各種複雜的引數，特使是時間戳的關係，這個搞不明白，就會出現幀率不對的情況。下面是雷神總結的流程圖：

他寫的程式碼只有encode，並沒有封裝過程，本文完成了後面部分，並做了部分修改。原始碼如下：

#include <stdio.h>
#include <libavutil/opt.h>
#include <libavformat/avformat.h>
#include <libavcodec/avcodec.h>
#include <libavutil/imgutils.h>
 
//test different codec
#define TEST_H264  1
 
 
int main(int argc, char* argv[])
{
	AVCodec *pCodec;
    AVCodecContext *pCodecCtx= NULL;
    int i, ret, got_output;
    FILE *fp_in;
	FILE *fp_out;
    AVFrame *pFrame;
    AVPacket pkt;
    AVStream *video_st;
	int y_size;
	int framecnt=0;
    int framerate=25;
 
	char filename_in[] = "in_1280x720.yuv"; //輸入yuv檔案， 必須註明解析度
	enum AVCodecID codec_id = AV_CODEC_ID_H264;

    // 輸出檔名
	char * h264_out = "out.h264";
    char * flv_out = "out.mp4";

    // 輸出 format
    AVFormatContext *ofmt_ctx = NULL; 
 
	int in_w=1280, in_h=720;	//對應的解析度
    int out_w = 1280, out_h = 720;
	int framenum=10000;	
 
    // 註冊所有編碼器
	av_register_all();

    // 初始化 out format
    avformat_alloc_output_context2(&ofmt_ctx, NULL, NULL, flv_out);
    if (!ofmt_ctx) {
        printf( "Could not create output context\n");
        ret = AVERROR_UNKNOWN;
        return -1 ;
    }

    //Open output file
    if (!(ofmt_ctx->oformat->flags & AVFMT_NOFILE)) {
        ret = avio_open(&ofmt_ctx->pb, flv_out, AVIO_FLAG_WRITE);//開啟輸出檔案。
        if (ret < 0) {
            printf( "Could not open output file '%s'", flv_out);
            return -1;
        }
    }

    video_st = avformat_new_stream(ofmt_ctx, 0);
    // 設定幀率，有的封裝格式，這個引數會被後面 avformat_write_header 覆蓋

    // 輸出 codec 的引數，這裡的引數一般ffmpeg 可以parse arg 得到，這裡暫時寫死
    pCodecCtx = video_st->codec;
    if (!pCodecCtx) {
        printf("Could not allocate video codec context\n");
        return -1;
    }
    pCodecCtx->codec_id = codec_id;
    pCodecCtx->codec_type = AVMEDIA_TYPE_VIDEO;
    pCodecCtx->bit_rate = 5000; 
    pCodecCtx->width = out_w; 
    pCodecCtx->height = out_h;
    pCodecCtx->time_base.num=1;
	pCodecCtx->time_base.den=25;

    // h264重要引數，不設定會報錯
    pCodecCtx->qmin = 10;
	pCodecCtx->qmax = 51;

    pCodecCtx->gop_size = 250;
    pCodecCtx->max_b_frames = 1;
    pCodecCtx->pix_fmt = AV_PIX_FMT_YUV420P;
 
    if (codec_id == AV_CODEC_ID_H264)
        av_opt_set(pCodecCtx->priv_data, "preset", "slow", 0);

    
    //開啟 codec 編碼器

    pCodec = avcodec_find_encoder(pCodecCtx->codec_id);
    if (!pCodec) {
        printf("Codec not found\n");
        return -1;
    }
 
    if (avcodec_open2(pCodecCtx, pCodec, NULL) < 0) {
        printf("Could not open codec\n");
        return -1;
    }
    
	//Input raw data
	fp_in = fopen(filename_in, "rb");
	if (!fp_in) {
		printf("Could not open %s\n", filename_in);
		return -1;
	}
	//h264 Output bitstream
	fp_out = fopen(h264_out, "wb");
	if (!fp_out) {
		printf("Could not open %s\n", h264_out);
		return -1;
	}

    // AVDictionary* opt = NULL;
    // av_dict_set_int(&opt, "video_track_timescale", 25, 0);
    //Write file header
    if (avformat_write_header(ofmt_ctx, NULL) < 0) {
        printf( "Error occurred when opening output file\n");
        return -1;
    }

    // init pFrame 
    pFrame = av_frame_alloc();
    if (!pFrame) {
        printf("Could not allocate video frame\n");
        return -1;
    }
    pFrame->format = pCodecCtx->pix_fmt;
    pFrame->width  = in_w;
    pFrame->height = in_h;
 
    ret = av_image_alloc(pFrame->data, pFrame->linesize, in_w, in_h,
                         pCodecCtx->pix_fmt, 1);
    if (ret < 0) {
        printf("Could not allocate raw picture buffer\n");
        return -1;
    }

    y_size = in_h * in_w;
    //Encode
    for (i; i< 5000; i++){
        av_init_packet(&pkt);
        pkt.data = NULL;    // packet data will be allocated by the encoder
        pkt.size = 0;
		//Read raw YUV data
		if (fread(pFrame->data[0],1,y_size,fp_in)<= 0||		// Y
			fread(pFrame->data[1],1,y_size/4,fp_in)<= 0||	// U
			fread(pFrame->data[2],1,y_size/4,fp_in)<= 0){	// V
			break;
		}else if(feof(fp_in)){
            printf("read yuv file meet error\n");
			break;
		}
 
        pFrame->pts = i;

        /* encode the pFrame */
        ret = avcodec_encode_video2(pCodecCtx, &pkt, pFrame, &got_output);
        if (ret < 0) {
            printf("Error encoding frame\n");
            return -1;
        }

        //由於裸流裡本來就沒有可靠的pts和timebase等資料，pts的計算依靠設定的幀率
        double calc_duration = (double)1/framerate;
        pkt.pts = (double)(framecnt*calc_duration) / (av_q2d(video_st->time_base));
        pkt.dts = pkt.pts;
        pkt.duration = calc_duration / av_q2d(video_st->time_base);

        if (got_output) {
            printf("Succeed to encode frame: %5d\tsize:%5d\n",framecnt,pkt.size);
			framecnt++;
            pkt.stream_index = video_st->index;
            fwrite(pkt.data, 1, pkt.size, fp_out);
            av_interleaved_write_frame(ofmt_ctx, &pkt); //將AVPacket（儲存視訊壓縮碼流資料）寫入檔案
        }

       
        av_free_packet(&pkt);
    }
 
    av_write_trailer(ofmt_ctx); // write tailer

    // 釋放記憶體
    fclose(fp_out);
    avcodec_close(video_st->codec);
    avcodec_close(pCodecCtx);
    av_free(pCodecCtx);
    av_freep(&pFrame->data[0]);
    av_frame_free(&pFrame);
 
	return 0;
}

在寫編碼器的過程中，位元速率一直控制的不準，出現了幀率控制不好的情況，有參考這個文章：https://blog.csdn.net/mj1523/article/details/50434977 ，但是後來發現，其實幀率控制不需要那麼做，因為是裸流，pkg 的pts 沒有設定引起的。然後加上pkg 生成部分的pts 設定，問題得以解決。

下面大致介紹下，pts，dts 區別，為什麼有這個區別，該怎麼取值等問題, timebase又是個啥玩意？

首先是為什麼package 要有pts， dts 這兩個玩意？首先，視訊顯示是一幀一幀，但是編碼並不是一幀的。視訊分為I P B 幀，需要在顯示B幀之前知道P幀中的資訊，所以沒有B 幀的時候，pts，dts 編碼時間和顯示時間就是一致的，但是有的時候，編碼的時候P 幀需要提前。

為什麼取值的時候有timebase, ffmpeg 各個資料層之間的時間基準不一樣，不能直接相互使用，否則會出現溢位的情況，比如mux/demux層的timebase，flv，MP4等一般是1:1000，ts一般是1:90*1000 。codec/decode層timebase，h264隨著幀率變化例如1:25 aac根據取樣率變化例如1:44100。c：Raw data 層的timebase有很多變化比如1:1000*1000 或1:1000等等。

最後是pts 怎麼取值的問題，類似轉碼，有穩定的輸入值參考，可以直接使用輸入 AVStream 的pts 給輸出pkg 賦值，像本文這種情況，是使用的裸流，就需要自己通過幀率和timebase 進行計算，計算過程就較為簡單，查下對應公式即可。

使用 liavformat 和 libavcodec 實現編碼器

使用 liavformat 和 libavcodec 實現編碼器

使用 liavformat 和 libavcodec 實現解碼器

增量式編碼器和絕對式編碼器，ABI訊號和UVW訊號、編碼器PWM訊號

實現硬體PWM控制電機旋轉和通過編碼器計算所轉圈數的簡單例程

seq2seq通俗理解----編碼器和解碼器(TensorFlow實現)

哈夫曼編碼(Huffman coding)的那些事,(編碼技術介紹和程序實現)

使用iter , 和reversed 實現正、反向叠代器

使用Python之paramiko模塊和threading實現多線程登錄多臺Linux服務器

tensorflow學習筆記(三)：實現自編碼器

用javascript實現base64編碼器

Spring-boot和kafka實現消息發送器

ubuntu16。04LST配置nfs實現服務器和客戶端共享文件

安全的web服務器——使用mysqldump和mysqlbinlog實現MySQL全量與增量備份

為什麼NVIDIA NVENC 硬體H.264編碼器對XD和Horizon如此重要

pytorch 實現變分自動編碼器

增量編碼器的線數和倍頻

Django之基於session和CBV模式裝飾器實現使用者認證

VAE----變分自編碼器Keras實現

卷積去噪自編碼器專案實現

android平臺下基於ffmpeg和ANativeWindow實現簡單的視訊播放器

使用 liavformat 和 libavcodec 實現編碼器

相關推薦