ffmpeg 提取pcm 儲存為wav

阿新 • • 發佈：2018-12-17

	
    #include "stdafx.h"
	#ifdef  __cplusplus
	extern "C"
	{
	#endif
	#include "libavcodec/avcodec.h"
	#include "libavformat/avformat.h"
	#include "libavdevice/avdevice.h"
	#include "libavfilter/avfilter.h"
	#include "libavfilter/avfiltergraph.h"
	#include "libavfilter/buffersink.h"
	#include "libavfilter/buffersrc.h"
	#include "libavutil/audio_fifo.h"
	#include "libavutil/avutil.h"
	#include "libavutil/fifo.h"
	#include "libswresample/swresample.h"
	#ifdef  __cplusplus
	}
	#endif

	#include <windows.h>
	#include <conio.h>
	#include <time.h>
	#include <tchar.h>
	#include <stdio.h>
	#include <cstring>

	// Forward declarations of the helpers defined after main().
	void writeWavHeader(AVCodecContext *pCodecCtx, AVFormatContext *pFormatCtx, FILE *audioFile);
	int openinputfile(const char* filename) ;
	// Byte size of the scratch buffer main() allocates for converted audio.
	#define MAX_AUDIO_FRAME_SIZE 192000
	uint64_t out_channel_layout = AV_CH_LAYOUT_STEREO;// output channel layout
    AVSampleFormat out_sample_fmt =AV_SAMPLE_FMT_S16;// output sample format	
	// Demuxer context of the input file; opened by openinputfile(), closed in main().
	AVFormatContext *ifmt_ctx = NULL;  
	// Index of the audio stream selected by openinputfile(); stays -1 until one is found.
	int AudioStreamIndex = -1;
	// Shared status variables: got_frame is filled in by the decode call in main(),
	// ret holds the most recent FFmpeg return code (only ret is explicitly set to -1).
    int got_frame ,ret = -1;  
	// Alternative test inputs kept for reference:
	//char *filename = "E:\\摩登兄弟劉宇寧 - 有多少愛可以重來.mp3";
	//char *filename="E:\\1.mp3";
	//char *filename="E:\\音訊.mp3";
	//char *filename="E:\\1.mp4";
	//char * filename="E:\\sample.mp4";
	// Input file processed by main(); the output name is derived from it.
	char * filename="E:\\Nocturne.m4a";

	int main()  
	{  
		AVCodecContext *pCodecCtx;
		int channels=0;
		int sample_rate=0;
		AVPacket pkt_in, pkt_out;  
		AVFrame *frame = NULL;  
		uint8_t	 *buffer = NULL;
		struct SwrContext	*audio_convert_ctx = NULL;
		char* extention;
		av_register_all(); 

		if (openinputfile(filename) < 0)  
		{  
			printf("failed to open input file");  
			goto end;  
		}  
		extention = strrchr(filename , '.') + 1;
		int isSame= strcmp(extention,"wav");

		FILE *p = NULL;  
		char tmpName[100];
		sprintf_s(tmpName, "%s_%d_%dchannel.wav", filename, ifmt_ctx->streams[AudioStreamIndex]->codec->sample_rate, ifmt_ctx->streams[AudioStreamIndex]->codec->channels);
		p = fopen(tmpName, "w+b");
		int size = av_get_bytes_per_sample(ifmt_ctx->streams[AudioStreamIndex]->codec->sample_fmt);
		av_dump_format(ifmt_ctx, 0, filename, 0);
		if(AudioStreamIndex>=0)
		{
			 pCodecCtx=ifmt_ctx->streams[AudioStreamIndex]->codec;
			 printf("聲道數:%d\n",pCodecCtx->channels);
			 printf("時長:%d\n", ifmt_ctx->duration / 1000);
			 channels=pCodecCtx->channels;
			 sample_rate=pCodecCtx->sample_rate;
			 writeWavHeader(pCodecCtx,ifmt_ctx,p);
		}
		//音訊輸出引數
		int out_nb_samples = pCodecCtx->frame_size;//nb_samples: AAC-1024 MP3-1152 
		int out_sample_rate =pCodecCtx->sample_rate;// 44100;//取樣率
		int out_nb_channels = av_get_channel_layout_nb_channels(out_channel_layout);//根據聲道格式返回聲道個數
		int out_buffer_size = av_samples_get_buffer_size(NULL, out_nb_channels, out_nb_samples, out_sample_fmt, 1);
	 
		buffer = (uint8_t *)av_malloc(MAX_AUDIO_FRAME_SIZE);
		audio_convert_ctx = swr_alloc();
		if (audio_convert_ctx == NULL)
		{
			printf("Could not allocate SwrContext\n");
			return -1;
		}
		swr_alloc_set_opts(audio_convert_ctx, out_channel_layout, out_sample_fmt,out_sample_rate,pCodecCtx->channel_layout, pCodecCtx->sample_fmt, pCodecCtx->sample_rate, 0, NULL);
		swr_init(audio_convert_ctx);
		int frameindex=0;
		while(1)  
		{  
			if (av_read_frame(ifmt_ctx, &pkt_in) < 0)  
			{  
				break;  
			}  
			av_init_packet(&pkt_out);  
			if (AudioStreamIndex == pkt_in.stream_index)
			{
				frame = av_frame_alloc();  
				ret = avcodec_decode_audio4(ifmt_ctx->streams[AudioStreamIndex]->codec, frame, &got_frame, &pkt_in);  
				if (ret < 0)  
				{  
					av_frame_free(&frame);  
					printf("decoding audio stream failed\n");  
					break;  
				}  
				if (got_frame)  
				{
					frameindex++;

					if(isSame)
					{
					 
					  swr_convert(audio_convert_ctx, &buffer, MAX_AUDIO_FRAME_SIZE, (const uint8_t **)frame->data, frame->nb_samples<1000?1152:frame->nb_samples);
					  printf("index:%5d\t pts:%lld\t packet size:%d\n", frameindex, pkt_in.pts, pkt_in.size);
					  fwrite(buffer, 1, out_buffer_size, p);
					}
					else
					{
						if(frame->data[0])
						{
							 fwrite(frame->data[0], 1, frame->linesize[0], p);
						}
					}
				}  
			}       
		}  
		printf("總幀數:%d\n",frameindex);
		fclose(p);  
		end:  
	    swr_free(&audio_convert_ctx);
		av_free(buffer);
		avcodec_close(pCodecCtx);
		avformat_close_input(&ifmt_ctx);  
		printf("enter any key to stop\n");
		//getchar();  
		return 0;  
	}  
int openinputfile(const char* filename)  
{  
    //open the input  
    if ((ret = avformat_open_input(&ifmt_ctx, filename, NULL, NULL)) < 0)  
    {  
        printf("can not open input");  
        return ret;  
    }  
    if ((ret = avformat_find_stream_info(ifmt_ctx, NULL)))  
    {  
        printf("can not find input stream info");  
        return ret;  
    }  
    //open the decoder  
    for (int i = 0; i <(int)ifmt_ctx->nb_streams; i++)  
    {  
        if (ifmt_ctx->streams[i]->codec->codec_type == AVMEDIA_TYPE_AUDIO)  
        {  
            AudioStreamIndex = i;
            ret = avcodec_open2(ifmt_ctx->streams[i]->codec,avcodec_find_decoder(ifmt_ctx->streams[i]->codec->codec_id), NULL);  
            if (ret < 0)  
            {  
                printf("can not open decoder");  
                return ret;  
            } 
        }  
    }  
    return 0;  
}  

/*
 * Write the 44-byte RIFF/WAVE header for integer PCM at the current
 * position of audioFile.
 *
 * pCodecCtx   supplies sample format, sample rate and channel count.
 *             U8 -> 8 bit, S32 -> 32 bit, everything else -> 16 bit.
 * pFormatCtx  supplies the stream duration used to estimate the payload size.
 * audioFile   destination stream, opened for binary writing.
 *
 * The size fields are an estimate derived from the container duration; when
 * the duration is unknown they are written as an empty payload. Fields are
 * written in host byte order, so this assumes a little-endian host.
 * Nothing is written if any argument is NULL.
 */
void writeWavHeader(AVCodecContext *pCodecCtx, AVFormatContext *pFormatCtx, FILE *audioFile)
{
    const UINT32 maxDataSize = 0xFFFFFFFFu - 36u; /* RIFF size = data size + 36 must fit in 32 bits */
    UINT32 fmtChunkSize = 16;
    UINT16 formatTag = 0x01; /* integer PCM */
    UINT16 bits = 16;
    UINT16 channels;
    UINT32 sampleRate;
    UINT16 blockAlign;
    UINT32 byteRate;
    UINT64 audioDataSize = 0;
    UINT32 dataSize32;
    UINT32 riffSize32;

    if (pCodecCtx == NULL || pFormatCtx == NULL || audioFile == NULL)
    {
        return;
    }

    switch (pCodecCtx->sample_fmt)
    {
    case AV_SAMPLE_FMT_U8:
        bits = 8;
        break;
    case AV_SAMPLE_FMT_S32:
        bits = 32;
        break;
    case AV_SAMPLE_FMT_S16:
    default:
        bits = 16;
        break;
    }

    channels = (UINT16)pCodecCtx->channels;
    sampleRate = (UINT32)pCodecCtx->sample_rate;
    blockAlign = (UINT16)((bits / 8) * channels);
    byteRate = sampleRate * blockAlign;

    /* duration is expressed in AV_TIME_BASE units (microseconds), not in
       seconds, and is negative when unknown. Whole seconds and the
       fractional remainder are scaled separately to avoid overflow. */
    if (pFormatCtx->duration > 0)
    {
        UINT64 duration = (UINT64)pFormatCtx->duration;
        audioDataSize = (duration / AV_TIME_BASE) * byteRate
                      + (duration % AV_TIME_BASE) * byteRate / AV_TIME_BASE;
    }
    if (audioDataSize > maxDataSize)
    {
        audioDataSize = maxDataSize;
    }
    if (blockAlign != 0)
    {
        /* keep the payload a whole number of sample frames */
        audioDataSize -= audioDataSize % blockAlign;
    }
    /* Narrow explicitly instead of writing the low half of a 64-bit variable. */
    dataSize32 = (UINT32)audioDataSize;
    riffSize32 = dataSize32 + 36u;

    fwrite("RIFF", sizeof(char), 4, audioFile);
    fwrite(&riffSize32, sizeof(riffSize32), 1, audioFile);
    fwrite("WAVE", sizeof(char), 4, audioFile);
    fwrite("fmt ", sizeof(char), 4, audioFile);
    fwrite(&fmtChunkSize, sizeof(fmtChunkSize), 1, audioFile);
    fwrite(&formatTag, sizeof(formatTag), 1, audioFile);
    fwrite(&channels, sizeof(channels), 1, audioFile);
    fwrite(&sampleRate, sizeof(sampleRate), 1, audioFile);
    fwrite(&byteRate, sizeof(byteRate), 1, audioFile);
    fwrite(&blockAlign, sizeof(blockAlign), 1, audioFile);
    fwrite(&bits, sizeof(bits), 1, audioFile);
    fwrite("data", sizeof(char), 4, audioFile);
    fwrite(&dataSize32, sizeof(dataSize32), 1, audioFile);
}

ffmpeg 提取pcm 儲存為wav

#include "stdafx.h" #ifdef __cplusplus extern "C" { #endif #include "libavcodec/avcodec.h" #include "libavformat/avformat.h"

[原始碼和文件分享]程式設計實現錄音及儲存為WAV音訊檔案

背景：之前自己錄製視訊教程的時候，從網上找過一些破解版錄屏軟體來使用。後來，我細想了一下，其實我自己就可以寫一個簡單的錄屏小軟體。於是，後來我也自己慢慢摸索著，從網上搜索資料，慢慢地開發了一個有基本的錄音錄屏功能的小程式。其中，本文的錄音小程式是當時為了熟悉錄音流程而特意開發來練手的。當然

4.基於FFMPEG將音訊解碼為PCM

繼續FFMPEG學習之路，前面瞭解了將PCM編碼為AAC檔案，接下來則需要了解一下解碼方面，將MP3/AAC等音訊格式解碼為PCM資料，記錄一下過程。。。 1）解碼流程整個解碼流程採用虛擬碼大致如下：初始化複用器和解複用器—>獲取輸入檔案的一些資訊—->查詢解碼器

視訊幀數（圖片）提取及儲存方法---ffmpeg

視訊幀數（圖片）提取及儲存方法—ffmpeg 環境：Ubuntu16.04、Python3.5、anaconda3 任務需要，要從視訊裡提取一定幀數的圖片，查了不少方法，也試了不少方法，很多都不可行，也有可能是配置的問題，沒細究，下面把親測可行的拿出來分享，配上關鍵操作的輸出效果：

最簡單的基於FFMPEG的音訊編碼器（PCM編碼為AAC）

本文介紹一個最簡單的基於FFMPEG的音訊編碼器。該編碼器實現了PCM音訊取樣資料編碼為AAC的壓縮編碼資料。編碼器程式碼十分簡單，但是每一行程式碼都很重要。通過看本編碼器的原始碼，可以瞭解FFMPEG音訊編碼的流程。本程式使用最新版的類庫（編譯時間為2014.5.6），開發平

ffmpeg4教程2:採集桌面聲音儲存為pcm

基於vs2017 vc++ ffmpeg4.0.2下測試 ffmpeg 環境配置請百度（vs2017 ffmpeg ）影象和聲音請安裝dshow便於查詢部分方法在https://blog.csdn.net/Java_lilin/article/details/8511

ffmpeg 實現RTSP/RTMP 從伺服器拉音視訊流，儲存為h264和AAC

int my_av_bsf_filter(const AVBitStreamFilter *filter, AVPacket *pPacket, const AVCodecParameters *src) { int ret; AVBSFContext *ctx = NULL; if (!fi

新版ffmpeg PCM編碼到AAC，swr_convert轉換取樣精度，稍微修改相容PCM編碼為G711A及MP3，記錄下。

#include "stdafx.h" #include <stdio.h> #include <iostream> using namespace std; extern "C" { #include "libavformat/avformat.h" #incl

京東豬臉識別比賽資料預處理：用Python將視訊每一幀提取儲存為圖片

最近參加京東的豬臉識別比賽，訓練集是30個視訊，需要將視訊的每一幀提取出來儲存為圖片，存入對應的資料夾（分類標籤）。本例是直接呼叫了cv2 模組中的 VideoCapture。一次執行，大概10分鐘，就能得到預處理後的分類圖片了，具體程式碼如下。

libjpeg庫編碼圖片為jpg(ffmpeg解碼視訊儲存圖片：RGB格式點陣圖壓縮為jpg格式圖片)

壓縮流程（結合網上大家的資料以及libjpeg庫的example.c示例：都大同小異）： 1、如何分配和初始化一個jpeg壓縮物件：在libjpeg中jpeg壓縮物件被定義為struct

利用ffmpeg進行攝像頭提取視訊編碼為h264通過RTP傳送資料到指定的rtp地址

話不多說命令如下： ffmpeg -f dshow -i video="Logitech QuickCam Easy/Cool" -vcodec libx264 -preset:v ultrafast -tune:v zerolatency -f rtp rtp://127

python 將MP3格式轉換為WAV格式（ffmpeg安裝，使用pycharm安裝包）

首先，安裝pydub，pydub是python的一個音訊處理庫處理，能對wav格式的音訊直接進行處理。如果要進行其他格式的處理就要安裝ffmpeg。所以這裡安裝pydub和ffmpeg。一：安裝pydub：你可以直接在終端安裝：pip install pydub

使用ffmpeg將BMP圖片編碼為x264視訊檔案,將H264視訊儲存為BMP圖片,yuv視訊檔案儲存為圖片的程式碼

#include <stdio.h> #include <stdlib.h> #include <string.h> #include <windows.h> #ifdef __cplusplus extern "C" { #endif #include

Android 音視訊深入十七 FFmpeg 獲取RTMP流儲存為flv （附原始碼下載）

專案地址 https://github.com/979451341/RtmpSave 這個專案主要程式碼我是從雷神那弄過來的，不愧是雷神，我就配個環境搞個介面就可以用程式碼了。這一次說的是將RTMP流媒體儲存成為一個本地的FLV檔案。因為播放視訊本身佔有很多技術難點，我先不

獲取視訊的每一幀，並儲存為.jpg圖片

#include<opencv2\opencv.hpp> #include <iostream> #include <stdio.h> #include<fstream> using namespace std; using names

簡單知識點例項之一：如何將各個單一獲取的資料儲存為陣列物件並將其取出

一、將獲取的值存為陣列或陣列物件（1）存為陣列（例如所有怪物的id值可以存為陣列）是以逗號隔開的，建議用到存單個特定值時用（如光存id值時） <!DOCTYPE html> <html lang="en"> <head> <

C#實戰小技巧（八）：將剪下板中的內容儲存為圖片

進行C#開發時，可以將複製到剪下板中的內容轉為HTML檔案，再將HTML頁面轉為圖片進行儲存，示例效果如下。被複制的Excel表格：生成的圖片：實現上述功能的主要程式碼如下，能夠將從Word、Excel、網頁等地方複製的內容匯出，並儲存為圖片。程式碼：

爬蟲資料儲存為csv檔案時，表格中間隔有空行問題

問題描述：將爬取的資料儲存的csv檔案，遇到幾個問題，原始碼如下： with open('F:\\Pythontest1\\douban.csv','w') as f: writer = csv.writer(f,dialect='excel') writer.writero

linux終端儲存為文字檔案

1. 只儲存一個命令的結果時候 ls>ls.txt 會覆蓋檔案原有內容 ls>>ls.txt 會新增到檔案末尾 2. tee 命令 ls | tee ls.txt 會覆蓋檔案原有內容 ls | tee -a ls.txt 會新增到檔案末尾

將頁面內容儲存為圖片顯示，長按儲存至本地（html2canvas）

載入的html2canvas為官網上的新版本。 style樣式: *{ margin: 0;padding: 0; font-family: "微軟雅黑"; } html,body{ width: 100%; } #capture,#imgDiv{ width: 100%; } .imgD

ffmpeg 提取pcm 儲存為wav

相關推薦