ffmpeg官方例程3学习-给视频播放加上声音

在上一篇中简单设计了一个视频播放器，但是没有声音，于是本篇的代码就是在上一篇的基础上加上声音。
在ffmpeg给的官方例程中，给视频添加声音是有问题的，这一块可以参考下面的这篇博客：
http://www.cnblogs.com/ansersion/p/5265033.html
其中，与ffmpeg以前的版本相比，播放声音这部分增加了重采样的概念，我添加声音的这块代码也是参考这篇博客得来。
代码是在上一篇的基础上添加的，对之前的代码几乎没有删改。程序最终的运行效果是：视频播放得很快（因为还没有做音视频同步，视频帧解码完就立即显示），但声音可以正常播放。
开发环境：
　　操作系统：ubuntu14
　　ffmpeg版本：3.2.2
　　sdl版本：2
编译与运行：
gcc -g main.c -o test -I /usr/local/ffmpeg/include -L /usr/local/ffmpeg/lib -lavutil -lavformat -lavcodec -lswresample -lz -lavutil -lswscale -L /usr/lib/x86_64-linux-gnu -lSDL2 -lSDL2main（其中路径按照自己的安装路径来 -g 是加GDB调试；代码用到了 swr_* 重采样函数，所以必须链接 -lswresample）
./test
  1 #ifdef _cplusplus  2 extern "C"  3 {  4 #endif  5   6 #include<stdio.h>  7 #include<assert.h>  8 #include<libavcodec/avcodec.h>  9 #include<libavformat/avformat.h> 10 #include<libavutil/avutil.h> 11 #include<libswscale/swscale.h> 12 #include <libswresample/swresample.h> 13 #include<libavutil/avutil.h> 14 #include<libavutil/imgutils.h> 15 #include<SDL2/SDL.h> 16 #include<SDL2/SDL_thread.h> 17  18 //是否将YUV420P内容输出到文件 19 #define OUTPUT_YUV420P 0 20 //要播放的文件路径 21 #define filename "/home/sns/test.flv" 22 //要输出YUV420P内容的文件路径 23 #define outfilename "/home/sns/output.yuv" 24  25 #define SDL_AUDIO_BUFFER_SIZE 1024 26 #define MAX_AUDIO_FRAME_SIZE 192000 27 //结构体定义 28 typedef struct PacketQueue{ 29     AVPacketList *first_pkt,*last_pkt;//队首、队尾 30     int nb_packets;    //包的个数 31     int size;//队列的字节数 32     SDL_mutex *mutex;//互斥量 33     SDL_cond    *cond;//条件变量 34 }PacketQueue; 35  36 typedef struct AudioParams { 37     int freq; 38     int channels; 39     int64_t channel_layout; 40     enum AVSampleFormat fmt; 41     int frame_size; 42     int bytes_per_sec; 43 } AudioParams; 44 //函数定义 45 static void audio_callback(void *userdata, Uint8 * stream, int len);// 46 static int packet_queue_get(PacketQueue *q,AVPacket *pkt,int block); 47 int    packet_queue_put(PacketQueue *q,AVPacket *pkt); 48 void packet_queue_init(PacketQueue *q); 49 static int audio_decode_frame(AVCodecContext *aCodecCtx,uint8_t *audio_buf,int buf_size); 50 int resample(AVFrame *af,uint8_t *audio_buf,int *audio_buf_size); 51  52 //全局变量定义 53 int quit =0; 54 PacketQueue audioQ; 55 int sample_rate, nb_channels; 56 int64_t channel_layout; 57 struct SwrContext * swr_ctx = NULL; 58 AudioParams audio_hw_params_tgt; 59 AudioParams audio_hw_params_src; 60  61 //主函数 62 int main(int argc, char **argv) 63 { 64     //变量定义********************************************************************* 65     AVFormatContext *pFormatCtx; 66     int i=0; 67     int videoStream; 68     int audioStream; 69     AVCodecContext 
*pCodecCtx; 70     AVCodecContext  *aCodecCtxOrig; 71     AVCodecContext *aCodecCtx; 72     AVCodec *pCodec; 73     AVCodec *aCodec; 74     AVFrame *pFrame; 75     AVFrame *pFrameYUV; 76     uint8_t *buffer; 77     int numBytes; 78  79     SDL_Window *screen; 80     SDL_Renderer *sdlRender; 81     SDL_Texture *sdlTexture; 82     SDL_Rect sdlRect; 83     int frameFinished; 84     AVPacket packet; 85     struct SwsContext *img_convert_ctx; 86     int err_code; 87     char buf[1024]; 88     FILE *fp_yuv; 89     int y_size; 90     SDL_AudioSpec audioSpec; 91     SDL_AudioSpec spec; 92     SDL_Event       event; 93     //******************************************************************************* 94     av_register_all(); 95     //1、打开视频文件************************************************* 96     pFormatCtx = avformat_alloc_context(); 97     err_code = avformat_open_input(&pFormatCtx, filename, NULL, NULL); 98     if (err_code != 0) 99     {//打开文件失败100         av_strerror(err_code, buf, 1024);101         printf("coundn't open the file!,error code = %d(%s)\n", err_code, buf);102         return -1;103     }104     if (avformat_find_stream_info(pFormatCtx, NULL) < 0)105     {106         printf("Couldn't find stream information.\n");107         return -1;108     }109     // 打印信息110       av_dump_format(pFormatCtx, 0, filename, 0);111     //2、找到第一个视频流和第一个音频流****************************112     videoStream = -1;113     audioStream = -1;114     for (i = 0; i < pFormatCtx->nb_streams; i++)115     {116         if (pFormatCtx->streams[i]->codec->codec_type == AVMEDIA_TYPE_VIDEO && videoStream<0)117         {118             videoStream = i;//得到视频流的索引119         }120         if(pFormatCtx->streams[i]->codec->codec_type == AVMEDIA_TYPE_AUDIO &&audioStream < 0)121         {122             audioStream = i;//得到音频流的索引123         }124     }125     if (videoStream == -1)126     {127         printf("Didn't find a video stream.\n");128         return -1;129     }130     if(audioStream == 
-1)131     {132         printf("coundn't find a audio stream!\n");133         return -1;134     }135     /* 3、从视频流中得到一个音频和视频编解码上下文,里面包含了编解码器的所有信息和一个136     指向真正的编解码器     ,然后我们找到音频和视频编解码器*/137     pCodecCtx = pFormatCtx->streams[videoStream]->codec;138     aCodecCtxOrig = pFormatCtx->streams[audioStream]->codec;139     pCodec = avcodec_find_decoder(pCodecCtx->codec_id);140     aCodec = avcodec_find_decoder(aCodecCtxOrig->codec_id);141     if (pCodec == NULL)142     {143         fprintf(stderr, "Unsupported codec !\n");144         return -1;145     }146     if(aCodec == NULL)147     {148         fprintf(stderr,"Unsupported codec!\n");149         return -1;150     }151     //拷贝上下文152     aCodecCtx = avcodec_alloc_context3(aCodec);153     if(avcodec_copy_context(aCodecCtx,aCodecCtxOrig) != 0)154     {155         fprintf(stderr,"couldn't copy codec context!\n");156         return -1;157     }158     //4、打开音频和视频编解码器159     if (avcodec_open2(pCodecCtx, pCodec, NULL) < 0)160     {161         printf("cann't open the codec!\n");162         return -1;163     }164     if(avcodec_open2(aCodecCtx,aCodec,NULL) < 0 )165     {166         printf("cann't open the audio codec!\n");167         return -1;168     }169     //设置声音参数170     sample_rate = aCodecCtx->sample_rate;171     nb_channels = aCodecCtx->channels;172     channel_layout = aCodecCtx->channel_layout;173 174 //    printf("channel_layout=%" PRId64 "\n", channel_layout);175     printf("nb_channels=%d\n", nb_channels);176     printf("freq=%d\n", sample_rate);177 178     if (!channel_layout|| nb_channels != av_get_channel_layout_nb_channels(channel_layout))179     {180         channel_layout = av_get_default_channel_layout(nb_channels);181         channel_layout &= ~AV_CH_LAYOUT_STEREO_DOWNMIX;182         printf("correction\n");183     }184     /*通故编解码上下文中的所有信息来建立音频的信息*/185     audioSpec.freq = aCodecCtx->sample_rate;186     audioSpec.format = AUDIO_S16SYS;187     audioSpec.channels = aCodecCtx->channels;188     
audioSpec.silence = 0;189     audioSpec.samples = SDL_AUDIO_BUFFER_SIZE;190     audioSpec.callback = audio_callback;191     audioSpec.userdata = aCodecCtx;192     //打开音频设备和初始化193     if(SDL_OpenAudio(&audioSpec,&spec) < 0)194     //其中回调函数在需要更多音频数据的时候被调用（即播放完后需要从回调取数据播放）195     {196         fprintf(stderr,"SDL_OpenAudio:    %s\n",SDL_GetError());197         return -1;198     }199     printf("freq: %d\tchannels: %d\n", spec.freq, spec.channels);200     //5、分配两个视频帧，一个保存得到的原始视频帧，一个保存为指定格式的视频帧（该帧通过原始帧转换得来）201     pFrame = av_frame_alloc();202     if (pFrame == NULL)203     {204         printf("pFrame alloc fail!\n");205         return -1;206     }207     pFrameYUV = av_frame_alloc();208     if (pFrameYUV == NULL)209     {210         printf("pFrameYUV alloc fail!\n");211         return -1;212     }213     //6、得到一帧视频截图的内存大小并分配内存，并将YUV数据填充进去214     numBytes = av_image_get_buffer_size(AV_PIX_FMT_YUV420P, pCodecCtx->width,215             pCodecCtx->height,1);216     buffer = (uint8_t*) av_mallocz(numBytes * sizeof(uint8_t));217     if (!buffer)218     {219         printf("numBytes :%d , buffer malloc 's mem \n", numBytes);220         return -1;221     }222     //打印信息223     printf("--------------- File Information ----------------\n");224     av_dump_format(pFormatCtx, 0, filename, 0);225     printf("-------------------------------------------------\n");226     av_image_fill_arrays(pFrameYUV->data, pFrameYUV->linesize,buffer,227             AV_PIX_FMT_YUV420P,pCodecCtx->width, pCodecCtx->height,1);228     //7、得到指定转换格式的上下文**********************************229     img_convert_ctx = sws_getContext(pCodecCtx->width, pCodecCtx->height,230             pCodecCtx->pix_fmt, pCodecCtx->width, pCodecCtx->height,231             AV_PIX_FMT_YUV420P,232             SWS_BICUBIC,233             NULL, NULL, NULL);234     if (img_convert_ctx == NULL)235     {236         fprintf(stderr, "Cannot initialize the conversion context!\n");237         return -1;238     }239     
//***********************************************************240 #if OUTPUT_YUV420P241     fp_yuv = fopen(outfilename, "wb+");242 #endif243     //8、SDL初始化和创建多重windows等准备工作244     if (SDL_Init(SDL_INIT_AUDIO | SDL_INIT_TIMER | SDL_INIT_VIDEO))245     {246         fprintf(stderr, "Could not initialize SDL - %s\n", SDL_GetError());247         return -1;248     }249     //使用SDL_CreateWindow代替SDL_SetVideoMode250     //创建一个给定高度和宽度、位置和标示的windows。251     screen = SDL_CreateWindow("Simplest ffmpeg player's Window",252     SDL_WINDOWPOS_UNDEFINED, SDL_WINDOWPOS_UNDEFINED, pCodecCtx->width,253             pCodecCtx->height, SDL_WINDOW_OPENGL);254     if (!screen)255     {256         fprintf(stderr, "SDL: could not create window - exiting - %s\n",SDL_GetError());257         return -1;258     }259     //对该window创建一个2D渲染上下文260     sdlRender = SDL_CreateRenderer(screen, -1, 0);261     if (!sdlRender)262     {263         fprintf(stderr, "SDL:cound not create render :    %s\n", SDL_GetError());264         return -1;265     }266     //Create a texture for a rendering context.267     //为一个渲染上下文创建一个纹理268     //IYUV: Y + U + V  (3 planes)269     //YV12: Y + V + U  (3 planes)270     sdlTexture = SDL_CreateTexture(sdlRender, SDL_PIXELFORMAT_IYUV,271             SDL_TEXTUREACCESS_STREAMING, pCodecCtx->width, pCodecCtx->height);272     if (!sdlTexture)273     {274         fprintf(stderr, "SDL:cound not create Texture :    %s\n", SDL_GetError());275         return -1;276     }277     //建立一个矩形变量，提供后面使用278     sdlRect.x = 0;279     sdlRect.y = 0;280     sdlRect.w = pCodecCtx->width;281     sdlRect.h = pCodecCtx->height;282     //*****************************************************283     //声音部分代码284     audio_hw_params_tgt.fmt = AV_SAMPLE_FMT_S16;285     audio_hw_params_tgt.freq = spec.freq;286     audio_hw_params_tgt.channel_layout = channel_layout;287     audio_hw_params_tgt.channels = spec.channels;288     audio_hw_params_tgt.frame_size = av_samples_get_buffer_size(NULL,289     
audio_hw_params_tgt.channels, 1, audio_hw_params_tgt.fmt, 1);290     audio_hw_params_tgt.bytes_per_sec = av_samples_get_buffer_size(NULL,291             audio_hw_params_tgt.channels, audio_hw_params_tgt.freq,292             audio_hw_params_tgt.fmt, 1);293     if (audio_hw_params_tgt.bytes_per_sec <= 0|| audio_hw_params_tgt.frame_size <= 0)294     {295         printf("size error\n");296         return -1;297     }298     audio_hw_params_src = audio_hw_params_tgt;299     //*****************************************************300     packet_queue_init(&audioQ);301     SDL_PauseAudio(0);302     //9、正式开始读取数据*****************************************303     while (av_read_frame(pFormatCtx, &packet) >= 0)304     {305         //如果读取的包来自视频流306         if (packet.stream_index == videoStream)307         {308             //从包中得到解码后的帧309             if (avcodec_decode_video2(pCodecCtx, pFrame, &frameFinished,&packet) < 0)310             {311                 printf("Decode Error!\n");312                 return -1;313             }314             //如果确定完成得到该视频帧315             if (frameFinished)316             {317                 //转换帧数据格式318                 sws_scale(img_convert_ctx, pFrame->data, pFrame->linesize, 0,319                         pCodecCtx->height,320                         pFrameYUV->data,321                         pFrameYUV->linesize);322 #if OUTPUT_YUV420P323                 y_size = pCodecCtx->width * pCodecCtx->height;324                 fwrite(pFrameYUV->data[0], 1, y_size, fp_yuv);    //Y325                 fwrite(pFrameYUV->data[1], 1, y_size / 4, fp_yuv);  //U326                 fwrite(pFrameYUV->data[2], 1, y_size / 4, fp_yuv);  //V327 #endif328                 //SDL显示~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~329 #if 0330                 SDL_UpdateTexture(sdlTexture,NULL,pFrameYUV->data[0],pFrameYUV->linesize[0]);331 #else332                 SDL_UpdateYUVTexture(sdlTexture, &sdlRect, pFrameYUV->data[0],333                         
pFrameYUV->linesize[0], pFrameYUV->data[1],334                         pFrameYUV->linesize[1], pFrameYUV->data[2],335                         pFrameYUV->linesize[2]);336 #endif337                 SDL_RenderClear(sdlRender);338                 SDL_RenderCopy(sdlRender, sdlTexture, NULL, &sdlRect);339                 SDL_RenderPresent(sdlRender);340                 //结束SDL~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~341             }342         }343         else if(packet.stream_index == audioStream)344         {345                 packet_queue_put(&audioQ,&packet);346         }else{347                 av_free_packet(&packet);//释放读出来的包348         }349         SDL_PollEvent(&event);350         switch (event.type)351         {352         case SDL_QUIT:353             quit = 1;354             SDL_Quit();355             exit(0);356             break;357         default:358             break;359         }360     }361     while(1) SDL_Delay(1000);362     //**************************************************************************************363     //10、释放分配的内存或关闭文件等操作364 #if OUTPUT_YUV420P365     fclose(fp_yuv);366 #endif367     sws_freeContext(img_convert_ctx);368     SDL_Quit();369     av_free(buffer);370     av_free(pFrame);371     av_free(pFrameYUV);372     avcodec_close(pCodecCtx);373     avcodec_close(aCodecCtxOrig);374     avcodec_close(aCodecCtx);375     avformat_close_input(&pFormatCtx);376     return EXIT_SUCCESS;377 }378 379 380 static void audio_callback(void *userdata, Uint8 * stream, int len)381 {382     AVCodecContext *aCodecCtx = (AVCodecContext*)userdata;383     int len1,audio_size;384     static uint8_t audio_buf[(MAX_AUDIO_FRAME_SIZE*3)/2];385     static unsigned int audio_buf_size = 0;386     static unsigned int audio_buf_index =0;387     while(len>0){388         if(audio_buf_index >= audio_buf_size){389             audio_size = audio_decode_frame(aCodecCtx,audio_buf,sizeof(audio_buf));390             if(audio_size < 0){391                
 audio_buf_size = 1024;392                 memset(audio_buf,0,audio_buf_size);393             }else{394                 audio_buf_size = audio_size;395             }396             audio_buf_index = 0;397         }398         len1 = audio_buf_size - audio_buf_index;399         if(len1 > len)400         len1 = len;401         memcpy(stream, (uint8_t *)audio_buf + audio_buf_index, len1);402         len -= len1;403         stream += len1;404         audio_buf_index += len1;405     }406 }407 408 void packet_queue_init(PacketQueue *q)409 {410     memset(q,0,sizeof(PacketQueue));411     q->mutex = SDL_CreateMutex();412     q->cond = SDL_CreateCond();413 }414 415 int    packet_queue_put(PacketQueue *q,AVPacket *pkt)416 {417     AVPacketList *pkt1;418     if(av_dup_packet(pkt)<0)419     {420         printf("dup packet error!\n");421         return -1;422     }423     pkt1 = av_malloc(sizeof(AVPacketList));424     if(!pkt1)425     {426         printf("malloc AVPacketList error!\n");427         return -1;428     }429     pkt1->pkt = *pkt;430     pkt1->next = NULL;431     SDL_LockMutex(q->mutex);432     if(!q->last_pkt){433         q->first_pkt = pkt1;434     }else{435         q->last_pkt->next = pkt1;436     }437     q->last_pkt = pkt1;438     q->nb_packets ++;439     q->size +=pkt1->pkt.size;440     SDL_CondSignal(q->cond);441     SDL_UnlockMutex(q->mutex);442     return 0;443 }444 static int packet_queue_get(PacketQueue *q,AVPacket *pkt,int block){445     int ret;446     AVPacketList *pkt1;447     SDL_LockMutex(q->mutex);448     for(;;){449         if(quit){450             printf("packet_queue has quit!\n");451             ret =-1;452             break;453         }454         pkt1 = q->first_pkt;455         if(pkt1){456             q->first_pkt = pkt1->next;457             if(!q->first_pkt){458                 q->last_pkt = NULL;459             }460             q->nb_packets--;461             q->size -= pkt1->pkt.size;462             *pkt = pkt1->pkt;463             
av_free(pkt1);464             ret =1;465             break;466         }else if(!block){467             ret =0;468             break;469         }else{470             SDL_CondWait(q->cond,q->mutex);//做了解锁互斥量的动作471         }472     }473     SDL_UnlockMutex(q->mutex);474     return ret;475 }476 static int audio_decode_frame(AVCodecContext *aCodecCtx,uint8_t *audio_buf,int buf_size)477 {478     static AVPacket pkt;479     static uint8_t *audio_pkt_data = NULL;480     static int audio_pkt_size = 0;481     int len1,data_size=0;482     static AVFrame frame;483     int got_frame=0;484 485     for(;;){486         while(audio_pkt_size >0 ){487             len1 = avcodec_decode_audio4(aCodecCtx, &frame, &got_frame, &pkt);488             if (len1 < 0)489             {490                 /* if error, skip frame */491                 audio_pkt_size = 0;492                 break;493             }494             audio_pkt_data += len1;495             audio_pkt_size -= len1;496             data_size =0;497             if(got_frame){498                 data_size = resample(&frame, audio_buf, &buf_size);499                 assert(data_size <= buf_size);500             }501             if (data_size <= 0)502             {503                 /* No data yet, get more frames */504                 continue;505             }506             /* We have data, return it and come back for more later */507             return data_size;508         }509         if (pkt.data)510             av_free_packet(&pkt);511         if (quit)512         {513             return -1;514         }515         if (packet_queue_get(&audioQ, &pkt, 1) < 0)516         {517             printf("packet_queue_get error!\n");518             return -1;519         }520         audio_pkt_data = pkt.data;521         audio_pkt_size = pkt.size;522     }523     return 1;524 }525 526 //重采样527 int resample(AVFrame *af, uint8_t *audio_buf, int *audio_buf_size)528 {529     int data_size = 0;530     int resampled_data_size = 0;531    
 int64_t dec_channel_layout;532     data_size = av_samples_get_buffer_size(NULL,533             av_frame_get_channels(af),534             af->nb_samples,535             af->format, 1);536     dec_channel_layout =(af->channel_layout&&537             av_frame_get_channels(af)== av_get_channel_layout_nb_channels(538                                     af->channel_layout)) ?539                     af->channel_layout :540                     av_get_default_channel_layout(av_frame_get_channels(af));541     if (af->format != audio_hw_params_src.fmt542             || af->sample_rate != audio_hw_params_src.freq543             || dec_channel_layout != audio_hw_params_src.channel_layout544             || !swr_ctx)545     {546         swr_free(&swr_ctx);547         swr_ctx = swr_alloc_set_opts(NULL, audio_hw_params_tgt.channel_layout,548                 audio_hw_params_tgt.fmt, audio_hw_params_tgt.freq,549                 dec_channel_layout, af->format, af->sample_rate, 0, NULL);550         if (!swr_ctx || swr_init(swr_ctx) < 0)551         {552             av_log(NULL, AV_LOG_ERROR,553                     "Cannot create sample rate converter for conversion of %d Hz %s %d channels to %d Hz %s %d channels!\n",554                     af->sample_rate, av_get_sample_fmt_name(af->format),555                     av_frame_get_channels(af), audio_hw_params_tgt.freq,556                     av_get_sample_fmt_name(audio_hw_params_tgt.fmt),557                     audio_hw_params_tgt.channels);558             swr_free(&swr_ctx);559             return -1;560         }561         printf("swr_init\n");562         audio_hw_params_src.channels = av_frame_get_channels(af);563         audio_hw_params_src.fmt = af->format;564         audio_hw_params_src.freq = af->sample_rate;565     }566 567     if (swr_ctx)568     {569         const uint8_t **in = (const uint8_t **) af->extended_data;570         uint8_t **out = &audio_buf;571         int out_count = (int64_t) af->nb_samples * 
audio_hw_params_tgt.freq572                 / af->sample_rate + 256;573         int out_size = av_samples_get_buffer_size(NULL,574                 audio_hw_params_tgt.channels, out_count,575                 audio_hw_params_tgt.fmt, 0);576         int len2;577         if (out_size < 0)578         {579             av_log(NULL, AV_LOG_ERROR, "av_samples_get_buffer_size() failed\n");580             return -1;581         }582         av_fast_malloc(&audio_buf, audio_buf_size, out_size);583         if (!audio_buf)584             return AVERROR(ENOMEM);585         len2 = swr_convert(swr_ctx, out, out_count, in, af->nb_samples);586         if (len2 < 0)587         {588             av_log(NULL, AV_LOG_ERROR, "swr_convert() failed\n");589             return -1;590         }591         if (len2 == out_count)592         {593             av_log(NULL, AV_LOG_WARNING,594                     "audio buffer is probably too small\n");595             if (swr_init(swr_ctx) < 0)596                 swr_free(&swr_ctx);597         }598         resampled_data_size = len2 * audio_hw_params_tgt.channels599                 * av_get_bytes_per_sample(audio_hw_params_tgt.fmt);600     }601     else602     {603         audio_buf = af->data[0];604         resampled_data_size = data_size;605     }606 607     return resampled_data_size;608 }609 610 #ifdef _cplusplus611 }612 #endif
代码那么多，不好理解呀～～～～～
所以程序还是最好模块化和分文件来做才行，或者封装成一个类。
会得到最大的满足，因为它填补了你的空虚。
相关文章：

你感兴趣的文章：

标签云：