zsc09_leaf

从ffmpeg源代码分析如何解决ffmpeg编码的延迟问题(如何解决编码 0 延时)

在看到这篇文章前我已经解决了这个问题，但是知其然不知其所以然，看到原作者写的文章很详细。

于是转之，感谢原作者。

原文链接：http://blog.csdn.net/ymsdu2004/article/details/8565822

FFMPEG中如果你编码完一段视频发现视频变短了，那很有可能就是没有设置0延时的原因。

近日在做一个分布式转码服务器，编解码器采用的是开源的ffmpeg，在开发的过程中遇到一个问题：编码延迟多达5、6秒钟，也就是最初编码的几十帧并不能马上取出，而我们的要求是实时编码！虽然我对视频编码方面不是很熟悉，但根据开发的经验，我想必定可以通过设置一些参数来改变这种情况。但我本人接触ffmpeg项目时间并不长，对很多编解码方面参数的设置并不熟悉，于是google了很久，网上也有相关方面的讨论，说什么的都有，但我试了都不行，更有甚者建议修改源代码，这个可能能够解决问题，但修改源代码毕竟不是解决问题的最佳途径。于是决定分析一下源代码，跟踪源码来找出问题的根源。

首先我使用的ffmpeg源代码版本是1.0.3，同时给出我的测试代码，项目中的代码就不给出来了，我给个简单的玩具代码：

[cpp]  view plain copy 
      
     
 /**
  * @file 
  * libavcodec API use example. 
  * 
  * Note that libavcodec only handles codecs (mpeg, mpeg4, etc...), 
  * not file formats (avi, vob, mp4, mov, mkv, mxf, flv, mpegts, mpegps, etc...). See library 'libavformat' for the 
  * format handling 
  */  
   
 #if _MSC_VER  
 #define snprintf _snprintf  
 #endif  
   
 #include <stdio.h>
 #include <stdlib.h>
   
 extern "C" {  
 #include <libavutil/opt.h>        // for av_opt_set
 #include <libavcodec/avcodec.h>
 #include <libavutil/imgutils.h>
 };  
   
 /* 
  * Video encoding example 
  */  
 static void video_encode_example(const char *filename, int codec_id)  
 {  
     AVCodec *codec;  
     AVCodecContext *c= NULL;  
     int i, ret, x, y, got_output;  
     FILE *f;  
     AVFrame *picture;  
     AVPacket pkt;  
     uint8_t endcode[] = { 0, 0, 1, 0xb7 };  
   
     printf("Encode video file %s\n", filename);  
   
     /* find the mpeg1 video encoder */  
     codec = avcodec_find_encoder((AVCodecID)codec_id);  
     if (!codec) {  
         fprintf(stderr, "codec not found\n");  
         exit(1);  
     }  
   
     c = avcodec_alloc_context3(codec);  
   
     /* put sample parameters */  
     c->bit_rate = 400000;  
     /* resolution must be a multiple of two */  
     c->width = 800/*352*/;  
     c->height = 500/*288*/;  
     /* frames per second */  
     c->time_base.den = 1;  
     c->time_base.num = 25;  
     c->gop_size = 10; /* emit one intra frame every ten frames */  
     c->max_b_frames=1;  
     c->pix_fmt = PIX_FMT_YUV420P;  
   
     /* open it */  
     if (avcodec_open2(c, codec, NULL) < 0) {  
         fprintf(stderr, "could not open codec\n");  
         exit(1);  
     }  
   
     f = fopen(filename, "wb");  
     if (!f) {  
         fprintf(stderr, "could not open %s\n", filename);  
         exit(1);  
     }  
   
     picture = avcodec_alloc_frame();  
     if (!picture) {  
         fprintf(stderr, "Could not allocate video frame\n");  
         exit(1);  
     }  
     picture->format = c->pix_fmt;  
     picture->width  = c->width;  
     picture->height = c->height;  
   
     /* the image can be allocated by any means and av_image_alloc() is 
      * just the most convenient way if av_malloc() is to be used */  
     ret = av_image_alloc(picture->data, picture->linesize, c->width, c->height,  
                          c->pix_fmt, 32);  
     if (ret < 0) {  
         fprintf(stderr, "could not alloc raw picture buffer\n");  
         exit(1);  
     }  
   
     static int delayedFrame = 0;  
     /* encode 1 second of video */  
     for(i=0;i<25;i++) {  
         av_init_packet(&pkt);  
         pkt.data = NULL;    // packet data will be allocated by the encoder  
         pkt.size = 0;  
   
         fflush(stdout);  
         /* prepare a dummy image */  
         /* Y */  
         for(y=0;yheight;y++) {  
             for(x=0;xwidth;x++) {  
                 picture->data[0][y * picture->linesize[0] + x] = x + y + i * 3;  
             }  
         }  
   
         /* Cb and Cr */  
         for(y=0;yheight/2;y++) {  
             for(x=0;xwidth/2;x++) {  
                 picture->data[1][y * picture->linesize[1] + x] = 128 + y + i * 2;  
                 picture->data[2][y * picture->linesize[2] + x] = 64 + x + i * 5;  
             }  
         }  
   
         picture->pts = i;  
   
         printf("encoding frame %3d----", i);  
         /* encode the image */  
         ret = avcodec_encode_video2(c, &pkt, picture, &got_output);  
         if (ret < 0) {  
             fprintf(stderr, "error encoding frame\n");  
             exit(1);  
         }  
   
         if (got_output) {  
             printf("output frame %3d (size=%5d)\n", i-delayedFrame, pkt.size);  
             fwrite(pkt.data, 1, pkt.size, f);  
             av_free_packet(&pkt);  
         }  
         else {  
             delayedFrame++;  
             printf("no output frame\n");  
         }  
     }  
   
     /* get the delayed frames */  
     for (got_output = 1; got_output; i++) {  
         fflush(stdout);  
   
         ret = avcodec_encode_video2(c, &pkt, NULL, &got_output);  
         if (ret < 0) {  
             fprintf(stderr, "error encoding frame\n");  
             exit(1);  
         }  
   
         if (got_output) {  
             printf("output delayed frame %3d (size=%5d)\n", i-delayedFrame, pkt.size);  
             fwrite(pkt.data, 1, pkt.size, f);  
             av_free_packet(&pkt);  
         }  
     }  
   
     /* add sequence end code to have a real mpeg file */  
     fwrite(endcode, 1, sizeof(endcode), f);  
     fclose(f);  
   
     avcodec_close(c);  
     av_free(c);  
     av_freep(&picture->data[0]);  
     av_free(picture);  
     printf("\n");  
 }  
   
 int main(int argc, char **argv)  
 {  
     /* register all the codecs */  
     avcodec_register_all();  
   
     video_encode_example("test.h264", AV_CODEC_ID_H264);  
   
     system("pause");  
   
     return 0;  
 }  

运行上面的代码，我们编码25帧，发现延迟了多达18帧，如下图所示：

现在我们开始分析ffmpeg的源代码（因为ffmpeg的H.264编码器是基于X264项目的，所以我们的代码还要追踪到X264中去）：

avcodec_register_all()做了些什么

因为我们关心的是H.264的编码所以我们只关心该函数中对X264编码器做了些什么，该函数主要是注册ffmpeg提供的所有编解码器，由于该函数较长，但都是相同的动作（注册编解码器），所以我们只列出部分的代码：

[cpp]  view plain copy 
      
     
 "font-family:Courier New;">void avcodec_register_all(void)  
 {  
     static int initialized;  
   
     if (initialized)  
         return;  
     initialized = 1;  
   
     /* hardware accelerators */  
     REGISTER_HWACCEL (H263_VAAPI, h263_vaapi);  
     REGISTER_HWACCEL (H264_DXVA2, h264_dxva2);  
     ......  
   
     /* video codecs */  
     REGISTER_ENCODER (A64MULTI, a64multi);  
     REGISTER_ENCODER (A64MULTI5, a64multi5);  
     ......  
   
     /* audio codecs */  
     REGISTER_ENCDEC  (AAC, aac);  
     REGISTER_DECODER (AAC_LATM, aac_latm);  
     ......  
   
     /* PCM codecs */  
     REGISTER_ENCDEC  (PCM_ALAW, pcm_alaw);  
     REGISTER_DECODER (PCM_BLURAY, pcm_bluray);  
     ......  
   
     /* DPCM codecs */  
     REGISTER_DECODER (INTERPLAY_DPCM, interplay_dpcm);  
     REGISTER_ENCDEC  (ROQ_DPCM, roq_dpcm);  
     ......  
   
     /* ADPCM codecs */  
     REGISTER_DECODER (ADPCM_4XM, adpcm_4xm);  
     REGISTER_ENCDEC  (ADPCM_ADX, adpcm_adx);  
     ......  
   
     /* subtitles */  
     REGISTER_ENCDEC  (ASS, ass);  
     REGISTER_ENCDEC  (DVBSUB, dvbsub);  
     ......  
   
     /* external libraries */  
     REGISTER_DECODER (LIBCELT, libcelt);  
     ......  
   
 "color:#ff6666;">    //////////////////////////////////////////////  
     // 这是我们关注的libx264编码器  
     REGISTER_ENCODER (LIBX264, libx264);  
     ......  
   
     /* text */  
     REGISTER_DECODER (BINTEXT, bintext);  
     ......  
   
     /* parsers */  
     REGISTER_PARSER  (AAC, aac);  
     REGISTER_PARSER  (AAC_LATM, aac_latm);  
     ......  
   
     /* bitstream filters */  
     REGISTER_BSF     (AAC_ADTSTOASC, aac_adtstoasc);  
     REGISTER_BSF     (CHOMP, chomp);  
     ......  
 }  

很显然，我们关心的是REGISTER_ENCODER (LIBX264, libx264)，这里是注册libx264编码器：

[cpp]  view plain copy 
      
     
 /*
  * REGISTER_ENCODER(X, x): declare the external AVCodec ff_<x>_encoder and
  * pass it to avcodec_register() when CONFIG_<X>_ENCODER is non-zero.
  * X is the upper-case name used in the CONFIG_ flag, x the lower-case name
  * used in the symbol.
  */
 #define REGISTER_ENCODER(X,x) { \
           extern AVCodec ff_##x##_encoder; \
           if(CONFIG_##X##_ENCODER)  avcodec_register(&ff_##x##_encoder); }

将宏以参数LIBX264和libx264展开得到：

[cpp]  view plain copy 
      
     
 "font-family:Courier New;">{  
     extern AVCodec ff_libx264_encoder;  
     if (CONFIG_LIBX264_ENCODER)  
         avcodec_register(&ff_libx264_encoder);  
 }  

在ffmpeg中查找ff_libx264_encoder变量：

[cpp]  view plain copy 
      
     
 "font-family:Courier New;">AVCodec ff_libx264_encoder = {  
     .name             = "libx264",  
     .type             = AVMEDIA_TYPE_VIDEO,  
     .id               = AV_CODEC_ID_H264,  
     .priv_data_size   = sizeof(X264Context),  
     "color:#ff6666;">.init             = X264_init,  
     .encode2          = X264_frame,  
     .close            = X264_close,  
     .capabilities     = CODEC_CAP_DELAY | CODEC_CAP_AUTO_THREADS,  
     .long_name        = NULL_IF_CONFIG_SMALL("libx264 H.264 / AVC / MPEG-4 AVC / MPEG-4 part 10"),  
     .priv_class       = &class,  
     .defaults         = x264_defaults,  
     .init_static_data = X264_init_static,  
 };  

看到这个结构体中的init成员，我们可以推测这个成员注册的X264_init函数一定是对X264编码器的各项参数做初始化工作，这给我们提供了继续查找下去的线索，稍后我们来分析。这里有个条件判断CONFIG_LIBX264_ENCODER，我们在ffmpeg工程中查找，发现它在config.mak中，这个文件是在咱们编译ffmpeg工程时由./configure根据你的选项自动生成的，还记得我们编译时用了--enable-libx264选项吗(我们要使用X264编码器，当然要指定该选项)？所以有CONFIG_LIBX264_ENCODER=yes，因此这里可以成功注册x264编码器；如果当初没有指定该选项，编码器是不会注册进去的。

而avcodec_register则是将具体的codec注册到编解码器链表中去：

[cpp]  view plain copy 
      
     
 "font-family:Courier New;">void avcodec_register(AVCodec *codec)  
 {  
     AVCodec **p;  
     avcodec_init();  
     p = &first_avcodec;  
     while (*p != NULL) p = &(*p)->next;  
     *p = codec;  
     codec->next = NULL;  
   
     if (codec->init_static_data)  
         codec->init_static_data(codec);  
 }  

这里first_avcodec是一个全局变量，作为编解码器链表的起始位置，之后注册的编解码器都加入到这个链表中去。

avcodec_find_encoder

该函数就是在编解码器链表中找出你需要的codec，如果你之前没有注册该codec，将会查找失败。从代码中可以看出，它就是从first_avcodec开始查找每个节点，比较每个codec的id是否与你参数给的一致，如果是，则找到了，并返回之：

[cpp]  view plain copy 
      
     
 "font-family:Courier New;">AVCodec *avcodec_find_encoder(enum AVCodecID id)  
 {  
     AVCodec *p, *experimental=NULL;  
     p = first_avcodec;  
     id= remap_deprecated_codec_id(id);  
     while (p) {  
         if (av_codec_is_encoder(p) && p->id == id) {  
             if (p->capabilities & CODEC_CAP_EXPERIMENTAL && !experimental) {  
                 experimental = p;  
             } else  
                 return p;  
         }  
         p = p->next;  
     }  
     return experimental;  
 }  

至此你应该理解了为什么每次使用编码器前，我们都会先调用avcodec_register_all或者avcodec_register，你也了解到了为什么你调用了avcodec_register_all，但查找AV_CODEC_ID_H264编码器时还是会失败（因为你编译ffmpeg时未指定--enable-libx264）。

打开编码器，avcodec_open2

这个函数主要是打开你找到的编码器，所谓打开其实是设置编码器的各项参数，要设置的参数数据则是从我们设置的AVCodecContext来获得的。

[cpp]  view plain copy 
      
     
 "font-family:Courier New;">int attribute_align_arg avcodec_open2(AVCodecContext *avctx, const AVCodec *codec, AVDictionary **options)  
 {  
     int ret = 0;  
     AVDictionary *tmp = NULL;  
   
     if (avcodec_is_open(avctx))  
         return 0;  
   
     if ((!codec && !avctx->codec)) {  
         av_log(avctx, AV_LOG_ERROR, "No codec provided to avcodec_open2().\n");  
         return AVERROR(EINVAL);  
     }  
     if ((codec && avctx->codec && codec != avctx->codec)) {  
         av_log(avctx, AV_LOG_ERROR, "This AVCodecContext was allocated for %s, "  
                "but %s passed to avcodec_open2().\n", avctx->codec->name, codec->name);  
         return AVERROR(EINVAL);  
     }  
     if (!codec)  
         codec = avctx->codec;  
   
     if (avctx->extradata_size < 0 || avctx->extradata_size >= FF_MAX_EXTRADATA_SIZE)  
         return AVERROR(EINVAL);  
   
     if (options)  
         av_dict_copy(&tmp, *options, 0);  
   
     /* If there is a user-supplied mutex locking routine, call it. */  
     if (ff_lockmgr_cb) {  
         if ((*ff_lockmgr_cb)(&codec_mutex, AV_LOCK_OBTAIN))  
             return -1;  
     }  
   
     entangled_thread_counter++;  
     if(entangled_thread_counter != 1){  
         av_log(avctx, AV_LOG_ERROR, "insufficient thread locking around avcodec_open/close()\n");  
         ret = -1;  
         goto end;  
     }  
   
     avctx->internal = av_mallocz(sizeof(AVCodecInternal));  
     if (!avctx->internal) {  
         ret = AVERROR(ENOMEM);  
         goto end;  
     }  
   
     if (codec->priv_data_size > 0) {  
       if(!avctx->priv_data){  
         avctx->priv_data = av_mallocz(codec->priv_data_size);  
         if (!avctx->priv_data) {  
             ret = AVERROR(ENOMEM);  
             goto end;  
         }  
         if (codec->priv_class) {  
             *(const AVClass**)avctx->priv_data= codec->priv_class;  
             av_opt_set_defaults(avctx->priv_data);  
         }  
       }  
       if (codec->priv_class && (ret = av_opt_set_dict(avctx->priv_data, &tmp)) < 0)  
           goto free_and_end;  
     } else {  
         avctx->priv_data = NULL;  
     }  
     if ((ret = av_opt_set_dict(avctx, &tmp)) < 0)  
         goto free_and_end;  
   
     if (codec->capabilities & CODEC_CAP_EXPERIMENTAL)  
         if (avctx->strict_std_compliance > FF_COMPLIANCE_EXPERIMENTAL) {  
             av_log(avctx, AV_LOG_ERROR, "Codec is experimental but experimental codecs are not enabled, try -strict -2\n");  
             ret = -1;  
             goto free_and_end;  
         }  
   
     //We only call avcodec_set_dimensions() for non h264 codecs so as not to overwrite previously setup dimensions  
     if(!( avctx->coded_width && avctx->coded_height && avctx->width && avctx->height && avctx->codec_id == AV_CODEC_ID_H264)){  
     if(avctx->coded_width && avctx->coded_height)  
         avcodec_set_dimensions(avctx, avctx->coded_width, avctx->coded_height);  
     else if(avctx->width && avctx->height)  
         avcodec_set_dimensions(avctx, avctx->width, avctx->height);  
     }  
   
     if ((avctx->coded_width || avctx->coded_height || avctx->width || avctx->height)  
         && (  av_image_check_size(avctx->coded_width, avctx->coded_height, 0, avctx) < 0  
            || av_image_check_size(avctx->width,       avctx->height,       0, avctx) < 0)) {  
         av_log(avctx, AV_LOG_WARNING, "ignoring invalid width/height values\n");  
         avcodec_set_dimensions(avctx, 0, 0);  
     }  
   
     /* if the decoder init function was already called previously, 
        free the already allocated subtitle_header before overwriting it */  
     if (av_codec_is_decoder(codec))  
         av_freep(&avctx->subtitle_header);  
   
 #define SANE_NB_CHANNELS 128U  
     if (avctx->channels > SANE_NB_CHANNELS) {  
         ret = AVERROR(EINVAL);  
         goto free_and_end;  
     }  
   
     avctx->codec = codec;  
     if ((avctx->codec_type == AVMEDIA_TYPE_UNKNOWN || avctx->codec_type == codec->type) &&  
         avctx->codec_id == AV_CODEC_ID_NONE) {  
         avctx->codec_type = codec->type;  
         avctx->codec_id   = codec->id;  
     }  
     if (avctx->codec_id != codec->id || (avctx->codec_type != codec->type  
                            && avctx->codec_type != AVMEDIA_TYPE_ATTACHMENT)) {  
         av_log(avctx, AV_LOG_ERROR, "codec type or id mismatches\n");  
         ret = AVERROR(EINVAL);  
         goto free_and_end;  
     }  
     avctx->frame_number = 0;  
     avctx->codec_descriptor = avcodec_descriptor_get(avctx->codec_id);  
   
     if (avctx->codec_type == AVMEDIA_TYPE_AUDIO &&  
         (!avctx->time_base.num || !avctx->time_base.den)) {  
         avctx->time_base.num = 1;  
         avctx->time_base.den = avctx->sample_rate;  
     }  
   
     if (!HAVE_THREADS)  
         av_log(avctx, AV_LOG_WARNING, "Warning: not compiled with thread support, using thread emulation\n");  
   
     if (HAVE_THREADS) {  
         entangled_thread_counter--; //we will instanciate a few encoders thus kick the counter to prevent false detection of a problem  
         ret = ff_frame_thread_encoder_init(avctx, options ? *options : NULL);  
         entangled_thread_counter++;  
         if (ret < 0)  
             goto free_and_end;  
     }  
   
     if (HAVE_THREADS && !avctx->thread_opaque  
         && !(avctx->internal->frame_thread_encoder && (avctx->active_thread_type&FF_THREAD_FRAME))) {  
         ret = ff_thread_init(avctx);  
         if (ret < 0) {  
             goto free_and_end;  
         }  
     }  
     if (!HAVE_THREADS && !(codec->capabilities & CODEC_CAP_AUTO_THREADS))  
         avctx->thread_count = 1;  
   
     if (avctx->codec->max_lowres < avctx->lowres || avctx->lowres < 0) {  
         av_log(avctx, AV_LOG_ERROR, "The maximum value for lowres supported by the decoder is %d\n",  
                avctx->codec->max_lowres);  
         ret = AVERROR(EINVAL);  
         goto free_and_end;  
     }  
   
     if (av_codec_is_encoder(avctx->codec)) {  
         int i;  
         if (avctx->codec->sample_fmts) {  
             for (i = 0; avctx->codec->sample_fmts[i] != AV_SAMPLE_FMT_NONE; i++)  
                 if (avctx->sample_fmt == avctx->codec->sample_fmts[i])  
                     break;  
             if (avctx->codec->sample_fmts[i] == AV_SAMPLE_FMT_NONE) {  
                 av_log(avctx, AV_LOG_ERROR, "Specified sample_fmt is not supported.\n");  
                 ret = AVERROR(EINVAL);  
                 goto free_and_end;  
             }  
         }  
         if (avctx->codec->pix_fmts) {  
             for (i = 0; avctx->codec->pix_fmts[i] != PIX_FMT_NONE; i++)  
                 if (avctx->pix_fmt == avctx->codec->pix_fmts[i])  
                     break;  
             if (avctx->codec->pix_fmts[i] == PIX_FMT_NONE  
                 && !((avctx->codec_id == AV_CODEC_ID_MJPEG || avctx->codec_id == AV_CODEC_ID_LJPEG)  
                      && avctx->strict_std_compliance <= FF_COMPLIANCE_UNOFFICIAL)) {  
                 av_log(avctx, AV_LOG_ERROR, "Specified pix_fmt is not supported\n");  
                 ret = AVERROR(EINVAL);  
                 goto free_and_end;  
             }  
         }  
         if (avctx->codec->supported_samplerates) {  
             for (i = 0; avctx->codec->supported_samplerates[i] != 0; i++)  
                 if (avctx->sample_rate == avctx->codec->supported_samplerates[i])  
                     break;  
             if (avctx->codec->supported_samplerates[i] == 0) {  
                 av_log(avctx, AV_LOG_ERROR, "Specified sample_rate is not supported\n");  
                 ret = AVERROR(EINVAL);  
                 goto free_and_end;  
             }  
         }  
         if (avctx->codec->channel_layouts) {  
             if (!avctx->channel_layout) {  
                 av_log(avctx, AV_LOG_WARNING, "channel_layout not specified\n");  
             } else {  
                 for (i = 0; avctx->codec->channel_layouts[i] != 0; i++)  
                     if (avctx->channel_layout == avctx->codec->channel_layouts[i])  
                         break;  
                 if (avctx->codec->channel_layouts[i] == 0) {  
                     av_log(avctx, AV_LOG_ERROR, "Specified channel_layout is not supported\n");  
                     ret = AVERROR(EINVAL);  
                     goto free_and_end;  
                 }  
             }  
         }  
         if (avctx->channel_layout && avctx->channels) {  
             if (av_get_channel_layout_nb_channels(avctx->channel_layout) != avctx->channels) {  
                 av_log(avctx, AV_LOG_ERROR, "channel layout does not match number of channels\n");  
                 ret = AVERROR(EINVAL);  
                 goto free_and_end;  
             }  
         } else if (avctx->channel_layout) {  
             avctx->channels = av_get_channel_layout_nb_channels(avctx->channel_layout);  
         }  
     }  
   
     avctx->pts_correction_num_faulty_pts =  
     avctx->pts_correction_num_faulty_dts = 0;  
     avctx->pts_correction_last_pts =  
     avctx->pts_correction_last_dts = INT64_MIN;  
   
 "color:#ff6666;">    ////////////////////////////////////////////////////////////////////////////////////////////////  
     // 这里会调用编码器的中指定的初始化函数init, 对于x264编码器，也就是调用ff_libx264_encoder中指定的X264_init  
     if(avctx->codec->init && (!(avctx->active_thread_type&FF_THREAD_FRAME) || avctx->internal->frame_thread_encoder)){  
         ret = avctx->codec->init(avctx);  
         if (ret < 0) {  
             goto free_and_end;  
         }  
     }  
     ////////////////////////////////////////////////////////////////////////////////////////////////  
   
     ret=0;  
   
     if (av_codec_is_decoder(avctx->codec)) {  
         if (!avctx->bit_rate)  
             avctx->bit_rate = get_bit_rate(avctx);  
         /* validate channel layout from the decoder */  
         if (avctx->channel_layout &&  
             av_get_channel_layout_nb_channels(avctx->channel_layout) != avctx->channels) {  
             av_log(avctx, AV_LOG_WARNING, "channel layout does not match number of channels\n");  
             avctx->channel_layout = 0;  
         }  
     }  
 end:  
     entangled_thread_counter--;  
   
     /* Release any user-supplied mutex. */  
     if (ff_lockmgr_cb) {  
         (*ff_lockmgr_cb)(&codec_mutex, AV_LOCK_RELEASE);  
     }  
     if (options) {  
         av_dict_free(options);  
         *options = tmp;  
     }  
   
     return ret;  
 free_and_end:  
     av_dict_free(&tmp);  
     av_freep(&avctx->priv_data);  
     av_freep(&avctx->internal);  
     avctx->codec= NULL;  
     goto end;  
 }  

看看我们在代码中标注的那几行代码：

[cpp]  view plain copy 
      
     
 "font-family:Courier New;">if(avctx->codec->init && (!(avctx->active_thread_type&FF_THREAD_FRAME) || avctx->internal->frame_thread_encoder)){  
         ret = avctx->codec->init(avctx);  
         if (ret < 0) {  
             goto free_and_end;  
         }  
     }  

这里如果codec的init成员指定了对codec的初始化函数时，它会调用该初始化函数，通过前面的分析我们知道，X264编码器的初始化函数指定为X264_init，该函数的参数即是我们给定的AVCodecContext，下面我们来看看X264_init做了些什么。

X264编码器的初始化，X264_init

首先列出源代码：

[cpp]  view plain copy 
      
     
 "font-family:Courier New;">static av_cold int X264_init(AVCodecContext *avctx)  
 {  
     X264Context *x4 = avctx->priv_data;  
     int sw,sh;  
   
     x264_param_default(&x4->params);  
   
     x4->params.b_deblocking_filter         = avctx->flags & CODEC_FLAG_LOOP_FILTER;  
   
     x4->params.rc.f_ip_factor             = 1 / fabs(avctx->i_quant_factor);  
     x4->params.rc.f_pb_factor             = avctx->b_quant_factor;  
     x4->params.analyse.i_chroma_qp_offset = avctx->chromaoffset;  
     if (x4->preset || x4->tune)  
   
 "color:#ff6666;">        ////////////////////////////////////////////////////////////////////////////////////////  
         // 在这里面会设置很多关键的参数，这个函数式X264提供的，接下来我们要到X264中查看其源代码  
         if (x264_param_default_preset(&x4->params, x4->preset, x4->tune) < 0) {  
             int i;  
             av_log(avctx, AV_LOG_ERROR, "Error setting preset/tune %s/%s.\n", x4->preset, x4->tune);  
             av_log(avctx, AV_LOG_INFO, "Possible presets:");  
             for (i = 0; x264_preset_names[i]; i++)  
                 av_log(avctx, AV_LOG_INFO, " %s", x264_preset_names[i]);  
             av_log(avctx, AV_LOG_INFO, "\n");  
             av_log(avctx, AV_LOG_INFO, "Possible tunes:");  
             for (i = 0; x264_tune_names[i]; i++)  
                 av_log(avctx, AV_LOG_INFO, " %s", x264_tune_names[i]);  
             av_log(avctx, AV_LOG_INFO, "\n");  
             return AVERROR(EINVAL);  
         }  
         /////////////////////////////////////////////////////////////////////////////////////////  
   
     if (avctx->level > 0)  
         x4->params.i_level_idc = avctx->level;  
   
     x4->params.pf_log               = X264_log;  
     x4->params.p_log_private        = avctx;  
     x4->params.i_log_level          = X264_LOG_DEBUG;  
     x4->params.i_csp                = convert_pix_fmt(avctx->pix_fmt);  
   
     OPT_STR("weightp", x4->wpredp);  
   
     if (avctx->bit_rate) {  
         x4->params.rc.i_bitrate   = avctx->bit_rate / 1000;  
         x4->params.rc.i_rc_method = X264_RC_ABR;  
     }  
     x4->params.rc.i_vbv_buffer_size = avctx->rc_buffer_size / 1000;  
     x4->params.rc.i_vbv_max_bitrate = avctx->rc_max_rate    / 1000;  
     x4->params.rc.b_stat_write      = avctx->flags & CODEC_FLAG_PASS1;  
     if (avctx->flags & CODEC_FLAG_PASS2) {  
         x4->params.rc.b_stat_read = 1;  
     } else {  
         if (x4->crf >= 0) {  
             x4->params.rc.i_rc_method   = X264_RC_CRF;  
             x4->params.rc.f_rf_constant = x4->crf;  
         } else if (x4->cqp >= 0) {  
             x4->params.rc.i_rc_method   = X264_RC_CQP;  
             x4->params.rc.i_qp_constant = x4->cqp;  
         }  
   
         if (x4->crf_max >= 0)  
             x4->params.rc.f_rf_constant_max = x4->crf_max;  
     }  
   
     if (avctx->rc_buffer_size && avctx->rc_initial_buffer_occupancy &&  
         (avctx->rc_initial_buffer_occupancy <= avctx->rc_buffer_size)) {  
         x4->params.rc.f_vbv_buffer_init =  
             (float)avctx->rc_initial_buffer_occupancy / avctx->rc_buffer_size;  
     }  
   
     OPT_STR("level", x4->level);  
   
     if(x4->x264opts){  
         const char *p= x4->x264opts;  
         while(p){  
             char param[256]={0}, val[256]={0};  
             if(sscanf(p, "%255[^:=]=%255[^:]", param, val) == 1){  
                 OPT_STR(param, "1");  
             }else  
                 OPT_STR(param, val);  
             p= strchr(p, ':');  
             p+=!!p;  
         }  
     }  
   
     if (avctx->me_method == ME_EPZS)  
         x4->params.analyse.i_me_method = X264_ME_DIA;  
     else if (avctx->me_method == ME_HEX)  
         x4->params.analyse.i_me_method = X264_ME_HEX;  
     else if (avctx->me_method == ME_UMH)  
         x4->params.analyse.i_me_method = X264_ME_UMH;  
     else if (avctx->me_method == ME_FULL)  
         x4->params.analyse.i_me_method = X264_ME_ESA;  
     else if (avctx->me_method == ME_TESA)  
         x4->params.analyse.i_me_method = X264_ME_TESA;  
   
     if (avctx->gop_size >= 0)  
         x4->params.i_keyint_max         = avctx->gop_size;  
     if (avctx->max_b_frames >= 0)  
         x4->params.i_bframe             = avctx->max_b_frames;  
     if (avctx->scenechange_threshold >= 0)  
         x4->params.i_scenecut_threshold = avctx->scenechange_threshold;  
     if (avctx->qmin >= 0)  
         x4->params.rc.i_qp_min          = avctx->qmin;  
     if (avctx->qmax >= 0)  
         x4->params.rc.i_qp_max          = avctx->qmax;  
     if (avctx->max_qdiff >= 0)  
         x4->params.rc.i_qp_step         = avctx->max_qdiff;  
     if (avctx->qblur >= 0)  
         x4->params.rc.f_qblur           = avctx->qblur;     /* temporally blur quants */  
     if (avctx->qcompress >= 0)  
         x4->params.rc.f_qcompress       = avctx->qcompress; /* 0.0 => cbr, 1.0 => constant qp */  
     if (avctx->refs >= 0)  
         x4->params.i_frame_reference    = avctx->refs;  
     if (avctx->trellis >= 0)  
         x4->params.analyse.i_trellis    = avctx->trellis;  
     if (avctx->me_range >= 0)  
         x4->params.analyse.i_me_range   = avctx->me_range;  
     if (avctx->noise_reduction >= 0)  
         x4->params.analyse.i_noise_reduction = avctx->noise_reduction;  
     if (avctx->me_subpel_quality >= 0)  
         x4->params.analyse.i_subpel_refine   = avctx->me_subpel_quality;  
     if (avctx->b_frame_strategy >= 0)  
         x4->params.i_bframe_adaptive = avctx->b_frame_strategy;  
     if (avctx->keyint_min >= 0)  
         x4->params.i_keyint_min = avctx->keyint_min;  
     if (avctx->coder_type >= 0)  
         x4->params.b_cabac = avctx->coder_type == FF_CODER_TYPE_AC;  
     if (avctx->me_cmp >= 0)  
         x4->params.analyse.b_chroma_me = avctx->me_cmp & FF_CMP_CHROMA;  
   
     if (x4->aq_mode >= 0)  
         x4->params.rc.i_aq_mode = x4->aq_mode;  
     if (x4->aq_strength >= 0)  
         x4->params.rc.f_aq_strength = x4->aq_strength;  
     PARSE_X264_OPT("psy-rd", psy_rd);  
     PARSE_X264_OPT("deblock", deblock);  
     PARSE_X264_OPT("partitions", partitions);  
     PARSE_X264_OPT("stats", stats);  
     if (x4->psy >= 0)  
         x4->params.analyse.b_psy  = x4->psy;  
     if (x4->rc_lookahead >= 0)  
         x4->params.rc.i_lookahead = x4->rc_lookahead;  
     if (x4->weightp >= 0)  
         x4->params.analyse.i_weighted_pred = x4->weightp;  
     if (x4->weightb >= 0)  
         x4->params.analyse.b_weighted_bipred = x4->weightb;  
     if (x4->cplxblur >= 0)  
         x4->params.rc.f_complexity_blur = x4->cplxblur;  
   
     if (x4->ssim >= 0)  
         x4->params.analyse.b_ssim = x4->ssim;  
     if (x4->intra_refresh >= 0)  
         x4->params.b_intra_refresh = x4->intra_refresh;  
     if (x4->b_bias != INT_MIN)  
         x4->params.i_bframe_bias              = x4->b_bias;  
     if (x4->b_pyramid >= 0)  
         x4->params.i_bframe_pyramid = x4->b_pyramid;  
     if (x4->mixed_refs >= 0)  
         x4->params.analyse.b_mixed_references = x4->mixed_refs;  
     if (x4->dct8x8 >= 0)  
         x4->params.analyse.b_transform_8x8    = x4->dct8x8;  
     if (x4->fast_pskip >= 0)  
         x4->params.analyse.b_fast_pskip       = x4->fast_pskip;  
     if (x4->aud >= 0)  
         x4->params.b_aud                      = x4->aud;  
     if (x4->mbtree >= 0)  
         x4->params.rc.b_mb_tree               = x4->mbtree;  
     if (x4->direct_pred >= 0)  
         x4->params.analyse.i_direct_mv_pred   = x4->direct_pred;  
   
     if (x4->slice_max_size >= 0)  
         x4->params.i_slice_max_size =  x4->slice_max_size;  
   
     if (x4->fastfirstpass)  
         x264_param_apply_fastfirstpass(&x4->params);  
   
     if (x4->profile)  
         if (x264_param_apply_profile(&x4->params, x4->profile) < 0) {  
             int i;  
             av_log(avctx, AV_LOG_ERROR, "Error setting profile %s.\n", x4->profile);  
             av_log(avctx, AV_LOG_INFO, "Possible profiles:");  
             for (i = 0; x264_profile_names[i]; i++)  
                 av_log(avctx, AV_LOG_INFO, " %s", x264_profile_names[i]);  
             av_log(avctx, AV_LOG_INFO, "\n");  
             return AVERROR(EINVAL);  
         }  
   
     x4->params.i_width          = avctx->width;  
     x4->params.i_height         = avctx->height;  
     av_reduce(&sw, &sh, avctx->sample_aspect_ratio.num, avctx->sample_aspect_ratio.den, 4096);  
     x4->params.vui.i_sar_width  = sw;  
     x4->params.vui.i_sar_height = sh;  
     x4->params.i_fps_num = x4->params.i_timebase_den = avctx->time_base.den;  
     x4->params.i_fps_den = x4->params.i_timebase_num = avctx->time_base.num;  
   
     x4->params.analyse.b_psnr = avctx->flags & CODEC_FLAG_PSNR;  
   
     x4->params.i_threads      = avctx->thread_count;  
     if (avctx->thread_type)  
         x4->params.b_sliced_threads = avctx->thread_type == FF_THREAD_SLICE;  
   
     x4->params.b_interlaced   = avctx->flags & CODEC_FLAG_INTERLACED_DCT;  
   
 //    x4->params.b_open_gop     = !(avctx->flags & CODEC_FLAG_CLOSED_GOP);  
   
     x4->params.i_slice_count  = avctx->slices;  
   
     x4->params.vui.b_fullrange = avctx->pix_fmt == PIX_FMT_YUVJ420P;  
   
     if (avctx->flags & CODEC_FLAG_GLOBAL_HEADER)  
         x4->params.b_repeat_headers = 0;  
   
     // update AVCodecContext with x264 parameters  
     avctx->has_b_frames = x4->params.i_bframe ?  
         x4->params.i_bframe_pyramid ? 2 : 1 : 0;  
     if (avctx->max_b_frames < 0)  
         avctx->max_b_frames = 0;  
   
     avctx->bit_rate = x4->params.rc.i_bitrate*1000;  
     x4->enc = x264_encoder_open(&x4->params);  
     if (!x4->enc)  
         return -1;  
   
     avctx->coded_frame = &x4->out_pic;  
   
     if (avctx->flags & CODEC_FLAG_GLOBAL_HEADER) {  
         x264_nal_t *nal;  
         uint8_t *p;  
         int nnal, s, i;  
   
         s = x264_encoder_headers(x4->enc, &nal, &nnal);  
         avctx->extradata = p = av_malloc(s);  
   
         for (i = 0; i < nnal; i++) {  
             /* Don't put the SEI in extradata. */  
             if (nal[i].i_type == NAL_SEI) {  
                 av_log(avctx, AV_LOG_INFO, "%s\n", nal[i].p_payload+25);  
                 x4->sei_size = nal[i].i_payload;  
                 x4->sei      = av_malloc(x4->sei_size);  
                 memcpy(x4->sei, nal[i].p_payload, nal[i].i_payload);  
                 continue;  
             }  
             memcpy(p, nal[i].p_payload, nal[i].i_payload);  
             p += nal[i].i_payload;  
         }  
         avctx->extradata_size = p - avctx->extradata;  
     }  
   
     return 0;  
 }  
   

看看我们做出标记的那几行代码，这里它调用了x264_param_default_preset(&x4->params, x4->preset, x4->tune)，所以我们接下来当然是看看这个函数了。

对编码器参数的设置，x264_param_default_preset

这个函数的定义并不在ffmpeg中，因为这是X264提供给外界对编码器做设置的API函数，于是我们在X264项目中查找该函数，它定义在Common.c中，代码如下：

[cpp]  view plain copy 
      
     
 "font-family:Courier New;">int x264_param_default_preset( x264_param_t *param, const char *preset, const char *tune )  
 {  
     x264_param_default( param );  
   
     if( preset && "color:#ff6666;">x264_param_apply_preset( param, preset ) < 0 )  
         return -1;  
     if( tune && "color:#ff6666;">x264_param_apply_tune( param, tune ) < 0 )  
         return -1;  
     return 0;  
 }  

它首先调用下x264_param_default设置默认参数，这在用户没有指定额外设置时，设置就是使用该函数默认参数，但如果用户指定了preset和(或者)tune参数时，它就会进行额外参数的设置。

首先看一下应用模式的设置：

[cpp]  view plain copy 
      
     
 "font-family:Courier New;">static int x264_param_apply_preset( x264_param_t *param, const char *preset )  
 {  
     char *end;  
     int i = strtol( preset, &end, 10 );  
     if( *end == 0 && i >= 0 && i < sizeof(x264_preset_names)/sizeof(*x264_preset_names)-1 )  
         preset = x264_preset_names[i];  
   
     if( !strcasecmp( preset, "ultrafast" ) )  
     {  
         param->i_frame_reference = 1;  
         param->i_scenecut_threshold = 0;  
         param->b_deblocking_filter = 0;  
         param->b_cabac = 0;  
         param->i_bframe = 0;  
         param->analyse.intra = 0;  
         param->analyse.inter = 0;  
         param->analyse.b_transform_8x8 = 0;  
         param->analyse.i_me_method = X264_ME_DIA;  
         param->analyse.i_subpel_refine = 0;  
         param->rc.i_aq_mode = 0;  
         param->analyse.b_mixed_references = 0;  
         param->analyse.i_trellis = 0;  
         param->i_bframe_adaptive = X264_B_ADAPT_NONE;  
         param->rc.b_mb_tree = 0;  
         param->analyse.i_weighted_pred = X264_WEIGHTP_NONE;  
         param->analyse.b_weighted_bipred = 0;  
         param->rc.i_lookahead = 0;  
     }  
     else if( !strcasecmp( preset, "superfast" ) )  
     {  
         param->analyse.inter = X264_ANALYSE_I8x8|X264_ANALYSE_I4x4;  
         param->analyse.i_me_method = X264_ME_DIA;  
         param->analyse.i_subpel_refine = 1;  
         param->i_frame_reference = 1;  
         param->analyse.b_mixed_references = 0;  
         param->analyse.i_trellis = 0;  
         param->rc.b_mb_tree = 0;  
         param->analyse.i_weighted_pred = X264_WEIGHTP_SIMPLE;  
         param->rc.i_lookahead = 0;  
     }  
     else if( !strcasecmp( preset, "veryfast" ) )  
     {  
         param->analyse.i_me_method = X264_ME_HEX;  
         param->analyse.i_subpel_refine = 2;  
         param->i_frame_reference = 1;  
         param->analyse.b_mixed_references = 0;  
         param->analyse.i_trellis = 0;  
         param->analyse.i_weighted_pred = X264_WEIGHTP_SIMPLE;  
         param->rc.i_lookahead = 10;  
     }  
     else if( !strcasecmp( preset, "faster" ) )  
     {  
         param->analyse.b_mixed_references = 0;  
         param->i_frame_reference = 2;  
         param->analyse.i_subpel_refine = 4;  
         param->analyse.i_weighted_pred = X264_WEIGHTP_SIMPLE;  
         param->rc.i_lookahead = 20;  
     }  
     else if( !strcasecmp( preset, "fast" ) )  
     {  
         param->i_frame_reference = 2;  
         param->analyse.i_subpel_refine = 6;  
         param->analyse.i_weighted_pred = X264_WEIGHTP_SIMPLE;  
         param->rc.i_lookahead = 30;  
     }  
     else if( !strcasecmp( preset, "medium" ) )  
     {  
         /* Default is medium */  
     }  
     else if( !strcasecmp( preset, "slow" ) )  
     {  
         param->analyse.i_me_method = X264_ME_UMH;  
         param->analyse.i_subpel_refine = 8;  
         param->i_frame_reference = 5;  
         param->i_bframe_adaptive = X264_B_ADAPT_TRELLIS;  
         param->analyse.i_direct_mv_pred = X264_DIRECT_PRED_AUTO;  
         param->rc.i_lookahead = 50;  
     }  
     else if( !strcasecmp( preset, "slower" ) )  
     {  
         param->analyse.i_me_method = X264_ME_UMH;  
         param->analyse.i_subpel_refine = 9;  
         param->i_frame_reference = 8;  
         param->i_bframe_adaptive = X264_B_ADAPT_TRELLIS;  
         param->analyse.i_direct_mv_pred = X264_DIRECT_PRED_AUTO;  
         param->analyse.inter |= X264_ANALYSE_PSUB8x8;  
         param->analyse.i_trellis = 2;  
         param->rc.i_lookahead = 60;  
     }  
     else if( !strcasecmp( preset, "veryslow" ) )  
     {  
         param->analyse.i_me_method = X264_ME_UMH;  
         param->analyse.i_subpel_refine = 10;  
         param->analyse.i_me_range = 24;  
         param->i_frame_reference = 16;  
         param->i_bframe_adaptive = X264_B_ADAPT_TRELLIS;  
         param->analyse.i_direct_mv_pred = X264_DIRECT_PRED_AUTO;  
         param->analyse.inter |= X264_ANALYSE_PSUB8x8;  
         param->analyse.i_trellis = 2;  
         param->i_bframe = 8;  
         param->rc.i_lookahead = 60;  
     }  
     else if( !strcasecmp( preset, "placebo" ) )  
     {  
         param->analyse.i_me_method = X264_ME_TESA;  
         param->analyse.i_subpel_refine = 11;  
         param->analyse.i_me_range = 24;  
         param->i_frame_reference = 16;  
         param->i_bframe_adaptive = X264_B_ADAPT_TRELLIS;  
         param->analyse.i_direct_mv_pred = X264_DIRECT_PRED_AUTO;  
         param->analyse.inter |= X264_ANALYSE_PSUB8x8;  
         param->analyse.b_fast_pskip = 0;  
         param->analyse.i_trellis = 2;  
         param->i_bframe = 16;  
         param->rc.i_lookahead = 60;  
     }  
     else  
     {  
         x264_log( NULL, X264_LOG_ERROR, "invalid preset '%s'\n", preset );  
         return -1;  
     }  
     return 0;  
 }  

这里定义了几种模式供用户选择，经过测试，这些模式是会影响到编码的延迟时间的，越快的模式，其延迟越小，对于"ultrafast"模式，我们发现延迟帧减少了许多，同时发现越快的模式相对于其他模式会有些花屏，但此时我发现所有模式都没有使得延迟为0的情况（此时我是直接修改源代码来固定设置为特定模式的，后面我们会讲到如何通过ffmpeg中的API来设置），于是我将希望寄托于下面的x264_param_apply_tune，我感觉这可能是我最后的救命稻草了！下面我们来看一下这个函数的源代码：

[cpp]  view plain copy 
      
     
 "font-family:Courier New;">static int x264_param_apply_tune( x264_param_t *param, const char *tune )  
 {  
     char *tmp = x264_malloc( strlen( tune ) + 1 );  
     if( !tmp )  
         return -1;  
     tmp = strcpy( tmp, tune );  
     char *s = strtok( tmp, ",./-+" );  
     int psy_tuning_used = 0;  
     while( s )  
     {  
         if( !strncasecmp( s, "film", 4 ) )  
         {  
             if( psy_tuning_used++ ) goto psy_failure;  
             param->i_deblocking_filter_alphac0 = -1;  
             param->i_deblocking_filter_beta = -1;  
             param->analyse.f_psy_trellis = 0.15;  
         }  
         else if( !strncasecmp( s, "animation", 9 ) )  
         {  
             if( psy_tuning_used++ ) goto psy_failure;  
             param->i_frame_reference = param->i_frame_reference > 1 ? param->i_frame_reference*2 : 1;  
             param->i_deblocking_filter_alphac0 = 1;  
             param->i_deblocking_filter_beta = 1;  
             param->analyse.f_psy_rd = 0.4;  
             param->rc.f_aq_strength = 0.6;  
             param->i_bframe += 2;  
         }  
         else if( !strncasecmp( s, "grain", 5 ) )  
         {  
             if( psy_tuning_used++ ) goto psy_failure;  
             param->i_deblocking_filter_alphac0 = -2;  
             param->i_deblocking_filter_beta = -2;  
             param->analyse.f_psy_trellis = 0.25;  
             param->analyse.b_dct_decimate = 0;  
             param->rc.f_pb_factor = 1.1;  
             param->rc.f_ip_factor = 1.1;  
             param->rc.f_aq_strength = 0.5;  
             param->analyse.i_luma_deadzone[0] = 6;  
             param->analyse.i_luma_deadzone[1] = 6;  
             param->rc.f_qcompress = 0.8;  
         }  
         else if( !strncasecmp( s, "stillimage", 5 ) )  
         {  
             if( psy_tuning_used++ ) goto psy_failure;  
             param->i_deblocking_filter_alphac0 = -3;  
             param->i_deblocking_filter_beta = -3;  
             param->analyse.f_psy_rd = 2.0;  
             param->analyse.f_psy_trellis = 0.7;  
             param->rc.f_aq_strength = 1.2;  
         }  
         else if( !strncasecmp( s, "psnr", 4 ) )  
         {  
             if( psy_tuning_used++ ) goto psy_failure;  
             param->rc.i_aq_mode = X264_AQ_NONE;  
             param->analyse.b_psy = 0;  
         }  
         else if( !strncasecmp( s, "ssim", 4 ) )  
         {  
             if( psy_tuning_used++ ) goto psy_failure;  
             param->rc.i_aq_mode = X264_AQ_AUTOVARIANCE;  
             param->analyse.b_psy = 0;  
         }  
         else if( !strncasecmp( s, "fastdecode", 10 ) )  
         {  
             param->b_deblocking_filter = 0;  
             param->b_cabac = 0;  
             param->analyse.b_weighted_bipred = 0;  
             param->analyse.i_weighted_pred = X264_WEIGHTP_NONE;  
         }  
         "color:#ff6666;">else if( !strncasecmp( s, "zerolatency", 11 ) )  
         {  
             param->rc.i_lookahead = 0;  
             param->i_sync_lookahead = 0;  
             param->i_bframe = 0;  
             param->b_sliced_threads = 1;  
             param->b_vfr_input = 0;  
             param->rc.b_mb_tree = 0;  
         }  
         else if( !strncasecmp( s, "touhou", 6 ) )  
         {  
             if( psy_tuning_used++ ) goto psy_failure;  
             param->i_frame_reference = param->i_frame_reference > 1 ? param->i_frame_reference*2 : 1;  
             param->i_deblocking_filter_alphac0 = -1;  
             param->i_deblocking_filter_beta = -1;  
             param->analyse.f_psy_trellis = 0.2;  
             param->rc.f_aq_strength = 1.3;  
             if( param->analyse.inter & X264_ANALYSE_PSUB16x16 )  
                 param->analyse.inter |= X264_ANALYSE_PSUB8x8;  
         }  
         else  
         {  
             x264_log( NULL, X264_LOG_ERROR, "invalid tune '%s'\n", s );  
             x264_free( tmp );  
             return -1;  
         }  
         if( 0 )  
         {  
     psy_failure:  
             x264_log( NULL, X264_LOG_WARNING, "only 1 psy tuning can be used: ignoring tune %s\n", s );  
         }  
         s = strtok( NULL, ",./-+" );  
     }  
     x264_free( tmp );  
     return 0;  
 }  

我们在代码中也看到了有几种模式供选择，每种模式都是对一些参数的具体设置，当然这些参数的意义我也不是很清楚，有待后面继续的研究，但我却惊喜地发现了一个“zerolatency”模式，这不就是我要找的实时编码模式吗，至少从字面上来讲是！于是修改源代码写死为“zerolatency”模式，编译、运行，我的天哪，终于找到了！

另外，我了解到，其实在工程编译出的可执行文件运行时也是可以指定这些运行参数的，这更加证实了我的想法。于是我得出了一个结论：

x264_param_apply_preset和x264_param_apply_tune的参数决定了编码器的全部运作方式（当然包括是否编码延迟，以及延迟多长）！

如何不修改ffmpeg或者x264工程源代码来达到实时编码

知道了影响编码延迟的原因后，我们又要上溯到ffmpeg中的X264_init代码中去了，看看该函数是如何指定x264_param_default_preset函数的参数的，为了便于讲解，我们再次列出部分代码：

[cpp]  view plain copy 
      
     
 "font-family:Courier New;">static av_cold int X264_init(AVCodecContext *avctx)  
 {  
     X264Context *x4 = avctx->priv_data;  
     int sw,sh;  
   
     x264_param_default(&x4->params);  
   
     x4->params.b_deblocking_filter         = avctx->flags & CODEC_FLAG_LOOP_FILTER;  
   
     x4->params.rc.f_ip_factor             = 1 / fabs(avctx->i_quant_factor);  
     x4->params.rc.f_pb_factor             = avctx->b_quant_factor;  
     x4->params.analyse.i_chroma_qp_offset = avctx->chromaoffset;  
     if (x4->preset || x4->tune)  
         "color:#ff6666;">/////////////////////////////////////////////////////////////////////////////////////////  
         // 主要看看这个函数，在这里面会设置很多关键的参数，这个函数式X264提供的，接下来我们要到X264中查看其源代码  
         if (x264_param_default_preset(&x4->params, x4->preset, x4->tune) < 0) {  
             int i;  
             av_log(avctx, AV_LOG_ERROR, "Error setting preset/tune %s/%s.\n", x4->preset, x4->tune);  
             av_log(avctx, AV_LOG_INFO, "Possible presets:");  
             for (i = 0; x264_preset_names[i]; i++)  
                 av_log(avctx, AV_LOG_INFO, " %s", x264_preset_names[i]);  
             av_log(avctx, AV_LOG_INFO, "\n");  
             av_log(avctx, AV_LOG_INFO, "Possible tunes:");  
             for (i = 0; x264_tune_names[i]; i++)  
                 av_log(avctx, AV_LOG_INFO, " %s", x264_tune_names[i]);  
             av_log(avctx, AV_LOG_INFO, "\n");  
             return AVERROR(EINVAL);  
         }  
         ////////////////////////////////////////////////////////////////////////////////////////  
     ......  
     ......  
 }  

这里调用x264_param_default_preset(&x4->params, x4->preset, x4->tune) ，而x4变量的类型是X264Context ，这个结构体中的参数是最终要传给X264来设置编码器参数的，我们还可以从X264Context *x4 = avctx->priv_data;中看到，x4变量其实是由AVCodecContext中的priv_data成员指定的，在AVCodecContext中priv_data是void*类型，而AVCodecContext正是我们传进来的，也就是说，我们现在终于可以想办法控制这些参数了----只要把这些参数指定给priv_data成员即可。

现在我们还是先看看X264Context 中哪些成员指定了控制实时编码的参数：

[cpp]  view plain copy 
      
     
 "font-family:Courier New;">typedef struct X264Context {  
     AVClass        *class;  
     x264_param_t    params;  
     x264_t         *enc;  
     x264_picture_t  pic;  
     uint8_t        *sei;  
     int             sei_size;  
     AVFrame         out_pic;  
     char *preset;  
     char *tune;  
     char *profile;  
     char *level;  
     int fastfirstpass;  
     char *wpredp;  
     char *x264opts;  
     float crf;  
     float crf_max;  
     int cqp;  
     int aq_mode;  
     float aq_strength;  
     char *psy_rd;  
     int psy;  
     int rc_lookahead;  
     int weightp;  
     int weightb;  
     int ssim;  
     int intra_refresh;  
     int b_bias;  
     int b_pyramid;  
     int mixed_refs;  
     int dct8x8;  
     int fast_pskip;  
     int aud;  
     int mbtree;  
     char *deblock;  
     float cplxblur;  
     char *partitions;  
     int direct_pred;  
     int slice_max_size;  
     char *stats;  
 } X264Context;  

出于本能，我第一时间发现了我最关心的两个参数：preset和tune，这正是x264_param_default_preset要用到的两个参数。

至此，我认为已经想到了解决编码延迟的解决方案了（离完美还差那么一步），于是我立马在测试代码中做出如下的修改：

[cpp]  view plain copy 
      
     
 "font-family:Courier New;">   ......    
    c = avcodec_alloc_context3(codec);  
   
     /* put sample parameters */  
     c->bit_rate = 400000;  
     /* resolution must be a multiple of two */  
     c->width = 800/*352*/;  
     c->height = 500/*288*/;  
     /* frames per second */  
     c->time_base.den = 1;  
     c->time_base.num = 25;  
     c->gop_size = 10; /* emit one intra frame every ten frames */  
     c->max_b_frames=1;  
     c->pix_fmt = PIX_FMT_YUV420P;  
   
     "color:#ff6666;">// 新增语句，设置为编码延迟  
     if (c->priv_data) {  
         ((X264Context*)(c->priv_data))->preset = "superfast";  
         ((X264Context*)(c->priv_data))->tune = "zerolatency";  
     }  
     ......  
     ......  

编译......error！原来编译器不认识X264Context，一定是忘了包含头文件，查看源代码，发现这是一个对外不公开的结构体，我无法通过包含头文件来包含该结构体，于是抱怨ffmpeg怎么搞的！也许是急于解决问题，同时验证之前的理解正确与否，我采用了最粗暴的方法，直接将该结构体复制到我的文件中，当然这个结构体中有一个名为class的成员需要更改一下名字，因为我的项目是C++开发的，而class是C++的关键字，同时也要将x264.h和x264_config.h头文件复制到你的工程中，因为X264Context中的几个成员类型如x264_param_t、x264_t等是在x264.h中定义的，而x264.h又包含x264_config.h，好在x264_config.h没有再继续包含别的文件了（这也再次证明了我们在开发的一条规范的好处：尽量在头文件中不再包含其他头文件，而是尽量使用向前声明，这样方便代码的移植）。折腾一番之后，编译代码，终于顺利通过了，此时，正如我的想象一样，编码果然没有任何延迟了！（在我的工程代码中确实没有哪怕一帧的延迟，但在这个测试代码中却存在一帧的延迟，当然一帧的延迟几乎没有任何影响），见下图运行效果：

我的目的终于达到了，同时验证我的理解也是正确的，一时间海阔天空！

但欢呼胜利之后，我却看着自己定义的那个X264Context非常别扭，于是我想，ffmpeg肯定提供了其他的途径来设置我们想要的这些参数，而不至于让用户自己手工去配置priv_data，要知道这是一个void*指针！而且ffmpeg并没有将X264Context开放给外部使用者，这让我更加怀疑我的设置方式是否合理？是否存在接口让我方便地设置priv_data?

让我欢喜的av_opt_set

带着对自己的怀疑，我继续查找资料，看源代码......终于我在一个官方的例子代码中发现了新大陆，在decoding_encoding.cpp的视频编码例子（我的测试例子正是从该例子文件中提取出来的，见该文件中的video_encode_example函数）中，我发现了下面一条语句（其实以前看例子就看到过这条语句，但当时由于没有细细研究，也没有管它的用意何在）：

[cpp]  view plain copy 
      
     
 /* Only when encoding H.264: set the "preset" option on the codec's private
  * context by name, without needing the private struct definition. */
 if(codec_id == AV_CODEC_ID_H264)
         av_opt_set(c->priv_data, "preset", "slow", 0);

于是赶紧查查看源代码：

[cpp]  view plain copy 
      
     
 /* Set the option called name on obj from its string form val.
  *
  * The option is looked up with av_opt_find2(), which also reports the object
  * that actually owns it (target_obj). The value is then parsed according to
  * the option's declared type and stored at target_obj + o->offset.
  *
  * Returns AVERROR_OPTION_NOT_FOUND when the lookup fails, AVERROR(EINVAL)
  * for a NULL val on a type that does not accept it, for an unparsable pixel
  * format, or for an option type not handled below; otherwise the result of
  * the type-specific setter (0 on the paths that store directly). */
 int av_opt_set(void *obj, const char *name, const char *val, int search_flags)
 {
     int ret;
     void *dst, *target_obj;
     const AVOption *o = av_opt_find2(obj, name, NULL, 0, search_flags, &target_obj);
     if (!o || !target_obj)
         return AVERROR_OPTION_NOT_FOUND;
     /* NULL is only accepted for string, pixel-format and image-size options. */
     if (!val && (o->type != AV_OPT_TYPE_STRING && o->type != AV_OPT_TYPE_PIXEL_FMT && o->type != AV_OPT_TYPE_IMAGE_SIZE))
         return AVERROR(EINVAL);

     /* Address of the field inside the owning object. */
     dst = ((uint8_t*)target_obj) + o->offset;
     switch (o->type) {
     case AV_OPT_TYPE_STRING:   return set_string(obj, o, val, dst);
     case AV_OPT_TYPE_BINARY:   return set_string_binary(obj, o, val, dst);
     /* All numeric kinds share one string-to-number setter. */
     case AV_OPT_TYPE_FLAGS:
     case AV_OPT_TYPE_INT:
     case AV_OPT_TYPE_INT64:
     case AV_OPT_TYPE_FLOAT:
     case AV_OPT_TYPE_DOUBLE:
     case AV_OPT_TYPE_RATIONAL: return set_string_number(obj, o, val, dst);
     case AV_OPT_TYPE_IMAGE_SIZE:
         /* Stored as two consecutive ints at dst; NULL or "none" zeroes both. */
         if (!val || !strcmp(val, "none")) {
             *(int *)dst = *((int *)dst + 1) = 0;
             return 0;
         }
         ret = av_parse_video_size(dst, ((int *)dst) + 1, val);
         if (ret < 0)
             av_log(obj, AV_LOG_ERROR, "Unable to parse option value \"%s\" as image size\n", val);
         return ret;
     case AV_OPT_TYPE_PIXEL_FMT:
         if (!val || !strcmp(val, "none"))
             ret = PIX_FMT_NONE;
         else {
             /* Try the format name first, then fall back to a numeric value
              * that must lie below PIX_FMT_NB. */
             ret = av_get_pix_fmt(val);
             if (ret == PIX_FMT_NONE) {
                 char *tail;
                 ret = strtol(val, &tail, 0);
                 if (*tail || (unsigned)ret >= PIX_FMT_NB) {
                     av_log(obj, AV_LOG_ERROR, "Unable to parse option value \"%s\" as pixel format\n", val);
                     return AVERROR(EINVAL);
                 }
             }
         }
         *(enum PixelFormat *)dst = ret;
         return 0;
     }

     /* Reached only for option types without a case above. */
     av_log(obj, AV_LOG_ERROR, "Invalid option type.\n");
     return AVERROR(EINVAL);
 }

果然不出我所料，就是它了！

于是迫不及待地重新修改我的测试代码，将原先的修改全删掉，修改为如下：

[cpp]  view plain copy 
      
     
 "font-family:Courier New;">    ......    
    c = avcodec_alloc_context3(codec);  
   
     /* put sample parameters */  
     c->bit_rate = 400000;  
     /* resolution must be a multiple of two */  
     c->width = 800/*352*/;  
     c->height = 500/*288*/;  
     /* frames per second */  
     c->time_base.den = 1;  
     c->time_base.num = 25;  
     c->gop_size = 10; /* emit one intra frame every ten frames */  
     c->max_b_frames=1;  
     c->pix_fmt = PIX_FMT_YUV420P;  
   
 "color:#ff6666;">    // 新增语句，设置为编码延迟  
     av_opt_set(c->priv_data, "preset", "superfast", 0);  
   
     // 实时编码关键看这句，上面那条无所谓  
     av_opt_set(c->priv_data, "tune", "zerolatency", 0);  
     ......  
     ......  

编译运行.......果然OK，见下图测试结果（在我的项目中没有延迟哪怕一帧，但这个例子代码中有一帧延迟，但一帧无伤大雅）：

困扰我两天的问题终于圆满解决了！万岁！

总结

我在想，如果我之前在网上或者别的什么地方看到了用av_opt_set这样一条简单的语句就解决了我的问题，那么我节省了两天时间，但仅此而已，我也仅仅是知其然而不知其所以然。但在网上没有寻找到满意的答案之后，我决定自己阅读源代码，刨根问底，我花费了两天时间，但是换回的不仅仅是知道要这么做，也知道了为什么这样做可以有效果！

所以，开源项目对于我们每个IT从业人员都是一笔宝贵的财富，开源项目源代码的阅读是提高我们软件开发能力的最佳途径之一。

这篇文章记录了我阅读ffmpeg源代码解决问题的各个环节，以备后用，也希望我的这些文字可以给遇到同样问题的人提供一点点帮助。

最后列出一些我在解决这个问题中参看的一些网页：

http://bbs.csdn.net/topics/370233998

http://x264-settings.wikispaces.com/x264_Encoding_Suggestions

你可能感兴趣的:(FFMPEG)

python3+ffmpeg下载B站视频，附代码才华横溢吴道简爬虫 python windows
最近要去外面玩，旅途漫长，于是乎，就写了个代码，从B站上下载纪录片看，代码附后，请自取，如果觉得有用，麻烦点个赞，鼓励一下。感谢~~一、下载安装ffmpegFfmpeg是一款自由软件，用于视频和音频文件的处理，在本例中，我使用它进行视频文件和音频文件的合并。合并代码写在python脚本中，你只需下载好ffmpeg即可，而且因为合并代码中使用ffmpeg的绝对路径，所以也不用设置环境配置。Ffmpe
如何使用 Python 和 FFmpeg 下载 B站视频木觞清 7天熟练Python python ffmpeg 音视频
在这篇文章中，我们将讨论如何使用Python脚本结合FFmpeg下载并合并B站视频的流，生成一个完整的视频文件。具体来说，我们将通过B站的API获取视频的音频和视频流，然后使用FFmpeg下载并将它们合并成一个.mp4文件。前提条件Python：你需要安装Python，推荐使用Python3.6或更高版本。FFmpeg：确保你已经安装并配置好了FFmpeg。如果尚未安装，可以参考FFmpeg官方网
【ai】mocap：conda 安装python3.8+ cuda+ pytorch+torchaudio、torchvision 等风来不如迎风去 AI入门与实战人工智能 ubuntu conda
MotionCapubuntu18.04不知道为啥会依赖于ffmpeg、xorg渲染？安装pytorch就是会带上cudacudnn啥的pytorch【ai】tx2nx：安装torch、torchvisionforyolov5这里就发现pytorch和torchvision有依赖关系的，还涉及到rapidjson所以python的环境隔离很重要。核心库-cudatoolkit=11.3-pytor
视频转音频, 音频转文字言之。 python 音视频
Ubuntu24环境准备#系统级依赖sudoaptupdate&&sudoaptinstall-yffmpegpython3-venvgitbuild-essentialpython3-dev#Python虚拟环境python3-mvenv~/ai_summarysource~/ai_summary/bin/activate核心工具链工具用途安装命令Whisper语音识别pipinstallope
解决开发FFMPEG视频播放器右侧白色线问题吃面不喝汤66 OBS二次开发 ffmpeg 音视频
在开发基于Qt和FFmpeg的视频播放器时，我遇到一个常见但令人困惑的问题：在使用VideoWidget（继承自QOpenGLWidget）播放某些视频时，窗口右侧会出现一条白色线。这不仅影响视觉效果，还可能暴露潜在的渲染或缓冲区问题。本文将详细分析这一现象的成因，并提供经过验证的解决方案。问题现象在使用自定义的VideoDecoder和VideoWidget类播放视频时，大多数视频都能正常显示，
ffmpeg+ubuntu16.04编译ffmpeg库小gpt& QT+FFMPEG实战 ffmpeg linux
个人使用环境：ubuntudesktop16.04+ffmpeg4.2.1以下的库进行完整编译ffmpeg介绍FFmpeg是一个开源的多媒体框架，广泛用于处理音频、视频、字幕等多媒体数据。它包含了丰富的工具和库，能够进行音视频的编解码、转码、流媒体处理、滤镜应用等操作。FFmpeg是许多多媒体应用程序和工具的核心引擎，功能强大且灵活，支持几乎所有常见的音视频格式。FFmpeg的主要组成部分ffmp
从零实现B站视频下载器：Python自动化实战教程木觞清 #编程语言自动化运维
一、项目背景与实现原理1.1B站视频分发机制Bilibili的视频采用音视频分离技术，通过以下方式提升用户体验：动态码率适配（1080P/4K/HDR）分段加载技术（基于M4S格式）内容保护机制（防盗链/签名验证）1.2技术实现路线graphTDA[模拟浏览器请求]-->B[获取加密播放信息]B-->C[解析音视频地址]C-->D[多线程下载]D-->E[FFmpeg合并]二、代码逐层解析2.1请
从FFmpeg命令行到Rust：多场景实战指南 Yeauty ffmpeg rust video-codec
FFmpeg作为功能强大的多媒体处理工具，被广泛应用于视频编辑、格式转换等领域。然而，直接使用FFmpeg的命令行界面（CLI）可能会遇到以下挑战：命令复杂度高：FFmpeg的命令行参数众多且复杂，初学者可能难以掌握，配置错误时调试困难。集成困难：在Rust等现代编程语言中，直接调用FFmpeg的C语言API需要处理复杂的内存管理和安全性问题，可能引发内存泄漏、非法访问等问题。为了解决这些问题，R
从FFmpeg命令行到Rust：多场景实战指南
FFmpeg作为功能强大的多媒体处理工具，被广泛应用于视频编辑、格式转换等领域。然而，直接使用FFmpeg的命令行界面（CLI）可能会遇到以下挑战：命令复杂度高：FFmpeg的命令行参数众多且复杂，初学者可能难以掌握，配置错误时调试困难。集成困难：在Rust等现代编程语言中，直接调用FFmpeg的C语言API需要处理复杂的内存管理和安全性问题，可能引发内存泄漏、非法访问等问题。为了解决这些问题，R
linux CentOS 7.9 安装 ffmpeg 6.0 教程【亲测成功】刘登辉 ffmpeg linux centos
查看当前系统版本[[email protected]]#lsb_release-aLSBVersion::core-4.1-amd64:core-4.1-noarchDistributorID:CentOSDescription:CentOSLinuxrelease7.9.2009(Core)Release:7.9.2009Codename:Corewgethttp://www.ffm
常用的ffmpeg文件格式转换指令儿孙未解供耕织 linux 嵌入式 ffmpeg
mp3转wav:ffmpeg-iinput.mp3-acodecpcm_s16le-ac2-ar44100output.wavwav转m4a:ffmpeg-fwav-itest.wav-ar48000-acodecaac-vn-dntest.m4amp3转mp4:ffmpeg-iREC_START.mp3-codeccopyREC_START.mp4m4a转wav:ffmpeg-iinput.m4
FFMPEG实现音频重采样 QQ_1695710968 音频重采样 FFMPEG PCM
技术在于交流、沟通，转载请注明出处并保持作品的完整性。原文：https://blog.csdn.net/hiwubihe/article/details/81259134[音频编解码系列文章]音频编解码基础FFMPEG实现音频重采样FFMPEG实现PCM编码(采用封装格式实现)FFMPEG实现PCM编码(不采用封装格式实现)FAAC库实现PCM编码FAAD库实现RAW格式AAC解码FAAD库实现R
工业相机视频播放(RTSP) CHHC1880 工业相机 rtsp ffmpeg 推流
需求：工业相机图像能在rtsp流上播放。实现手段：C#利用工业相机的SDK拿到图后，通过ffmpeg管道推给流媒体程序，再转流播放。模拟测试：两张图在rtsp上进行轮播
二.使用ffmpeg对原始音频数据重采样并进行AAC编码 djykkkkkk ffmpeg学习 ffmpeg 音视频 aac
重采样：将音频三元组【采样率采样格式通道数】之中的任何一个或者多个值改变。一.为什么要进行重采样？1.原始音频数据和编码器的数据格式不一致2.播放器要求的和获取的数据不一致3.方便运算二.本次编码流程1.了解自己本机麦克风参数，我的切换为44100/16/2；包括麦克风录音的size可能不一样，本机windows下录音的size为88200；1.ffmpeg获取麦克风数据2.ffmpeg对数据进行
一.ffmpeg打开麦克风，录制音频并重采样 djykkkkkk ffmpeg学习 ffmpeg 音视频
一.windowswindows下使用msys编译ffmpeg，先编译libx264和libx265，然后编译ffmpeg的时候需要添加这两个库的路径才能--enable；为什么ffplay--enable了还是没有呢，仔细看编译打印，可能刚有一段报错提示SDL找不到，这个时候咱们就直接使用msys安装SDL，然后--enable启动sdl，这样ffplay就可以编译成功了。参考这个博主：FFmp
【音视频】ffmpeg中AVpacket解析NALU总结 gma999 音视频 ffmpeg
概述项目中涉及到一些向国标平台推送视频流的逻辑，因之前没有接触过该方面的知识，所以开始走了很多错误的路线，本文主要总结H265视频中解析出NALU方法代码实现输出[tcp@0x55842b7e60]Nodefaultwhitelistset[tcp@0x55842b7e60]Originallistofaddresses:[tcp@0x55842b7e60]Address192.168.1.181
laravel项目中使用FFMPeg 剪裁视频道系女孩~ php laravel
#运行环境需安装的软件ffmpeg#安装的扩展pbmedia/laravel-ffmpeg:^8.3#扩展文档https://packagist.org/packages/pbmedia/laravel-ffmpeg#引入的类useFFMpeg\Coordinate\TimeCode;useFFMpeg\Format\Video\X264;useFFMpeg\Exception\RuntimeEx
音视频入门基础：RTP专题（18）——FFmpeg源码中，获取RTP的音频信息的实现（上）崔杰城音视频技术 FFmpeg源码分析音视频 ffmpeg
由于本文篇幅较长，分为上、下两篇。一、引言通过FFmpeg命令可以获取到SDP描述的RTP流的的音频压缩编码格式、音频压缩编码格式的profile、音频采样率、通道数信息：ffmpeg-protocol_whitelist"file,rtp,udp"-iXXX.sdp而由《音视频入门基础：RTP专题（17）——音频的SDP媒体描述》可以知道，SDP协议中，a=rtpmap属性和a=fmtp属性中的
Qt+ffmpeg环境搭建技术不支持 qt ffmpeg 开发语言
Qt+ffmpeg环境搭建各平台常见视频开发库举例:iOS：AVFoundationAudioUnitAndroid：MediaPlayer，MediaCodecWindows：DirectShowLinux：GStreamerFFmpeg库是一个跨平台的视频开发库,还有libVLC也是一个跨平台的视频开发库掌握了其中一个库,也能很快上手其它库,因为音视频解码的原理类似引入FFmpeg库有两种方式
QT+FFmpeg+Windows开发环境搭建（加薪点） Qt历险记 Qt 高级开发工程师 qt ffmpeg windows
01、Windows环境搭建FFMPEG官网：http://ffmpeg.org/02、下载4.2.1版本源码源码：https://ffmpeg.org/releases/ffmpeg-4.2.1.tar.bz203、下载4.2.1编译好的文件下载已经编译好的FFMPEG）（迅雷下载很快）网址：https://ffmpeg.zeranoe.com/builds/32位下载地址：
Qt | Windows环境搭建ffmpeg Qt历险记 Qt 高级开发工程师 qt windows ffmpeg
点击上方"蓝字"关注我们FFMPEG官网>>>http://ffmpeg.org/【下载4.2.1版本源码】源码：https://ffmpeg.org/releases/ffmpeg-4.2.1.tar.bz2【下载4.2.1编译好的文件】下载已经编译好的FFMPEG网址：https://ffmpeg.zeranoe.com/builds/
Python爬虫教程：如何通过接口批量下载视频封面（FFmpeg技术实现） Python爬虫项目 python 爬虫开发语言数据库数据分析 scrapy selenium
引言随着在线视频平台的蓬勃发展，视频封面作为视频内容的预览图，一直以来都是观众对视频的第一印象。在爬取视频资源时，很多开发者和研究者往往只关注视频本身，而忽略了视频封面。实际上，视频封面不仅能提供重要的信息（例如视频标题、主题或情感等），而且它们也能作为数据集中的重要属性，用于视频分类、推荐系统等应用。在这篇博客中，我们将深入探讨如何使用Python通过接口批量下载视频封面，利用FFmpeg等技术
三分钟掌握音视频信息查询 | 在 Rust 中优雅地集成 FFmpeg Yeauty 音视频 rust ffmpeg
前言在音视频处理领域，开发者常常需要获取媒体文件的详细信息，如时长、格式、元数据，以及音视频流的编码参数等。这些信息对于媒体管理、转码调度、播放控制等场景至关重要。然而，直接使用FFmpeg命令行工具或其原生API存在以下挑战：命令行工具的复杂性：FFmpeg的命令行参数众多且复杂，使用不当可能导致错误。例如，处理包含空格的文件名时，需要特别注意正确的转义和引用方式，否则可能导致无法识别文件名的问
『FFmpeg学习笔记』MAC系统电脑安装FFmpeg以及使用 AI大模型前沿研究大模型笔记 macos ffmpeg M1
MAC系统电脑安装FFmpeg文章目录一.安装FFmpeg1.1.MACbrew安装FFmpeg1.2.MAC官网下载FFmpeg压缩包1.3.Windows安装1.4.Linux安装二.FFmpeg的使用2.1.音频操作2.1.1.如果不转换，直接输出aac2.1.2.将音频输出为wav2.1.3.将aac转换为wav2.1.4.双声道分离2.1.5.使用FFmpeg将音频和视频合并2.2.字幕
MPV Player(MPV播放器) fhfhgfdgdsgi1 tornado
链接：https://pan.quark.cn/s/a6b4b644bb16MPVPlayer(MPV播放器)是mplayer2和MPlayer的一个分支，支持多种视频文件格式、音频和视频编解码器以及字幕类型。它通过FFmpeg提供硬件加速，支持VDPAU和VAAPI以及Windows上的DXVA2，以及VDA和VideoToolbox视频。mpv可以播放互联网广播流、视频流、“实时”应用各种音频
【视频】ffmpeg、Nginx搭建RTMP、HLS服务器郭老二视频音视频 ffmpeg nginx
1、源码安装Nginx1）源码下载因为要使用Nginx的模块nginx-rtmp-module，所以要下载nginx和nginx-rtmp-module的源码。下载地址：http://nginx.org/en/download.htmlhttps://github.com/arut/nginx-rtmp-module/tags2）解压、配置在同一个目录中解压nginx和nginx-rtmp-mod
【视频】V4L2、ffmpeg、OpenCV中对YUV的定义郭老二视频音视频 ffmpeg opencv
1、常见的YUV格式1.1YUV420每像素16位IMC1：YYYYYYYYVV--UU–IMC3：YYYYYYYYUU--VV–每像素12位I420:YYYYYYYYUUVV=>YUV420PYV12:YYYYYYYYVVUU=>YUV420PNV12:YYYYYYYYUVUV=>YUV420SP（最受欢迎格式）NV21:YYYYYYYYVUVU=>YUV420SPIMC2：YYYYYYYYYY
msys2+mingw编译ffmpeg 星火撩猿音视频集 msys2 ffmpeg
MinGW安装ffmpeg下载ffmpeg源码源码下载编译安装ffmpeg./configure--prefix=/usr/local/ffmpeg（生成makefile文件）make-j4（多进程并行编译节省编译时间）makeinstall（安装到指定目录）
利用Qt + OpenGL 渲染 YUV数据，播放视频 mac版 jake2012 OpenGL Qt Qt 3D C/C++
最近利用Qt渲染YUV数据，折腾了很久，最开始使用FFmpeg将YUV数据转换成RGB数据后在用qt绘制，很快得到了成功，但是cpu占用率太大，最后放弃了。在这先感谢来自文章http://blog.csdn.net/su_vast/article/details/52214642的作者，使用他的代码我实现了Windows上的YUV数据渲染。但是移植到mac上渲染不出来，经过折腾及对OpenGL的了
【GB28181】H265-Nalu的封装 gma999 网络
概述通过国标摄像头拉流，ffmpeg解码可以得到如下日志信息[rtsp@0x55842ed950]videocodecsetto:hevc[rtp@0x55842b7cc0]Nodefaultwhitelistset[udp@0x55842bb400]Nodefaultwhitelistset[udp@0x55842bb400]endreceivebuffersizereportedis13107
Algorithm 香水浓 java Algorithm
冒泡排序 public static void sort(Integer[] param) { for (int i = param.length - 1; i > 0; i--) { for (int j = 0; j < i; j++) { int current = param[j]; int next = param[j + 1];
mongoDB 复杂查询表达式开窍的石头 mongodb
1:count Pg: db.user.find().count(); 统计多少条数据 2:不等于$ne Pg: db.user.find({_id:{$ne:3}},{name:1,sex:1,_id:0}); 查询id不等于3的数据。 3：大于$gt $gte(大于等于) &n
Jboss Java heap space异常解决方法, jboss OutOfMemoryError : PermGen space 0624chenhong jvm jboss
转自 http://blog.csdn.net/zou274/article/details/5552630 解决办法： window->preferences->java->installed jres->edit jre 把default vm arguments 的参数设为-Xms64m -Xmx512m ----------------
文件上传下载解析相对路径不懂事的小屁孩文件上传
有点坑吧，弄这么一个简单的东西弄了一天多，身边还有大神指导着，网上各种百度着。下面总结一下遇到的问题：文件上传，在页面上传的时候，不要想着去操作绝对路径，浏览器会对客户端的信息进行保护，避免用户信息收到攻击。在上传图片，或者文件时，使用form表单来操作。前台通过form表单传输一个流到后台，而不是ajax传递参数到后台，代码如下: <form action=&
怎么实现qq空间批量点赞换个号韩国红果果 qq
纯粹为了好玩！！逻辑很简单 1 打开浏览器console；输入以下代码。先上添加赞的代码 var tools={}; //添加所有赞 function init(){ document.body.scrollTop=10000; setTimeout(function(){document.body.scrollTop=0;},2000);//加
判断是否为中文灵静志远中文
方法一： public class Zhidao { public static void main(String args[]) { String s = "sdf灭礌 kjl d{';\fdsjlk是"; int n=0; for(int i=0; i<s.length(); i++) { n = (int)s.charAt(i); if((
一个电话面试后总结 a-john 面试
今天，接了一个电话面试，对于还是初学者的我来说，紧张了半天。面试的问题分了层次，对于一类问题，由简到难。自己觉得回答不好的地方作了一下总结：在谈到集合类的时候，举几个常用的集合类，想都没想，直接说了list,map。然后对list和map分别举几个类型： list方面：ArrayList,LinkedList。在谈到他们的区别时，愣住了
MSSQL中Escape转义的使用 aijuans MSSQL
IF OBJECT_ID('tempdb..#ABC') is not null drop table tempdb..#ABC create table #ABC ( PATHNAME NVARCHAR(50) ) insert into #ABC SELECT N'/ABCDEFGHI' UNION ALL SELECT N'/ABCDGAFGASASSDFA' UNION ALL
一个简单的存储过程 asialee mysql 存储过程构造数据批量插入
今天要批量的生成一批测试数据，其中中间有部分数据是变化的，本来想写个程序来生成的，后来想到存储过程就可以搞定，所以随手写了一个，记录在此： DELIMITER $$ DROP PROCEDURE IF EXISTS inse
annot convert from HomeFragment_1 to Fragment 百合不是茶 android 导包错误
创建了几个类继承Fragment, 需要将创建的类存储在ArrayList<Fragment>中; 出现不能将new 出来的对象放到队列中,原因很简单; 创建类时引入包是:import android.app.Fragment; 创建队列和对象时使用的包是:import android.support.v4.ap
Weblogic10两种修改端口的方法 bijian1013 weblogic 端口号配置管理 config.xml
一.进入控制台进行修改 1.进入控制台: http://127.0.0.1:7001/console 2.展开左边树菜单域结构->环境->服务器-->点击AdminServer(管理) &
mysql 操作指令征客丶 mysql
一、连接mysql 进入 mysql 的安装目录； $ bin/mysql -p [host IP 如果是登录本地的mysql 可以不写 -p 直接 -u] -u [userName] -p 输入密码，回车，接连；二、权限操作［如果你很了解mysql数据库后，你可以直接去修改系统表，然后用 mysql> flush privileges; 指令让权限生效］ 1、赋权 mys
【Hive一】Hive入门 bit1129 hive
Hive安装与配置 Hive的运行需要依赖于Hadoop，因此需要首先安装Hadoop2.5.2，并且Hive的启动前需要首先启动Hadoop。 Hive安装和配置的步骤 1. 从如下地址下载Hive0.14.0 http://mirror.bit.edu.cn/apache/hive/ 2.解压hive，在系统变
ajax 三种提交请求的方法 BlueSkator Ajax jqery
1、ajax 提交请求 $.ajax({ type:"post", url : "${ctx}/front/Hotel/getAllHotelByAjax.do", dataType : "json", success : function(result) { try { for(v
mongodb开发环境下的搭建入门 braveCS 运维
linux下安装mongodb 1）官网下载mongodb-linux-x86_64-rhel62-3.0.4.gz 2）linux 解压 gzip -d mongodb-linux-x86_64-rhel62-3.0.4.gz; mv mongodb-linux-x86_64-rhel62-3.0.4 mongodb-linux-x86_64-rhel62-
编程之美-最短摘要的生成 bylijinnan java 数据结构算法编程之美
import java.util.HashMap; import java.util.Map; import java.util.Map.Entry; public class ShortestAbstract { /** * 编程之美最短摘要的生成 * 扫描过程始终保持一个[pBegin,pEnd]的range,初始化确保[pBegin,pEnd]的ran
json数据解析及typeof chengxuyuancsdn js typeof json解析
// json格式 var people='{"authors": [{"firstName": "AAA","lastName": "BBB"},' +' {"firstName": "CCC&
流程系统设计的层次和目标 comsci 设计模式数据结构 sql 框架脚本
流程系统设计的层次和目标
RMAN List和report 命令 daizj oracle list report rman
LIST 命令使用RMAN LIST 命令显示有关资料档案库中记录的备份集、代理副本和映像副本的信息。使用此命令可列出： • RMAN 资料档案库中状态不是AVAILABLE 的备份和副本 • 可用的且可以用于还原操作的数据文件备份和副本 • 备份集和副本，其中包含指定数据文件列表或指定表空间的备份 • 包含指定名称或范围的所有归档日志备份的备份集和副本 • 由标记、完成时间、可
二叉树:红黑树 dieslrae 二叉树
红黑树是一种自平衡的二叉树,它的查找,插入,删除操作时间复杂度皆为O(logN),不会出现普通二叉搜索树在最差情况时时间复杂度会变为O(N)的问题. 红黑树必须遵循红黑规则,规则如下 1、每个节点不是红就是黑。 2、根总是黑的 &
C语言homework3，7个小题目的代码 dcj3sjt126com c
1、打印100以内的所有奇数。 # include <stdio.h> int main(void) { int i; for (i=1; i<=100; i++) { if (i%2 != 0) printf("%d ", i); } return 0; } 2、从键盘上输入10个整数，
自定义按钮, 图片在上, 文字在下, 居中显示 dcj3sjt126com 自定义
#import <UIKit/UIKit.h> @interface MyButton : UIButton -(void)setFrame:(CGRect)frame ImageName:(NSString*)imageName Target:(id)target Action:(SEL)action Title:(NSString*)title Font:(CGFloa
MySQL查询语句练习题，测试足够用了 flyvszhb sql mysql
http://blog.sina.com.cn/s/blog_767d65530101861c.html 1.创建student和score表 CREATE TABLE student ( id INT(10) NOT NULL UNIQUE PRIMARY KEY , name VARCHAR
转：MyBatis Generator 详解 happyqing mybatis
MyBatis Generator 详解 http://blog.csdn.net/isea533/article/details/42102297 MyBatis Generator详解 http://git.oschina.net/free/Mybatis_Utils/blob/master/MybatisGeneator/MybatisGeneator.
让程序员少走弯路的14个忠告 jingjing0907 工作计划学习
无论是谁，在刚进入某个领域之时，有再大的雄心壮志也敌不过眼前的迷茫：不知道应该怎么做，不知道应该做什么。下面是一名软件开发人员所学到的经验，希望能对大家有所帮助 1.不要害怕在工作中学习。只要有电脑，就可以通过电子阅读器阅读报纸和大多数书籍。如果你只是做好自己的本职工作以及分配的任务，那是学不到很多东西的。如果你盲目地要求更多的工作，也是不可能提升自己的。放
nginx和NetScaler区别流浪鱼 nginx
NetScaler是一个完整的包含操作系统和应用交付功能的产品，Nginx并不包含操作系统，在处理连接方面，需要依赖于操作系统，所以在并发连接数方面和防DoS攻击方面，Nginx不具备优势。 2.易用性方面差别也比较大。Nginx对管理员的水平要求比较高，参数比较多，不确定性给运营带来隐患。在NetScaler常见的配置如健康检查，HA等，在Nginx上的配置的实现相对复杂。 3.策略灵活度方
第11章动画效果（下） onestopweb 动画
index.html <!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd"> <html xmlns="http://www.w3.org/
FAQ - SAP BW BO roadmap blueoxygen BO BW
http://www.sdn.sap.com/irj/boc/business-objects-for-sap-faq Besides, I care that how to integrate tightly. By the way, for BW consultants, please just focus on Query Designer which i
关于java堆内存溢出的几种情况 tomcat_oracle java jvm jdk thread
【情况一】：　　 java.lang.OutOfMemoryError: Java heap space：这种是java堆内存不够，一个原因是真不够，另一个原因是程序中有死循环；　　如果是java堆内存不够的话，可以通过调整JVM下面的配置来解决：　　<jvm-arg>-Xms3062m</jvm-arg> 　　<jvm-arg>-Xmx
Manifest.permission_group权限组阿尔萨斯 Permission
结构继承关系 public static final class Manifest.permission_group extends Object java.lang.Object android. Manifest.permission_group 常量 ACCOUNTS 直接通过统计管理器访问管理的统计 COST_MONEY可以用来让用户花钱但不需要通过与他们直接牵涉的权限 D