OSDN Git Service

Don't discard titles during scan just because of a read failure on one or more of...
[handbrake-jp/handbrake-jp-git.git] / libhb / encx264.c
index 747bae9..95922d5 100644 (file)
@@ -23,12 +23,22 @@ hb_work_object_t hb_encx264 =
     encx264Close
 };
 
+// 16 is probably overkill but it's also the maximum for h.264 reference frames
+#define MAX_INFLIGHT_FRAMES 16
+
 struct hb_work_private_s
 {
     hb_job_t       * job;
     x264_t         * x264;
     x264_picture_t   pic_in;
-    x264_picture_t   pic_out;
+
+    // Internal queue of DTS start/stop values.
+    int64_t        dts_start[MAX_INFLIGHT_FRAMES];
+    int64_t        dts_stop[MAX_INFLIGHT_FRAMES];
+
+    int64_t        dts_write_index;
+    int64_t        dts_read_index;
+    int64_t        next_chap;
 
     char             filename[1024];
 };
@@ -54,142 +64,154 @@ int encx264Init( hb_work_object_t * w, hb_job_t * job )
 
     x264_param_default( &param );
 
-    param.i_threads    = hb_get_cpu_count();
+    param.i_threads    = ( hb_get_cpu_count() * 3 / 2 );
     param.i_width      = job->width;
     param.i_height     = job->height;
     param.i_fps_num    = job->vrate;
     param.i_fps_den    = job->vrate_base;
     param.i_keyint_max = 20 * job->vrate / job->vrate_base;
     param.i_log_level  = X264_LOG_INFO;
-       if( job->h264_level )
-       {
-       param.i_threads   = 1;
-       param.b_cabac     = 0;
-       param.i_level_idc = job->h264_level;
-       hb_log( "encx264: encoding at level %i",
-               param.i_level_idc );
-       }
-
-       /* Slightly faster with minimal quality lost */
-       param.analyse.i_subpel_refine = 4;
-
-       /*      This section passes the string x264opts to libx264 for parsing into parameter names and values.
-
-       The string is set up like this:
-       option1=value1:option2=value 2
-
-       So, you have to iterate through based on the colons, and then put the left side of the equals sign in "name"
-       and the right side into "value." Then you hand those strings off to x264 for interpretation.
-
-       This is all based on the universal x264 option handling Loren Merritt implemented in the Mplayer/Mencoder project.
-       */
-       char *x264opts = job->x264opts;
-       if(x264opts != NULL && *x264opts != '\0')
-       {
-               while(*x264opts)
-               {
-               char *name = x264opts;
-               char *value;
-               int ret;
-
-               x264opts += strcspn(x264opts, ":");
-               if(*x264opts)
-                       {
-                       *x264opts = 0;
-                       x264opts++;
-                       }
-
-               value = strchr( name, '=' );
-               if(value)
-                       {
-                       *value = 0;
-                       value++;
-                       }
-               
-                       /*
-                               When B-frames are enabled, the max frame count increments by 1 (regardless of the number of B-frames).
-                               If you don't change the duration of the video track when you mux, libmp4 barfs.
-                               So, check if the x264opts are using B-frames, and when they are, set the boolean job->areBframes as true.
-                       */
-
-                       if (!(strcmp(name, "bframes")))
-                       {
-                               if (atoi(value) > 0)
-                               {
-                                       job->areBframes = 1;
-                               }
-                       }
+    if( job->h264_level )
+    {
+        param.b_cabac     = 0;
+        param.i_level_idc = job->h264_level;
+        hb_log( "encx264: encoding at level %i",
+                param.i_level_idc );
+    }
+
+    /* Slightly faster with minimal quality lost */
+    param.analyse.i_subpel_refine = 4;
+
+    /*
+               This section passes the string x264opts to libx264 for parsing into 
+        parameter names and values.
+
+        The string is set up like this:
+        option1=value1:option2=value 2
+
+        So, you have to iterate through based on the colons, and then put 
+        the left side of the equals sign in "name" and the right side into
+        "value." Then you hand those strings off to x264 for interpretation.
+
+        This is all based on the universal x264 option handling Loren
+        Merritt implemented in the Mplayer/Mencoder project.
+     */
+
+    char *x264opts = job->x264opts;
+    if( x264opts != NULL && *x264opts != '\0' )
+    {
+        while( *x264opts )
+        {
+            char *name = x264opts;
+            char *value;
+            int ret;
+
+            x264opts += strcspn( x264opts, ":" );
+            if( *x264opts )
+            {
+                *x264opts = 0;
+                x264opts++;
+            }
+
+            value = strchr( name, '=' );
+            if( value )
+            {
+                *value = 0;
+                value++;
+            }
+
+            /*
+               When B-frames are enabled, the max frame count increments
+               by 1 (regardless of the number of B-frames). If you don't
+               change the duration of the video track when you mux, libmp4
+               barfs.  So, check if the x264opts are using B-frames, and
+               when they are, set the boolean job->areBframes as true.
+             */
+
+            if( !( strcmp( name, "bframes" ) ) )
+            {
+                if( atoi( value ) > 0 )
+                {
+                    job->areBframes = 1;
+                }
+            }
 
             /* Note b-pyramid here, so the initial delay can be doubled */
-            if (!(strcmp(name, "b-pyramid")))
+            if( !( strcmp( name, "b-pyramid" ) ) )
             {
-                   if (atoi(value) > 0)
-                   {
-                           job->areBframes = 2;
-                   }
+                if( value != NULL )
+                {
+                    if( atoi( value ) > 0 )
+                    {
+                        job->areBframes = 2;
+                    }
+                }
+                else
+                {
+                    job->areBframes = 2;
+                }
             }
-                       
+
             /* Here's where the strings are passed to libx264 for parsing. */
-               ret = x264_param_parse(&param, name, value);
-       
-                       /*      Let x264 sanity check the options for us*/
-               if(ret == X264_PARAM_BAD_NAME)
-                       printf("x264 options: Unknown suboption %s\n", name);
-               if(ret == X264_PARAM_BAD_VALUE)
-                       printf("x264 options: Bad argument %s=%s\n", name, value ? value : "(null)");
-               }
-       }
-
-
-       if( job->pixel_ratio )
-       {
-           param.vui.i_sar_width = job->pixel_aspect_width;
-           param.vui.i_sar_height = job->pixel_aspect_height;
-
-           hb_log( "encx264: encoding with stored aspect %d/%d",
-                   param.vui.i_sar_width, param.vui.i_sar_height );
-       }
-
-
-       if( job->vquality >= 0.0 && job->vquality <= 1.0 )
-       {
-           switch(job->crf)
-               {
-                       case 1:
-                       /*Constant RF*/
-                       param.rc.i_rc_method = X264_RC_CRF;
-                       param.rc.f_rf_constant = 51 - job->vquality * 51;
-                       hb_log( "encx264: Encoding at constant RF %f",
-                               param.rc.f_rf_constant );
-                       break;
-
-                       case 0:
-                       /*Constant QP*/
-                       param.rc.i_rc_method = X264_RC_CQP;
-               param.rc.i_qp_constant = 51 - job->vquality * 51;
-               hb_log( "encx264: encoding at constant QP %d",
-                   param.rc.i_qp_constant );
-                       break;
-               }
-       }
-       else
-       {
-       /* Rate control */
-           param.rc.i_rc_method = X264_RC_ABR;
-           param.rc.i_bitrate = job->vbitrate;
-           switch( job->pass )
-           {
-               case 1:
-                   param.rc.b_stat_write  = 1;
-                   param.rc.psz_stat_out = pv->filename;
-                   break;
-               case 2:
-                   param.rc.b_stat_read = 1;
-                   param.rc.psz_stat_in = pv->filename;
-                   break;
-           }
-       }
+            ret = x264_param_parse( &param, name, value );
+
+            /*         Let x264 sanity check the options for us*/
+            if( ret == X264_PARAM_BAD_NAME )
+                hb_log( "x264 options: Unknown suboption %s", name );
+            if( ret == X264_PARAM_BAD_VALUE )
+                hb_log( "x264 options: Bad argument %s=%s", name, value ? value : "(null)" );
+        }
+    }
+
+
+    if( job->pixel_ratio )
+    {
+        param.vui.i_sar_width = job->pixel_aspect_width;
+        param.vui.i_sar_height = job->pixel_aspect_height;
+
+        hb_log( "encx264: encoding with stored aspect %d/%d",
+                param.vui.i_sar_width, param.vui.i_sar_height );
+    }
+
+
+    if( job->vquality >= 0.0 && job->vquality <= 1.0 )
+    {
+        switch( job->crf )
+        {
+            case 1:
+                /*Constant RF*/
+                param.rc.i_rc_method = X264_RC_CRF;
+                param.rc.f_rf_constant = 51 - job->vquality * 51;
+                hb_log( "encx264: Encoding at constant RF %f",
+                        param.rc.f_rf_constant );
+                break;
+
+            case 0:
+                /*Constant QP*/
+                param.rc.i_rc_method = X264_RC_CQP;
+                param.rc.i_qp_constant = 51 - job->vquality * 51;
+                hb_log( "encx264: encoding at constant QP %d",
+                        param.rc.i_qp_constant );
+                break;
+        }
+    }
+    else
+    {
+        /* Rate control */
+        param.rc.i_rc_method = X264_RC_ABR;
+        param.rc.i_bitrate = job->vbitrate;
+        switch( job->pass )
+        {
+            case 1:
+                param.rc.b_stat_write  = 1;
+                param.rc.psz_stat_out = pv->filename;
+                break;
+            case 2:
+                param.rc.b_stat_read = 1;
+                param.rc.psz_stat_in = pv->filename;
+                break;
+        }
+    }
 
     hb_log( "encx264: opening libx264 (pass %d)", job->pass );
     pv->x264 = x264_encoder_open( &param );
@@ -207,7 +229,11 @@ int encx264Init( hb_work_object_t * w, hb_job_t * job )
     memcpy( &w->config->h264.pps[1], nal[2].p_payload, nal[2].i_payload );
 
     x264_picture_alloc( &pv->pic_in, X264_CSP_I420,
-                        job->width, job->height );
+            job->width, job->height );
+
+    pv->dts_write_index = 0;
+    pv->dts_read_index = 0;
+    pv->next_chap = 0;
 
     return 0;
 }
@@ -215,7 +241,10 @@ int encx264Init( hb_work_object_t * w, hb_job_t * job )
 void encx264Close( hb_work_object_t * w )
 {
     hb_work_private_t * pv = w->private_data;
+    x264_picture_clean( &pv->pic_in );
     x264_encoder_close( pv->x264 );
+    free( pv );
+    w->private_data = NULL;
 
     /* TODO */
 }
@@ -226,112 +255,187 @@ int encx264Work( hb_work_object_t * w, hb_buffer_t ** buf_in,
     hb_work_private_t * pv = w->private_data;
     hb_job_t    * job = pv->job;
     hb_buffer_t * in = *buf_in, * buf;
+    x264_picture_t   pic_out;
     int           i_nal;
     x264_nal_t  * nal;
     int i;
 
-    /* XXX avoid this memcpy ? */
-    memcpy( pv->pic_in.img.plane[0], in->data, job->width * job->height );
-    if( job->grayscale )
-    {
-        /* XXX x264 has currently no option for grayscale encoding */
-        memset( pv->pic_in.img.plane[1], 0x80, job->width * job->height / 4 );
-        memset( pv->pic_in.img.plane[2], 0x80, job->width * job->height / 4 );
-    }
-    else
+    if( in->data )
     {
-        memcpy( pv->pic_in.img.plane[1], in->data + job->width * job->height,
-                job->width * job->height / 4 );
-        memcpy( pv->pic_in.img.plane[2], in->data + 5 * job->width *
-                job->height / 4, job->width * job->height / 4 );
-    }
-
-    pv->pic_in.i_type    = X264_TYPE_AUTO;
-    pv->pic_in.i_qpplus1 = 0;
-
-    /* Feed the input DTS to x264 so it can figure out proper output PTS */
-    pv->pic_in.i_pts = in->start;
-
-    x264_encoder_encode( pv->x264, &nal, &i_nal,
-                         &pv->pic_in, &pv->pic_out );
-
-    /* Should be way too large */
-    buf        = hb_buffer_init( 3 * job->width * job->height / 2 );
-    buf->size  = 0;
-    buf->start = in->start;
-    buf->stop  = in->stop;
-    buf->key   = 0;
-
-    for( i = 0; i < i_nal; i++ )
-    {
-        int size, data;
-
-        data = buf->alloc - buf->size;
-        if( ( size = x264_nal_encode( buf->data + buf->size, &data,
-                                      1, &nal[i] ) ) < 1 )
+        /* XXX avoid this memcpy ? */
+        memcpy( pv->pic_in.img.plane[0], in->data, job->width * job->height );
+        if( job->grayscale )
         {
-            continue;
+            /* XXX x264 has currently no option for grayscale encoding */
+            memset( pv->pic_in.img.plane[1], 0x80, job->width * job->height / 4 );
+            memset( pv->pic_in.img.plane[2], 0x80, job->width * job->height / 4 );
+        }
+        else
+        {
+            memcpy( pv->pic_in.img.plane[1], in->data + job->width * job->height,
+                    job->width * job->height / 4 );
+            memcpy( pv->pic_in.img.plane[2], in->data + 5 * job->width *
+                    job->height / 4, job->width * job->height / 4 );
         }
 
-        if( job->mux & HB_MUX_AVI )
+        if( in->new_chap && job->chapter_markers )
         {
-            if( nal[i].i_ref_idc == NAL_PRIORITY_HIGHEST )
+            /* chapters have to start with an IDR frame so request that this
+               frame be coded as IDR. Since there may be up to 16 frames
+               currently buffered in the encoder remember the timestamp so
+               when this frame finally pops out of the encoder we'll mark
+               its buffer as the start of a chapter. */
+            pv->pic_in.i_type = X264_TYPE_IDR;
+            if( pv->next_chap == 0 )
             {
-                buf->key = 1;
+                pv->next_chap = in->start;
             }
-            buf->size += size;
-            continue;
+            /* don't let 'work_loop' put a chapter mark on the wrong buffer */
+            in->new_chap = 0;
         }
-
-        /* H.264 in .mp4 */
-        switch( buf->data[buf->size+4] & 0x1f )
+        else
         {
-            case 0x7:
-            case 0x8:
-                /* SPS, PPS */
-                break;
+            pv->pic_in.i_type = X264_TYPE_AUTO;
+        }
+        pv->pic_in.i_qpplus1 = 0;
 
-            default:
-                /* H.264 in mp4 (stolen from mp4creator) */
-                buf->data[buf->size+0] = ( ( size - 4 ) >> 24 ) & 0xFF;
-                buf->data[buf->size+1] = ( ( size - 4 ) >> 16 ) & 0xFF;
-                buf->data[buf->size+2] = ( ( size - 4 ) >>  8 ) & 0xFF;
-                buf->data[buf->size+3] = ( ( size - 4 ) >>  0 ) & 0xFF;
+        // Remember current PTS value, use as DTS later
+        pv->dts_start[pv->dts_write_index & (MAX_INFLIGHT_FRAMES-1)] = in->start;
+        pv->dts_stop[pv->dts_write_index & (MAX_INFLIGHT_FRAMES-1)]  = in->stop;
+        pv->dts_write_index++;
 
-        /* For IDR (key frames), buf->key = 1,
-           and the same for regular I-frames. */
-        if( (pv->pic_out.i_type == X264_TYPE_IDR) || (pv->pic_out.i_type == X264_TYPE_I) )
-        {
-        buf->key = 1;
-        }
-        /* For B-frames, buf->key = 2 */
-        else if( (pv->pic_out.i_type == X264_TYPE_B) )
-        {
-        buf->key = 2;
-        }                
-        /* This is for b-pyramid, which has reference b-frames
-           However, it doesn't seem to ever be used...
-           They just show up as buf->key == 2 like
-           regular b-frames. */
-        else if( (pv->pic_out.i_type == X264_TYPE_BREF) )
+        /* Feed the input DTS to x264 so it can figure out proper output PTS */
+        pv->pic_in.i_pts = in->start;
+
+        x264_encoder_encode( pv->x264, &nal, &i_nal,
+                             &pv->pic_in, &pic_out );        
+    }
+    else
+    {
+        x264_encoder_encode( pv->x264, &nal, &i_nal,
+                             NULL, &pic_out );
+        /* No more delayed B frames */
+        if( i_nal == 0 )
         {
-            buf->key = 3;
+            *buf_out = NULL;
+            return HB_WORK_DONE;
         }
-        /* For P-frames, buf->key = 0 */
         else
         {
-            buf->key = 0;
+        /*  Since we output at least one more frame, drop another empty
+            one onto our input fifo.  We'll keep doing this automatically
+            until we stop getting frames out of the encoder. */
+            hb_fifo_push(w->fifo_in, hb_buffer_init(0));
         }
+    }
+
+    if( i_nal )
+    {
+        /* Should be way too large */
+        buf        = hb_buffer_init( 3 * job->width * job->height / 2 );
+        buf->size  = 0;
+        buf->start = in->start;
+        buf->stop  = in->stop;
+        buf->frametype   = 0;
+
+        int64_t dts_start, dts_stop;
 
-        /* Store the output presentation time stamp
-           from x264 for use by muxmp4 in off-setting
-           b-frames with the CTTS atom. */
-        buf->encodedPTS = pv->pic_out.i_pts;
+        /* Get next DTS value to use */
+        dts_start = pv->dts_start[pv->dts_read_index & (MAX_INFLIGHT_FRAMES-1)];
+        dts_stop  = pv->dts_stop[pv->dts_read_index & (MAX_INFLIGHT_FRAMES-1)];
+        pv->dts_read_index++;
 
+        for( i = 0; i < i_nal; i++ )
+        {
+            int size, data;
+
+            data = buf->alloc - buf->size;
+            if( ( size = x264_nal_encode( buf->data + buf->size, &data,
+                                          1, &nal[i] ) ) < 1 )
+            {
+                continue;
+            }
+
+            if( job->mux & HB_MUX_AVI )
+            {
+                if( nal[i].i_ref_idc == NAL_PRIORITY_HIGHEST )
+                {
+                    buf->frametype = HB_FRAME_KEY;
+                }
                 buf->size += size;
+                continue;
+            }
+
+            /* H.264 in .mp4 */
+            switch( buf->data[buf->size+4] & 0x1f )
+            {
+                case 0x7:
+                case 0x8:
+                    /* SPS, PPS */
+                    break;
+
+                default:
+                    /* H.264 in mp4 (stolen from mp4creator) */
+                    buf->data[buf->size+0] = ( ( size - 4 ) >> 24 ) & 0xFF;
+                    buf->data[buf->size+1] = ( ( size - 4 ) >> 16 ) & 0xFF;
+                    buf->data[buf->size+2] = ( ( size - 4 ) >>  8 ) & 0xFF;
+                    buf->data[buf->size+3] = ( ( size - 4 ) >>  0 ) & 0xFF;
+                    switch( pic_out.i_type )
+                    {
+                    /*  Decide what type of frame we have. */
+                        case X264_TYPE_IDR:
+                            buf->frametype = HB_FRAME_IDR;
+                            /* if we have a chapter marker pending and this
+                               frame's presentation time stamp is at or after
+                               the marker's time stamp, use this as the
+                               chapter start. */
+                            if( pv->next_chap != 0 && pv->next_chap <= pic_out.i_pts )
+                            {
+                                pv->next_chap = 0;
+                                buf->new_chap = 1;
+                            }
+                            break;
+                        case X264_TYPE_I:
+                            buf->frametype = HB_FRAME_I;
+                            break;
+                        case X264_TYPE_P:
+                            buf->frametype = HB_FRAME_P;
+                            break;
+                        case X264_TYPE_B:
+                            buf->frametype = HB_FRAME_B;
+                            break;
+                    /*  This is for b-pyramid, which has reference b-frames
+                        However, it doesn't seem to ever be used... */
+                        case X264_TYPE_BREF:
+                            buf->frametype = HB_FRAME_BREF;
+                            break;
+                    /*  If it isn't the above, what type of frame is it?? */
+                        default:
+                            buf->frametype = 0;
+                    }
+
+
+                    /* Store the output presentation time stamp
+                       from x264 for use by muxmp4 in off-setting
+                       b-frames with the CTTS atom.
+                       For now, just add 1000000 to the offset so that the
+                       value is pretty much guaranteed to be positive.  The
+                       muxing code will minimize the renderOffset at the end. */
+
+                    buf->renderOffset = pic_out.i_pts - dts_start + 1000000;
+
+                    /* Send out the next dts values */
+                    buf->start = dts_start;
+                    buf->stop  = dts_stop;
+
+                    buf->size += size;
+            }
         }
     }
 
+    else
+        buf = NULL;
+
     *buf_out = buf;
 
     return HB_WORK_OK;