Allow mac gui to select AC-3 + AAC at the same time, still needs CLI work for the...

[handbrake-jp/handbrake-jp-git.git] / libhb / sync.c
diff --git a/libhb/sync.c b/libhb/sync.c

index c73ea8c..8bdf0c2 100644 (file)
--- a/libhb/sync.c
+++ b/libhb/sync.c
@@ -40,6 +40,7 @@ struct hb_work_private_s
      hb_subtitle_t * subtitle;
      int64_t pts_offset;
      int64_t pts_offset_old;
+    int64_t next_start;
      int64_t count_frames;
      int64_t count_frames_max;
      int64_t video_sequence;
@@ -48,10 +49,18 @@ struct hb_work_private_s
      /* Audio */
      hb_sync_audio_t sync_audio[8];
  
+    /* Flags */
+    int discontinuity;
+
      /* Statistics */
      uint64_t st_counts[4];
      uint64_t st_dates[4];
      uint64_t st_first;
+
+    /* Throttle message flags */
+    int   trashing_audio;
+    int   inserting_silence;
+    int   way_out_of_sync;
  };
  
  /***********************************************************************
@@ -85,6 +94,12 @@ int syncInit( hb_work_object_t * w, hb_job_t * job )
      pv->pts_offset_old = INT64_MIN;
      pv->count_frames   = 0;
  
+    pv->discontinuity = 0;
+
+    pv->trashing_audio = 0;
+    pv->inserting_silence = 0;
+    pv->way_out_of_sync = 0;
+
      /* Calculate how many video frames we are expecting */
      duration = 0;
      for( i = job->chapter_start; i <= job->chapter_end; i++ )
@@ -129,7 +144,8 @@ void syncClose( hb_work_object_t * w )
  
      for( i = 0; i < hb_list_count( title->list_audio ); i++ )
      {
-        if( job->acodec & HB_ACODEC_AC3 )
+        if( job->acodec & HB_ACODEC_AC3 ||
+            job->audio_mixdowns[i] == HB_AMIXDOWN_AC3 )
          {
              free( pv->sync_audio[i].ac3_buf );
          }
@@ -191,7 +207,8 @@ static void InitAudio( hb_work_object_t * w, int i )
      sync        = &pv->sync_audio[i];
      sync->audio = hb_list_item( title->list_audio, i );
  
-    if( job->acodec & HB_ACODEC_AC3 )
+    if( job->acodec & HB_ACODEC_AC3 ||
+        job->audio_mixdowns[i] == HB_AMIXDOWN_AC3 )
      {
          /* Have a silent AC-3 frame ready in case we have to fill a
             gap */
@@ -303,7 +320,6 @@ static int SyncVideo( hb_work_object_t * w )
          }
  
          /*
-
           * Track the video sequence number localy so that we can sync the audio
           * to it using the sequence number as well as the PTS.
           */
@@ -313,8 +329,8 @@ static int SyncVideo( hb_work_object_t * w )
          if( next->start < cur->start - PTS_DISCONTINUITY_TOLERANCE ||
              next->start > cur->start + PTS_DISCONTINUITY_TOLERANCE )
          {
-           hb_log( "Sync: Video PTS discontinuity (current buffer start=%lld, next buffer start=%lld), trash Video",
-                    cur->start, next->start );
+           hb_log( "Sync: Video PTS discontinuity %s (current buffer start=%lld, next buffer start=%lld)",
+                    pv->discontinuity ? "second" : "first", cur->start, next->start );
              
              /*
               * Do we need to trash the subtitle, is it from the next->start period
@@ -350,8 +366,18 @@ static int SyncVideo( hb_work_object_t * w )
  
              /* Calculate new offset */
              pv->pts_offset_old = pv->pts_offset;
-            pv->pts_offset     = cur->start -
-                pv->count_frames * pv->job->vrate_base / 300;
+            if ( job->vfr )
+            {
+                pv->pts_offset = cur->start - pv->next_start;
+            } else {
+                pv->pts_offset = cur->start -
+                    pv->count_frames * pv->job->vrate_base / 300;
+            }
+
+            if( !pv->discontinuity )
+            {
+                pv->discontinuity = 1;
+            }
  
              pv->video_sequence = cur->sequence;
              continue;
@@ -487,48 +513,72 @@ static int SyncVideo( hb_work_object_t * w )
              }
          }
  
-        /* The PTS of the frame we are expecting now */
-        pts_expected = pv->pts_offset +
-            pv->count_frames * pv->job->vrate_base / 300;
-
-        //hb_log("Video expecting PTS %lld, current frame: %lld, next frame: %lld, cf: %lld", 
-        //       pts_expected, cur->start, next->start, pv->count_frames * pv->job->vrate_base / 300 );
-
-        if( cur->start < pts_expected - pv->job->vrate_base / 300 / 2 &&
-            next->start < pts_expected + pv->job->vrate_base / 300 / 2 )
+        if ( job->vfr )
          {
-            /* The current frame is too old but the next one matches,
-               let's trash */
-            /* Also, make sure we don't trash a chapter break */
-            chap_break = cur->new_chap;
-            hb_buffer_close( &cur );
+            /*
+             * adjust the pts of the current frame so that it's contiguous
+             * with the previous frame. pts_offset tracks the time difference
+             * between the pts values in the input content (which start at some
+             * random time) and our timestamps (which start at zero). We don't
+             * make any adjustments to the source timestamps other than removing
+             * the clock offsets (which also removes pts discontinuities).
+             * This means we automatically encode at the source's frame rate.
+             * MP2 uses an implicit duration (frames end when the next frame
+             * starts) but more advanced containers like MP4 use an explicit
+             * duration. Since we're looking ahead one frame we set the
+             * explicit stop time from the start time of the next frame.
+             */
+            buf_tmp = cur;
              pv->cur = cur = hb_fifo_get( job->fifo_raw );
-            cur->new_chap |= chap_break; // Make sure we don't stomp the existing one.
-            
-            continue;
-        }
-
-        if( next->start > pts_expected + 3 * pv->job->vrate_base / 300 / 2 )
-        {
-            /* We'll need the current frame more than one time. Make a
-               copy of it and keep it */
-            buf_tmp = hb_buffer_init( cur->size );
-            memcpy( buf_tmp->data, cur->data, cur->size ); 
-            buf_tmp->sequence = cur->sequence;
+            buf_tmp->start = pv->next_start;
+            pv->next_start = next->start - pv->pts_offset;
+            buf_tmp->stop = pv->next_start;
          }
          else
          {
-            /* The frame has the expected date and won't have to be
-               duplicated, just put it through */
-            buf_tmp = cur;
-            pv->cur = cur = hb_fifo_get( job->fifo_raw );
+            /* The PTS of the frame we are expecting now */
+            pts_expected = pv->pts_offset +
+                pv->count_frames * pv->job->vrate_base / 300;
+
+            //hb_log("Video expecting PTS %lld, current frame: %lld, next frame: %lld, cf: %lld", 
+            //       pts_expected, cur->start, next->start, pv->count_frames * pv->job->vrate_base / 300 );
+
+            if( cur->start < pts_expected - pv->job->vrate_base / 300 / 2 &&
+                next->start < pts_expected + pv->job->vrate_base / 300 / 2 )
+            {
+                /* The current frame is too old but the next one matches,
+                   let's trash */
+                /* Also, make sure we don't trash a chapter break */
+                chap_break = cur->new_chap;
+                hb_buffer_close( &cur );
+                pv->cur = cur = hb_fifo_get( job->fifo_raw );
+                cur->new_chap |= chap_break; // Make sure we don't stomp the existing one.
+                
+                continue;
+            }
+
+            if( next->start > pts_expected + 3 * pv->job->vrate_base / 300 / 2 )
+            {
+                /* We'll need the current frame more than one time. Make a
+                   copy of it and keep it */
+                buf_tmp = hb_buffer_init( cur->size );
+                memcpy( buf_tmp->data, cur->data, cur->size ); 
+                buf_tmp->sequence = cur->sequence;
+            }
+            else
+            {
+                /* The frame has the expected date and won't have to be
+                   duplicated, just put it through */
+                buf_tmp = cur;
+                pv->cur = cur = hb_fifo_get( job->fifo_raw );
+            }
+            
+            /* Replace those MPEG-2 dates with our dates */
+            buf_tmp->start = (uint64_t) pv->count_frames *
+                pv->job->vrate_base / 300;
+            buf_tmp->stop  = (uint64_t) ( pv->count_frames + 1 ) *
+                pv->job->vrate_base / 300;
          }
-        
-        /* Replace those MPEG-2 dates with our dates */
-        buf_tmp->start = (uint64_t) pv->count_frames *
-            pv->job->vrate_base / 300;
-        buf_tmp->stop  = (uint64_t) ( pv->count_frames + 1 ) *
-            pv->job->vrate_base / 300;
  
          /* If we have a subtitle for this picture, copy it */
          /* FIXME: we should avoid this memcpy */
@@ -549,9 +599,9 @@ static int SyncVideo( hb_work_object_t * w )
          UpdateState( w );
  
          /* Make sure we won't get more frames then expected */
-        if( pv->count_frames >= pv->count_frames_max )
+        if( pv->count_frames >= pv->count_frames_max * 2)
          {
-            hb_log( "sync: got %lld frames", pv->count_frames );
+            hb_log( "sync: got too many frames (%lld), exiting early", pv->count_frames );
              pv->done = 1;
              
             // Drop an empty buffer into our output to ensure that things
@@ -589,7 +639,8 @@ static void SyncAudio( hb_work_object_t * w, int i )
      sync   = &pv->sync_audio[i];
      audio  = sync->audio;
  
-    if( job->acodec & HB_ACODEC_AC3 )
+    if( job->acodec & HB_ACODEC_AC3 ||
+        job->audio_mixdowns[i] == HB_AMIXDOWN_AC3 )
      {
          fifo = audio->fifo_out;
          rate = audio->rate;
@@ -607,27 +658,52 @@ static void SyncAudio( hb_work_object_t * w, int i )
          pts_expected = pv->pts_offset + sync->count_frames * 90000 / rate;
  
          // hb_log("Video Sequence: %lld, Audio Sequence: %lld", pv->video_sequence, buf->sequence);
+
          /*
           * Using the same logic as the Video have we crossed a VOB
           * boundary as detected by the expected PTS and the PTS of our
           * audio being out by more than the tolerance value.
           */
-        if( ( buf->start > pts_expected + PTS_DISCONTINUITY_TOLERANCE ||
-              buf->start < pts_expected - PTS_DISCONTINUITY_TOLERANCE ) &&
-            pv->pts_offset_old > INT64_MIN )
+        if( buf->start > pts_expected + PTS_DISCONTINUITY_TOLERANCE ||
+            buf->start < pts_expected - PTS_DISCONTINUITY_TOLERANCE )
          {
-           /*
-             * Useful debug, but too verbose for normal use.
-             */
-            hb_log("Sync: Audio discontinuity (sequence: vid %lld aud %lld) (pts %lld < %lld < %lld)",
-                   pv->video_sequence, buf->sequence,
-                  pts_expected - PTS_DISCONTINUITY_TOLERANCE, buf->start,
-                  pts_expected + PTS_DISCONTINUITY_TOLERANCE );
-           
              /* There has been a PTS discontinuity, and this frame might
                 be from before the discontinuity*/
-            pts_expected = pv->pts_offset_old + sync->count_frames *
-                90000 / rate;
+
+            if( pv->discontinuity )
+            {
+                /*
+                 * There is an outstanding discontinuity, so use the offset from 
+                 * that discontinuity.
+                 */
+                pts_expected = pv->pts_offset_old + sync->count_frames *
+                    90000 / rate;
+            }
+            else
+            {
+                /*
+                 * No outstanding discontinuity, so the audio must be leading the
+                 * video (or the PTS values are really stuffed). So let's mark this
+                 * as a discontinuity ourselves for the audio to use until
+                 * the video also crosses the discontinuity.
+                 *
+                 * pts_offset is used when we are in the same time space as the video,
+                 * and pts_offset_old is used when in a discontinuity.
+                 *
+                 * Therefore set the pts_offset_old given the new pts_offset for this
+                 * current buffer.
+                 */
+                pv->discontinuity = 1;
+                pv->pts_offset_old = buf->start - sync->count_frames *
+                    90000 / rate;
+                pts_expected = pv->pts_offset_old + sync->count_frames *
+                    90000 / rate;
+
+                hb_log("Sync: Audio discontinuity (sequence: vid %lld aud %lld) (pts %lld < %lld < %lld)",
+                       pv->video_sequence, buf->sequence,
+                       pts_expected - PTS_DISCONTINUITY_TOLERANCE, buf->start,
+                       pts_expected + PTS_DISCONTINUITY_TOLERANCE );
+            }
  
              /*
               * Is the audio from a valid period given the previous
@@ -651,7 +727,11 @@ static void SyncAudio( hb_work_object_t * w, int i )
                   * up diverging even more. We need to hold on to the
                   * audio until the video catches up.
                   */
-                hb_log("Sync: Audio is way out of sync, attempt to reconverge from current video PTS");
+                if( !pv->way_out_of_sync )
+                {
+                    hb_log("Sync: Audio is way out of sync, attempt to reconverge from current video PTS");
+                    pv->way_out_of_sync = 1;
+                }
                 
                  /*
                   * It wasn't from the old place, so we must be from
@@ -669,14 +749,28 @@ static void SyncAudio( hb_work_object_t * w, int i )
          else
          {
              start = pts_expected - pv->pts_offset;
+
+            if( pv->discontinuity )
+            {
+                /*
+                 * The Audio is tracking the Video again using the normal pts_offset, so the
+                 * discontinuity is over.
+                 */
+                hb_log( "Sync: Audio joined Video after discontinuity at PTS %lld", buf->start );
+                pv->discontinuity = 0;
+            }
          }
  
          /* Tolerance: 100 ms */
          if( buf->start < pts_expected - 9000 )
          {
-           /* Audio is behind the Video, trash it, can't use it now. */
-           hb_log( "Sync: Audio PTS (%lld) < Video PTS (%lld) by greater than 100ms, trashing audio to reconverge",
-                     buf->start, pts_expected);
+            if( !pv->trashing_audio )
+            {
+                /* Audio is behind the Video, trash it, can't use it now. */
+                hb_log( "Sync: Audio PTS (%lld) < Video PTS (%lld) by greater than 100ms, trashing audio to reconverge",
+                        buf->start, pts_expected);
+                pv->trashing_audio = 1;
+            }
              buf = hb_fifo_get( audio->fifo_raw );
              hb_buffer_close( &buf );
              continue;
@@ -684,12 +778,32 @@ static void SyncAudio( hb_work_object_t * w, int i )
          else if( buf->start > pts_expected + 9000 )
          {
              /* Audio is ahead of the Video, insert silence until we catch up*/
-           hb_log("Sync: Audio PTS (%lld) >  Video PTS (%lld) by greater than 100ms insert silence until reconverged", buf->start, pts_expected);
+            if( !pv->inserting_silence )
+            {
+                hb_log("Sync: Audio PTS (%lld) >  Video PTS (%lld) by greater than 100ms insert silence until reconverged", buf->start, pts_expected);
+                pv->inserting_silence = 1;
+            }
              InsertSilence( w, i );
              continue;
+        } 
+        else 
+        {
+            if( pv->trashing_audio || pv->inserting_silence )
+            {
+                hb_log( "Sync: Audio back in Sync at PTS %lld", buf->start );
+                pv->trashing_audio = 0;
+                pv->inserting_silence = 0;
+            }
+            if( pv->way_out_of_sync )
+            {
+                hb_log( "Sync: Audio no longer way out of sync at PTS %lld",
+                        buf->start );
+                pv->way_out_of_sync = 0;
+            }
          }
  
-        if( job->acodec & HB_ACODEC_AC3 )
+        if( job->acodec & HB_ACODEC_AC3 ||
+            job->audio_mixdowns[i] == HB_AMIXDOWN_AC3 )
          {
              buf        = hb_fifo_get( audio->fifo_raw );
              buf->start = start;
@@ -741,6 +855,16 @@ static void SyncAudio( hb_work_object_t * w, int i )
          hb_fifo_push( fifo, buf );
      }
  
+    if( hb_fifo_is_full( fifo ) &&
+        pv->way_out_of_sync ) 
+    {
+        /*
+         * Trash the top audio packet to avoid deadlock as we reconverge.
+         */
+        if ( (buf = hb_fifo_get( audio->fifo_raw ) ) != NULL)
+            hb_buffer_close( &buf );
+    }
+
      if( NeedSilence( w, audio ) )
      {
          InsertSilence( w, i );
@@ -795,7 +919,8 @@ static void InsertSilence( hb_work_object_t * w, int i )
      job    = pv->job;
      sync   = &pv->sync_audio[i];
  
-    if( job->acodec & HB_ACODEC_AC3 )
+    if( job->acodec & HB_ACODEC_AC3 ||
+        job->audio_mixdowns[i] == HB_AMIXDOWN_AC3 )
      {
          buf        = hb_buffer_init( sync->ac3_size );
          buf->start = sync->count_frames * 90000 / sync->audio->rate;
@@ -818,8 +943,6 @@ static void InsertSilence( hb_work_object_t * w, int i )
          buf->stop  = buf->start + 90000 / 20;
          memset( buf->data, 0, buf->size );
  
-        hb_log( "sync: adding 50 ms of silence for track %x",
-                sync->audio->id );
          hb_fifo_push( sync->audio->fifo_sync, buf );
  
          sync->count_frames += job->arate / 20;